1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <petscblaslapack.h> 8c6db04a5SJed Brown #include <petscbt.h> 9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 100716a85fSBarry Smith 114099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 124099cc6bSBarry Smith { 134099cc6bSBarry Smith PetscErrorCode ierr; 144099cc6bSBarry Smith PetscBool flg; 154099cc6bSBarry Smith char type[256]; 164099cc6bSBarry Smith 174099cc6bSBarry Smith PetscFunctionBegin; 189566063dSJacob Faibussowitsch ierr = PetscObjectOptionsBegin((PetscObject)A);PetscCall(ierr); 199566063dSJacob Faibussowitsch PetscCall(PetscOptionsFList("-mat_seqaij_type","Matrix SeqAIJ type","MatSeqAIJSetType",MatSeqAIJList,"seqaij",type,256,&flg)); 209566063dSJacob Faibussowitsch if (flg) PetscCall(MatSeqAIJSetType(A,type)); 219566063dSJacob Faibussowitsch ierr = PetscOptionsEnd();PetscCall(ierr); 224099cc6bSBarry Smith PetscFunctionReturn(0); 234099cc6bSBarry Smith } 244099cc6bSBarry Smith 25857cbf51SRichard Tran Mills PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A,PetscInt type,PetscReal *reductions) 260716a85fSBarry Smith { 270716a85fSBarry Smith PetscInt i,m,n; 280716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 290716a85fSBarry Smith 300716a85fSBarry Smith PetscFunctionBegin; 319566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&m,&n)); 329566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(reductions,n)); 330716a85fSBarry Smith if (type == NORM_2) { 340716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 35a873a8cdSSam Reynolds reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 360716a85fSBarry Smith } 370716a85fSBarry Smith } else if (type == NORM_1) { 380716a85fSBarry Smith for 
(i=0; i<aij->i[m]; i++) { 39a873a8cdSSam Reynolds reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]); 400716a85fSBarry Smith } 410716a85fSBarry Smith } else if (type == NORM_INFINITY) { 420716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 43a873a8cdSSam Reynolds reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),reductions[aij->j[i]]); 440716a85fSBarry Smith } 45857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) { 46a873a8cdSSam Reynolds for (i=0; i<aij->i[m]; i++) { 47857cbf51SRichard Tran Mills reductions[aij->j[i]] += PetscRealPart(aij->a[i]); 48a873a8cdSSam Reynolds } 49857cbf51SRichard Tran Mills } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) { 50857cbf51SRichard Tran Mills for (i=0; i<aij->i[m]; i++) { 51857cbf51SRichard Tran Mills reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]); 52857cbf51SRichard Tran Mills } 53857cbf51SRichard Tran Mills } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown reduction type"); 540716a85fSBarry Smith 550716a85fSBarry Smith if (type == NORM_2) { 56a873a8cdSSam Reynolds for (i=0; i<n; i++) reductions[i] = PetscSqrtReal(reductions[i]); 57857cbf51SRichard Tran Mills } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) { 58a873a8cdSSam Reynolds for (i=0; i<n; i++) reductions[i] /= m; 590716a85fSBarry Smith } 600716a85fSBarry Smith PetscFunctionReturn(0); 610716a85fSBarry Smith } 620716a85fSBarry Smith 633a062f41SBarry Smith PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS *is) 643a062f41SBarry Smith { 653a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 663a062f41SBarry Smith PetscInt i,m=A->rmap->n,cnt = 0, bs = A->rmap->bs; 673a062f41SBarry Smith const PetscInt *jj = a->j,*ii = a->i; 683a062f41SBarry Smith PetscInt *rows; 693a062f41SBarry Smith 703a062f41SBarry Smith PetscFunctionBegin; 713a062f41SBarry Smith for (i=0; i<m; i++) { 723a062f41SBarry Smith if 
((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 733a062f41SBarry Smith cnt++; 743a062f41SBarry Smith } 753a062f41SBarry Smith } 769566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt,&rows)); 773a062f41SBarry Smith cnt = 0; 783a062f41SBarry Smith for (i=0; i<m; i++) { 793a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 803a062f41SBarry Smith rows[cnt] = i; 813a062f41SBarry Smith cnt++; 823a062f41SBarry Smith } 833a062f41SBarry Smith } 849566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,is)); 853a062f41SBarry Smith PetscFunctionReturn(0); 863a062f41SBarry Smith } 873a062f41SBarry Smith 88f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt *nrows,PetscInt **zrows) 896ce1633cSBarry Smith { 906ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 91fff043a9SJunchao Zhang const MatScalar *aa; 926ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 93b2db7409Sstefano_zampini const PetscInt *ii = a->i,*jj = a->j,*diag; 946ce1633cSBarry Smith PetscInt *rows; 956ce1633cSBarry Smith 966ce1633cSBarry Smith PetscFunctionBegin; 979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 989566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 996ce1633cSBarry Smith diag = a->diag; 1006ce1633cSBarry Smith for (i=0; i<m; i++) { 101b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1026ce1633cSBarry Smith cnt++; 1036ce1633cSBarry Smith } 1046ce1633cSBarry Smith } 1059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(cnt,&rows)); 1066ce1633cSBarry Smith cnt = 0; 1076ce1633cSBarry Smith for (i=0; i<m; i++) { 108b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1096ce1633cSBarry Smith rows[cnt++] = i; 1106ce1633cSBarry Smith } 1116ce1633cSBarry Smith } 112f1f41ecbSJed 
Brown *nrows = cnt; 113f1f41ecbSJed Brown *zrows = rows; 1149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 115f1f41ecbSJed Brown PetscFunctionReturn(0); 116f1f41ecbSJed Brown } 117f1f41ecbSJed Brown 118f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 119f1f41ecbSJed Brown { 120f1f41ecbSJed Brown PetscInt nrows,*rows; 121f1f41ecbSJed Brown 122f1f41ecbSJed Brown PetscFunctionBegin; 1230298fd71SBarry Smith *zrows = NULL; 1249566063dSJacob Faibussowitsch PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A,&nrows,&rows)); 1259566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A),nrows,rows,PETSC_OWN_POINTER,zrows)); 1266ce1633cSBarry Smith PetscFunctionReturn(0); 1276ce1633cSBarry Smith } 1286ce1633cSBarry Smith 129b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 130b3a44c85SBarry Smith { 131b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 132b3a44c85SBarry Smith const MatScalar *aa; 133b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 134b3a44c85SBarry Smith const PetscInt *ii; 135b3a44c85SBarry Smith PetscInt n,i,j,*rows; 136b3a44c85SBarry Smith 137b3a44c85SBarry Smith PetscFunctionBegin; 1389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 139f4259b30SLisandro Dalcin *keptrows = NULL; 140b3a44c85SBarry Smith ii = a->i; 141b3a44c85SBarry Smith for (i=0; i<m; i++) { 142b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 143b3a44c85SBarry Smith if (!n) { 144b3a44c85SBarry Smith cnt++; 145b3a44c85SBarry Smith goto ok1; 146b3a44c85SBarry Smith } 1472e5835c6SStefano Zampini for (j=ii[i]; j<ii[i+1]; j++) { 148b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 149b3a44c85SBarry Smith } 150b3a44c85SBarry Smith cnt++; 151b3a44c85SBarry Smith ok1:; 152b3a44c85SBarry Smith } 1532e5835c6SStefano Zampini if (!cnt) { 1549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1552e5835c6SStefano Zampini 
PetscFunctionReturn(0); 1562e5835c6SStefano Zampini } 1579566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n-cnt,&rows)); 158b3a44c85SBarry Smith cnt = 0; 159b3a44c85SBarry Smith for (i=0; i<m; i++) { 160b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 161b3a44c85SBarry Smith if (!n) continue; 1622e5835c6SStefano Zampini for (j=ii[i]; j<ii[i+1]; j++) { 163b3a44c85SBarry Smith if (aa[j] != 0.0) { 164b3a44c85SBarry Smith rows[cnt++] = i; 165b3a44c85SBarry Smith break; 166b3a44c85SBarry Smith } 167b3a44c85SBarry Smith } 168b3a44c85SBarry Smith } 1699566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 1709566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows)); 171b3a44c85SBarry Smith PetscFunctionReturn(0); 172b3a44c85SBarry Smith } 173b3a44c85SBarry Smith 1747087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 17579299369SBarry Smith { 17679299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 17799e65526SBarry Smith PetscInt i,m = Y->rmap->n; 17899e65526SBarry Smith const PetscInt *diag; 1792e5835c6SStefano Zampini MatScalar *aa; 18099e65526SBarry Smith const PetscScalar *v; 181ace3abfcSBarry Smith PetscBool missing; 18279299369SBarry Smith 18379299369SBarry Smith PetscFunctionBegin; 18409f38230SBarry Smith if (Y->assembled) { 1859566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(Y,&missing,NULL)); 18609f38230SBarry Smith if (!missing) { 18779299369SBarry Smith diag = aij->diag; 1889566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(D,&v)); 1899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y,&aa)); 19079299369SBarry Smith if (is == INSERT_VALUES) { 19179299369SBarry Smith for (i=0; i<m; i++) { 19279299369SBarry Smith aa[diag[i]] = v[i]; 19379299369SBarry Smith } 19479299369SBarry Smith } else { 19579299369SBarry Smith for (i=0; i<m; i++) { 19679299369SBarry Smith aa[diag[i]] += v[i]; 19779299369SBarry Smith } 
19879299369SBarry Smith } 1999566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y,&aa)); 2009566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(D,&v)); 20179299369SBarry Smith PetscFunctionReturn(0); 20279299369SBarry Smith } 2039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 20409f38230SBarry Smith } 2059566063dSJacob Faibussowitsch PetscCall(MatDiagonalSet_Default(Y,D,is)); 20609f38230SBarry Smith PetscFunctionReturn(0); 20709f38230SBarry Smith } 20879299369SBarry Smith 2091a83f524SJed Brown PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 21017ab2063SBarry Smith { 211416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 21297f1f81fSBarry Smith PetscInt i,ishift; 21317ab2063SBarry Smith 2143a40ed3dSBarry Smith PetscFunctionBegin; 215d0f46423SBarry Smith *m = A->rmap->n; 2163a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 217bfeeae90SHong Zhang ishift = 0; 21853e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 2199566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,ishift,oshift,(PetscInt**)ia,(PetscInt**)ja)); 220bfeeae90SHong Zhang } else if (oshift == 1) { 2211a83f524SJed Brown PetscInt *tia; 222d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2233b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 2249566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n+1,&tia)); 2251a83f524SJed Brown for (i=0; i<A->rmap->n+1; i++) tia[i] = a->i[i] + 1; 2261a83f524SJed Brown *ia = tia; 227ecc77c7aSBarry Smith if (ja) { 2281a83f524SJed Brown PetscInt *tja; 2299566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz+1,&tja)); 2301a83f524SJed Brown for (i=0; i<nz; i++) tja[i] = a->j[i] + 1; 2311a83f524SJed Brown *ja = tja; 232ecc77c7aSBarry Smith } 2336945ee14SBarry Smith } else { 234ecc77c7aSBarry Smith *ia = a->i; 
235ecc77c7aSBarry Smith if (ja) *ja = a->j; 236a2ce50c7SBarry Smith } 2373a40ed3dSBarry Smith PetscFunctionReturn(0); 238a2744918SBarry Smith } 239a2744918SBarry Smith 2401a83f524SJed Brown PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2416945ee14SBarry Smith { 2423a40ed3dSBarry Smith PetscFunctionBegin; 2433a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 244bfeeae90SHong Zhang if ((symmetric && !A->structurally_symmetric) || oshift == 1) { 2459566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2469566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 247bcd2baecSBarry Smith } 2483a40ed3dSBarry Smith PetscFunctionReturn(0); 24917ab2063SBarry Smith } 25017ab2063SBarry Smith 2511a83f524SJed Brown PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2523b2fbd54SBarry Smith { 2533b2fbd54SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 254d0f46423SBarry Smith PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 25597f1f81fSBarry Smith PetscInt nz = a->i[m],row,*jj,mr,col; 2563b2fbd54SBarry Smith 2573a40ed3dSBarry Smith PetscFunctionBegin; 258899cda47SBarry Smith *nn = n; 2593a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2603b2fbd54SBarry Smith if (symmetric) { 2619566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,0,oshift,(PetscInt**)ia,(PetscInt**)ja)); 2623b2fbd54SBarry Smith } else { 2639566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n,&collengths)); 2649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n+1,&cia)); 2659566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cja)); 2663b2fbd54SBarry Smith jj = a->j; 2673b2fbd54SBarry Smith for (i=0; i<nz; i++) { 268bfeeae90SHong Zhang collengths[jj[i]]++; 2693b2fbd54SBarry 
Smith } 2703b2fbd54SBarry Smith cia[0] = oshift; 2713b2fbd54SBarry Smith for (i=0; i<n; i++) { 2723b2fbd54SBarry Smith cia[i+1] = cia[i] + collengths[i]; 2733b2fbd54SBarry Smith } 2749566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths,n)); 2753b2fbd54SBarry Smith jj = a->j; 276a93ec695SBarry Smith for (row=0; row<m; row++) { 277a93ec695SBarry Smith mr = a->i[row+1] - a->i[row]; 278a93ec695SBarry Smith for (i=0; i<mr; i++) { 279bfeeae90SHong Zhang col = *jj++; 2802205254eSKarl Rupp 2813b2fbd54SBarry Smith cja[cia[col] + collengths[col]++ - oshift] = row + oshift; 2823b2fbd54SBarry Smith } 2833b2fbd54SBarry Smith } 2849566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 2853b2fbd54SBarry Smith *ia = cia; *ja = cja; 2863b2fbd54SBarry Smith } 2873a40ed3dSBarry Smith PetscFunctionReturn(0); 2883b2fbd54SBarry Smith } 2893b2fbd54SBarry Smith 2901a83f524SJed Brown PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 2913b2fbd54SBarry Smith { 2923a40ed3dSBarry Smith PetscFunctionBegin; 2933a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 2943b2fbd54SBarry Smith 2959566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 2969566063dSJacob Faibussowitsch PetscCall(PetscFree(*ja)); 2973a40ed3dSBarry Smith PetscFunctionReturn(0); 2983b2fbd54SBarry Smith } 2993b2fbd54SBarry Smith 3007cee066cSHong Zhang /* 3017cee066cSHong Zhang MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from 3027cee066cSHong Zhang MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output 303040ebd07SHong Zhang spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ() 3047cee066cSHong Zhang */ 3057cee066cSHong Zhang PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt 
*ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3067cee066cSHong Zhang { 3077cee066cSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3087cee066cSHong Zhang PetscInt i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n; 309071fcb05SBarry Smith PetscInt nz = a->i[m],row,mr,col,tmp; 3107cee066cSHong Zhang PetscInt *cspidx; 311071fcb05SBarry Smith const PetscInt *jj; 3127cee066cSHong Zhang 3137cee066cSHong Zhang PetscFunctionBegin; 3147cee066cSHong Zhang *nn = n; 3157cee066cSHong Zhang if (!ia) PetscFunctionReturn(0); 316625f6d37SHong Zhang 3179566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n,&collengths)); 3189566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n+1,&cia)); 3199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cja)); 3209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&cspidx)); 3217cee066cSHong Zhang jj = a->j; 3227cee066cSHong Zhang for (i=0; i<nz; i++) { 3237cee066cSHong Zhang collengths[jj[i]]++; 3247cee066cSHong Zhang } 3257cee066cSHong Zhang cia[0] = oshift; 3267cee066cSHong Zhang for (i=0; i<n; i++) { 3277cee066cSHong Zhang cia[i+1] = cia[i] + collengths[i]; 3287cee066cSHong Zhang } 3299566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(collengths,n)); 3307cee066cSHong Zhang jj = a->j; 3317cee066cSHong Zhang for (row=0; row<m; row++) { 3327cee066cSHong Zhang mr = a->i[row+1] - a->i[row]; 3337cee066cSHong Zhang for (i=0; i<mr; i++) { 3347cee066cSHong Zhang col = *jj++; 335071fcb05SBarry Smith tmp = cia[col] + collengths[col]++ - oshift; 336071fcb05SBarry Smith cspidx[tmp] = a->i[row] + i; /* index of a->j */ 337071fcb05SBarry Smith cja[tmp] = row + oshift; 3387cee066cSHong Zhang } 3397cee066cSHong Zhang } 3409566063dSJacob Faibussowitsch PetscCall(PetscFree(collengths)); 341071fcb05SBarry Smith *ia = cia; 342071fcb05SBarry Smith *ja = cja; 3437cee066cSHong Zhang *spidx = cspidx; 3447cee066cSHong Zhang PetscFunctionReturn(0); 3457cee066cSHong Zhang } 3467cee066cSHong Zhang 3477cee066cSHong Zhang PetscErrorCode 
MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3487cee066cSHong Zhang { 3497cee066cSHong Zhang PetscFunctionBegin; 3509566063dSJacob Faibussowitsch PetscCall(MatRestoreColumnIJ_SeqAIJ(A,oshift,symmetric,inodecompressed,n,ia,ja,done)); 3519566063dSJacob Faibussowitsch PetscCall(PetscFree(*spidx)); 3527cee066cSHong Zhang PetscFunctionReturn(0); 3537cee066cSHong Zhang } 3547cee066cSHong Zhang 35587d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 35687d4246cSBarry Smith { 35787d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 35887d4246cSBarry Smith PetscInt *ai = a->i; 359fff043a9SJunchao Zhang PetscScalar *aa; 36087d4246cSBarry Smith 36187d4246cSBarry Smith PetscFunctionBegin; 3629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 3639566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aa+ai[row],v,ai[row+1]-ai[row])); 3649566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 36587d4246cSBarry Smith PetscFunctionReturn(0); 36687d4246cSBarry Smith } 36787d4246cSBarry Smith 368bd04181cSBarry Smith /* 369bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 370bd04181cSBarry Smith 371bd04181cSBarry Smith - a single row of values is set with each call 372bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 373bd04181cSBarry Smith - the values are always added to the matrix, not set 374bd04181cSBarry Smith - no new locations are introduced in the nonzero structure of the matrix 375bd04181cSBarry Smith 3761f763a69SBarry Smith This does NOT assume the global column indices are sorted 377bd04181cSBarry Smith 3781f763a69SBarry Smith */ 379bd04181cSBarry Smith 380af0996ceSBarry Smith #include 
<petsc/private/isimpl.h> 381189e4007SBarry Smith PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 382189e4007SBarry Smith { 383189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3841f763a69SBarry Smith PetscInt low,high,t,row,nrow,i,col,l; 3851f763a69SBarry Smith const PetscInt *rp,*ai = a->i,*ailen = a->ilen,*aj = a->j; 3861f763a69SBarry Smith PetscInt lastcol = -1; 387fff043a9SJunchao Zhang MatScalar *ap,value,*aa; 388189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices,*cidx = A->cmap->mapping->indices; 389189e4007SBarry Smith 390fff043a9SJunchao Zhang PetscFunctionBegin; 3919566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 392f38dd0b8SBarry Smith row = ridx[im[0]]; 3931f763a69SBarry Smith rp = aj + ai[row]; 3941f763a69SBarry Smith ap = aa + ai[row]; 3951f763a69SBarry Smith nrow = ailen[row]; 396189e4007SBarry Smith low = 0; 397189e4007SBarry Smith high = nrow; 398189e4007SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 399189e4007SBarry Smith col = cidx[in[l]]; 400f38dd0b8SBarry Smith value = v[l]; 401189e4007SBarry Smith 402189e4007SBarry Smith if (col <= lastcol) low = 0; 403189e4007SBarry Smith else high = nrow; 404189e4007SBarry Smith lastcol = col; 405189e4007SBarry Smith while (high-low > 5) { 406189e4007SBarry Smith t = (low+high)/2; 407189e4007SBarry Smith if (rp[t] > col) high = t; 408189e4007SBarry Smith else low = t; 409189e4007SBarry Smith } 410189e4007SBarry Smith for (i=low; i<high; i++) { 411189e4007SBarry Smith if (rp[i] == col) { 4121f763a69SBarry Smith ap[i] += value; 413189e4007SBarry Smith low = i + 1; 4141f763a69SBarry Smith break; 415189e4007SBarry Smith } 416189e4007SBarry Smith } 417189e4007SBarry Smith } 4189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 419f38dd0b8SBarry Smith return 0; 420189e4007SBarry Smith } 421189e4007SBarry Smith 42297f1f81fSBarry Smith 
PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 42317ab2063SBarry Smith { 424416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 425e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 42697f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 427e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 428ce496241SStefano Zampini MatScalar *ap=NULL,value=0.0,*aa; 429ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 430ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 43117ab2063SBarry Smith 4323a40ed3dSBarry Smith PetscFunctionBegin; 4339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 43417ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 435416022c9SBarry Smith row = im[k]; 4365ef9f2a5SBarry Smith if (row < 0) continue; 4376bdcaf15SBarry Smith PetscCheck(row < A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,row,A->rmap->n-1); 438720833daSHong Zhang rp = aj + ai[row]; 439876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 44017ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 441416022c9SBarry Smith low = 0; 442c71e6ed7SBarry Smith high = nrow; 44317ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 4445ef9f2a5SBarry Smith if (in[l] < 0) continue; 4456bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT,in[l],A->cmap->n-1); 446bfeeae90SHong Zhang col = in[l]; 447071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? 
v[l + k*n] : v[k + l*m]; 448071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 44936db0b34SBarry Smith 4502205254eSKarl Rupp if (col <= lastcol) low = 0; 4512205254eSKarl Rupp else high = nrow; 452e2ee6c50SBarry Smith lastcol = col; 453416022c9SBarry Smith while (high-low > 5) { 454416022c9SBarry Smith t = (low+high)/2; 455416022c9SBarry Smith if (rp[t] > col) high = t; 456416022c9SBarry Smith else low = t; 45717ab2063SBarry Smith } 458416022c9SBarry Smith for (i=low; i<high; i++) { 45917ab2063SBarry Smith if (rp[i] > col) break; 46017ab2063SBarry Smith if (rp[i] == col) { 461876c6284SHong Zhang if (!A->structure_only) { 4620c0d7e18SFande Kong if (is == ADD_VALUES) { 4630c0d7e18SFande Kong ap[i] += value; 4640c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4650c0d7e18SFande Kong } 46617ab2063SBarry Smith else ap[i] = value; 467720833daSHong Zhang } 468e44c0bd4SBarry Smith low = i + 1; 46917ab2063SBarry Smith goto noinsert; 47017ab2063SBarry Smith } 47117ab2063SBarry Smith } 472dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 473c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 4742c71b3e2SJacob Faibussowitsch PetscCheckFalse(nonew == -1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix",row,col); 475720833daSHong Zhang if (A->structure_only) { 476876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A,A->rmap->n,1,nrow,row,col,rmax,ai,aj,rp,imax,nonew,MatScalar); 477720833daSHong Zhang } else { 478fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 479720833daSHong Zhang } 480c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 481416022c9SBarry Smith /* shift up all the later entries in this row */ 4829566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp+i+1,rp+i,N-i+1)); 48317ab2063SBarry Smith 
rp[i] = col; 484580bdb30SBarry Smith if (!A->structure_only) { 4859566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap+i+1,ap+i,N-i+1)); 486580bdb30SBarry Smith ap[i] = value; 487580bdb30SBarry Smith } 488416022c9SBarry Smith low = i + 1; 489e56f5c9eSBarry Smith A->nonzerostate++; 490e44c0bd4SBarry Smith noinsert:; 49117ab2063SBarry Smith } 49217ab2063SBarry Smith ailen[row] = nrow; 49317ab2063SBarry Smith } 4949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 4953a40ed3dSBarry Smith PetscFunctionReturn(0); 49617ab2063SBarry Smith } 49717ab2063SBarry Smith 49819b08ed1SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 49919b08ed1SBarry Smith { 50019b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 50119b08ed1SBarry Smith PetscInt *rp,k,row; 50219b08ed1SBarry Smith PetscInt *ai = a->i; 50319b08ed1SBarry Smith PetscInt *aj = a->j; 504fff043a9SJunchao Zhang MatScalar *aa,*ap; 50519b08ed1SBarry Smith 50619b08ed1SBarry Smith PetscFunctionBegin; 50728b400f6SJacob Faibussowitsch PetscCheck(!A->was_assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Cannot call on assembled matrix."); 5082c71b3e2SJacob Faibussowitsch PetscCheckFalse(m*n+a->nz > a->maxnz,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()",a->maxnz); 509fff043a9SJunchao Zhang 5109566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 51119b08ed1SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 51219b08ed1SBarry Smith row = im[k]; 51319b08ed1SBarry Smith rp = aj + ai[row]; 51419b08ed1SBarry Smith ap = aa + ai[row]; 51519b08ed1SBarry Smith 5169566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp,in,n*sizeof(PetscInt))); 51719b08ed1SBarry Smith if (!A->structure_only) { 51819b08ed1SBarry Smith if (v) { 
5199566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap,v,n*sizeof(PetscScalar))); 52019b08ed1SBarry Smith v += n; 52119b08ed1SBarry Smith } else { 5229566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap,n*sizeof(PetscScalar))); 52319b08ed1SBarry Smith } 52419b08ed1SBarry Smith } 52519b08ed1SBarry Smith a->ilen[row] = n; 52619b08ed1SBarry Smith a->imax[row] = n; 52719b08ed1SBarry Smith a->i[row+1] = a->i[row]+n; 52819b08ed1SBarry Smith a->nz += n; 52919b08ed1SBarry Smith } 5309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 53119b08ed1SBarry Smith PetscFunctionReturn(0); 53219b08ed1SBarry Smith } 53319b08ed1SBarry Smith 53419b08ed1SBarry Smith /*@ 53519b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix. 53619b08ed1SBarry Smith 53719b08ed1SBarry Smith Input Parameters: 53819b08ed1SBarry Smith + A - the SeqAIJ matrix 53919b08ed1SBarry Smith - nztotal - bound on the number of nonzeros 54019b08ed1SBarry Smith 54119b08ed1SBarry Smith Level: advanced 54219b08ed1SBarry Smith 54319b08ed1SBarry Smith Notes: 54419b08ed1SBarry Smith This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row. 54519b08ed1SBarry Smith Simply call MatSetValues() after this call to provide the matrix entries in the usual manner. This matrix may be used 54619b08ed1SBarry Smith as always with multiple matrix assemblies. 
54719b08ed1SBarry Smith 54819b08ed1SBarry Smith .seealso: MatSetOption(), MAT_SORTED_FULL, MatSetValues(), MatSeqAIJSetPreallocation() 54919b08ed1SBarry Smith @*/ 55019b08ed1SBarry Smith 55119b08ed1SBarry Smith PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A,PetscInt nztotal) 55219b08ed1SBarry Smith { 55319b08ed1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 55419b08ed1SBarry Smith 55519b08ed1SBarry Smith PetscFunctionBegin; 5569566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->rmap)); 5579566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(A->cmap)); 55819b08ed1SBarry Smith a->maxnz = nztotal; 55919b08ed1SBarry Smith if (!a->imax) { 5609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&a->imax)); 5619566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscInt))); 56219b08ed1SBarry Smith } 56319b08ed1SBarry Smith if (!a->ilen) { 5649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n,&a->ilen)); 5659566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,A->rmap->n*sizeof(PetscInt))); 56619b08ed1SBarry Smith } else { 5679566063dSJacob Faibussowitsch PetscCall(PetscMemzero(a->ilen,A->rmap->n*sizeof(PetscInt))); 56819b08ed1SBarry Smith } 56919b08ed1SBarry Smith 57019b08ed1SBarry Smith /* allocate the matrix space */ 57119b08ed1SBarry Smith if (A->structure_only) { 5729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nztotal,&a->j)); 5739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n+1,&a->i)); 5749566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,(A->rmap->n+1)*sizeof(PetscInt)+nztotal*sizeof(PetscInt))); 57519b08ed1SBarry Smith } else { 5769566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nztotal,&a->a,nztotal,&a->j,A->rmap->n+1,&a->i)); 5779566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,(A->rmap->n+1)*sizeof(PetscInt)+nztotal*(sizeof(PetscScalar)+sizeof(PetscInt)))); 57819b08ed1SBarry 
Smith } 57919b08ed1SBarry Smith a->i[0] = 0; 58019b08ed1SBarry Smith if (A->structure_only) { 58119b08ed1SBarry Smith a->singlemalloc = PETSC_FALSE; 58219b08ed1SBarry Smith a->free_a = PETSC_FALSE; 58319b08ed1SBarry Smith } else { 58419b08ed1SBarry Smith a->singlemalloc = PETSC_TRUE; 58519b08ed1SBarry Smith a->free_a = PETSC_TRUE; 58619b08ed1SBarry Smith } 58719b08ed1SBarry Smith a->free_ij = PETSC_TRUE; 58819b08ed1SBarry Smith A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation; 58919b08ed1SBarry Smith A->preallocated = PETSC_TRUE; 59019b08ed1SBarry Smith PetscFunctionReturn(0); 59119b08ed1SBarry Smith } 59219b08ed1SBarry Smith 593071fcb05SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 594071fcb05SBarry Smith { 595071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 596071fcb05SBarry Smith PetscInt *rp,k,row; 597071fcb05SBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 598071fcb05SBarry Smith PetscInt *aj = a->j; 599fff043a9SJunchao Zhang MatScalar *aa,*ap; 600071fcb05SBarry Smith 601071fcb05SBarry Smith PetscFunctionBegin; 6029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 603071fcb05SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 604071fcb05SBarry Smith row = im[k]; 6056bdcaf15SBarry Smith PetscCheck(n <= a->imax[row],PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Preallocation for row %" PetscInt_FMT " does not match number of columns provided",n); 606071fcb05SBarry Smith rp = aj + ai[row]; 607071fcb05SBarry Smith ap = aa + ai[row]; 608071fcb05SBarry Smith if (!A->was_assembled) { 6099566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(rp,in,n*sizeof(PetscInt))); 610071fcb05SBarry Smith } 611071fcb05SBarry Smith if (!A->structure_only) { 612071fcb05SBarry Smith if (v) { 6139566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(ap,v,n*sizeof(PetscScalar))); 614071fcb05SBarry Smith v += n; 615071fcb05SBarry 
Smith } else { 6169566063dSJacob Faibussowitsch PetscCall(PetscMemzero(ap,n*sizeof(PetscScalar))); 617071fcb05SBarry Smith } 618071fcb05SBarry Smith } 619071fcb05SBarry Smith ailen[row] = n; 620071fcb05SBarry Smith a->nz += n; 621071fcb05SBarry Smith } 6229566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 623071fcb05SBarry Smith PetscFunctionReturn(0); 624071fcb05SBarry Smith } 625071fcb05SBarry Smith 626a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 6277eb43aa7SLois Curfman McInnes { 6287eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 62997f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 63097f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 631fff043a9SJunchao Zhang MatScalar *ap,*aa; 6327eb43aa7SLois Curfman McInnes 6333a40ed3dSBarry Smith PetscFunctionBegin; 6349566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 6357eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 6367eb43aa7SLois Curfman McInnes row = im[k]; 63754c59aa7SJacob Faibussowitsch if (row < 0) {v += n; continue;} /* negative row */ 63854c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT,row,A->rmap->n-1); 639bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 6407eb43aa7SLois Curfman McInnes nrow = ailen[row]; 6417eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 64254c59aa7SJacob Faibussowitsch if (in[l] < 0) {v++; continue;} /* negative column */ 64354c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT,in[l],A->cmap->n-1); 644bfeeae90SHong Zhang col = in[l]; 6457eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 6467eb43aa7SLois Curfman 
McInnes while (high-low > 5) { 6477eb43aa7SLois Curfman McInnes t = (low+high)/2; 6487eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 6497eb43aa7SLois Curfman McInnes else low = t; 6507eb43aa7SLois Curfman McInnes } 6517eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 6527eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 6537eb43aa7SLois Curfman McInnes if (rp[i] == col) { 654b49de8d1SLois Curfman McInnes *v++ = ap[i]; 6557eb43aa7SLois Curfman McInnes goto finished; 6567eb43aa7SLois Curfman McInnes } 6577eb43aa7SLois Curfman McInnes } 65897e567efSBarry Smith *v++ = 0.0; 6597eb43aa7SLois Curfman McInnes finished:; 6607eb43aa7SLois Curfman McInnes } 6617eb43aa7SLois Curfman McInnes } 6629566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 6633a40ed3dSBarry Smith PetscFunctionReturn(0); 6647eb43aa7SLois Curfman McInnes } 6657eb43aa7SLois Curfman McInnes 6663ea6fe3dSLisandro Dalcin PetscErrorCode MatView_SeqAIJ_Binary(Mat mat,PetscViewer viewer) 66717ab2063SBarry Smith { 6683ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ*)mat->data; 669c898d852SStefano Zampini const PetscScalar *av; 6703ea6fe3dSLisandro Dalcin PetscInt header[4],M,N,m,nz,i; 6713ea6fe3dSLisandro Dalcin PetscInt *rowlens; 67217ab2063SBarry Smith 6733a40ed3dSBarry Smith PetscFunctionBegin; 6749566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 6752205254eSKarl Rupp 6763ea6fe3dSLisandro Dalcin M = mat->rmap->N; 6773ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6783ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6793ea6fe3dSLisandro Dalcin nz = A->nz; 680416022c9SBarry Smith 6813ea6fe3dSLisandro Dalcin /* write matrix header */ 6823ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6833ea6fe3dSLisandro Dalcin header[1] = M; header[2] = N; header[3] = nz; 6849566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,header,4,PETSC_INT)); 685416022c9SBarry Smith 6863ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6879566063dSJacob 
Faibussowitsch PetscCall(PetscMalloc1(m,&rowlens)); 6883ea6fe3dSLisandro Dalcin for (i=0; i<m; i++) rowlens[i] = A->i[i+1] - A->i[i]; 6899566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,rowlens,m,PETSC_INT)); 6909566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 6913ea6fe3dSLisandro Dalcin /* store column indices */ 6929566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,A->j,nz,PETSC_INT)); 693416022c9SBarry Smith /* store nonzero values */ 6949566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(mat,&av)); 6959566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryWrite(viewer,av,nz,PETSC_SCALAR)); 6969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(mat,&av)); 697b37d52dbSMark F. Adams 6983ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6999566063dSJacob Faibussowitsch PetscCall(MatView_Binary_BlockSizes(mat,viewer)); 7003a40ed3dSBarry Smith PetscFunctionReturn(0); 70117ab2063SBarry Smith } 702416022c9SBarry Smith 7037dc0baabSHong Zhang static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer) 7047dc0baabSHong Zhang { 7057dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 7067dc0baabSHong Zhang PetscInt i,k,m=A->rmap->N; 7077dc0baabSHong Zhang 7087dc0baabSHong Zhang PetscFunctionBegin; 7099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 7107dc0baabSHong Zhang for (i=0; i<m; i++) { 7119566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 7127dc0baabSHong Zhang for (k=a->i[i]; k<a->i[i+1]; k++) { 7139566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ") ",a->j[k])); 7147dc0baabSHong Zhang } 7159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 7167dc0baabSHong Zhang } 7179566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 7187dc0baabSHong Zhang 
PetscFunctionReturn(0); 7197dc0baabSHong Zhang } 7207dc0baabSHong Zhang 72109573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 722cd155464SBarry Smith 723dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 724416022c9SBarry Smith { 725416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 726c898d852SStefano Zampini const PetscScalar *av; 72760e0710aSBarry Smith PetscInt i,j,m = A->rmap->n; 728e060cb09SBarry Smith const char *name; 729f3ef73ceSBarry Smith PetscViewerFormat format; 73017ab2063SBarry Smith 7313a40ed3dSBarry Smith PetscFunctionBegin; 7327dc0baabSHong Zhang if (A->structure_only) { 7339566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII_structonly(A,viewer)); 7347dc0baabSHong Zhang PetscFunctionReturn(0); 7357dc0baabSHong Zhang } 73643e49210SHong Zhang 7379566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer,&format)); 7382e5835c6SStefano Zampini if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 7392e5835c6SStefano Zampini 740c898d852SStefano Zampini /* trigger copy to CPU if needed */ 7419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 7429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 74371c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 74497f1f81fSBarry Smith PetscInt nofinalvalue = 0; 74560e0710aSBarry Smith if (m && ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-1))) { 746c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. 
*/ 747d00d2cf4SBarry Smith nofinalvalue = 1; 748d00d2cf4SBarry Smith } 7499566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 7509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n",m,A->cmap->n)); 7519566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %" PetscInt_FMT " \n",a->nz)); 752fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 7539566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = zeros(%" PetscInt_FMT ",4);\n",a->nz+nofinalvalue)); 754fbfe6fa7SJed Brown #else 7559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = zeros(%" PetscInt_FMT ",3);\n",a->nz+nofinalvalue)); 756fbfe6fa7SJed Brown #endif 7579566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"zzz = [\n")); 75817ab2063SBarry Smith 75917ab2063SBarry Smith for (i=0; i<m; i++) { 76060e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 761aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 7629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n",i+1,a->j[j]+1,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 76317ab2063SBarry Smith #else 7649566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n",i+1,a->j[j]+1,(double)a->a[j])); 76517ab2063SBarry Smith #endif 76617ab2063SBarry Smith } 76717ab2063SBarry Smith } 768d00d2cf4SBarry Smith if (nofinalvalue) { 769c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 7709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e %18.16e\n",m,A->cmap->n,0.,0.)); 771c337ccceSJed Brown #else 7729566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %18.16e\n",m,A->cmap->n,0.0)); 773c337ccceSJed Brown #endif 
774d00d2cf4SBarry Smith } 7759566063dSJacob Faibussowitsch PetscCall(PetscObjectGetName((PetscObject)A,&name)); 7769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name)); 7779566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 778fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 7799566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 78044cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 7819566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 78260e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 783aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 78436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 78636db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 7879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]))); 78836db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 7899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 7906831982aSBarry Smith } 79144cd7ae7SLois Curfman McInnes #else 7929566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 79344cd7ae7SLois Curfman McInnes #endif 79444cd7ae7SLois Curfman McInnes } 7959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 79644cd7ae7SLois Curfman McInnes } 7979566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 798fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 79997f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 8009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 8019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&sptr)); 802496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 803496be53dSLois Curfman McInnes sptr[i] = nzd+1; 80460e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 805496be53dSLois Curfman McInnes if (a->j[j] >= i) { 806aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 80736db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 808496be53dSLois Curfman McInnes #else 809496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 810496be53dSLois Curfman McInnes #endif 811496be53dSLois Curfman McInnes } 812496be53dSLois Curfman McInnes } 813496be53dSLois Curfman McInnes } 8142e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 8159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT "\n\n",m,nzd)); 8162e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 8172205254eSKarl Rupp if (i+4<m) { 8189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5])); 8192205254eSKarl Rupp } else if (i+3<m) { 8209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4])); 8212205254eSKarl Rupp } else if (i+2<m) { 8229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3])); 8232205254eSKarl Rupp } 
else if (i+1<m) { 8249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1],sptr[i+2])); 8252205254eSKarl Rupp } else if (i<m) { 8269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " %" PetscInt_FMT "\n",sptr[i],sptr[i+1])); 8272205254eSKarl Rupp } else { 8289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT "\n",sptr[i])); 8292205254eSKarl Rupp } 830496be53dSLois Curfman McInnes } 8319566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 8329566063dSJacob Faibussowitsch PetscCall(PetscFree(sptr)); 833496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 83460e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 8359566063dSJacob Faibussowitsch if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer," %" PetscInt_FMT " ",a->j[j]+fshift)); 836496be53dSLois Curfman McInnes } 8379566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 838496be53dSLois Curfman McInnes } 8399566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 840496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 84160e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 842496be53dSLois Curfman McInnes if (a->j[j] >= i) { 843aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 84436db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 8459566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 8466831982aSBarry Smith } 847496be53dSLois Curfman McInnes #else 8489566063dSJacob Faibussowitsch if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer," %18.16e ",(double)a->a[j])); 849496be53dSLois Curfman McInnes #endif 850496be53dSLois Curfman McInnes } 851496be53dSLois Curfman McInnes } 8529566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 853496be53dSLois Curfman McInnes } 8549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 855fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 85697f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 85787828ca2SBarry Smith PetscScalar value; 85868f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 85968f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 86068f1ed48SBarry Smith 86168f1ed48SBarry Smith for (i=0; i<a->i[m]; i++) { 86268f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 86368f1ed48SBarry Smith realonly = PETSC_FALSE; 86468f1ed48SBarry Smith break; 86568f1ed48SBarry Smith } 86668f1ed48SBarry Smith } 86768f1ed48SBarry Smith #endif 86802594712SBarry Smith 8699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 87002594712SBarry Smith for (i=0; i<m; i++) { 87102594712SBarry Smith jcnt = 0; 872d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 873e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 87402594712SBarry Smith value = a->a[cnt++]; 875e24b481bSBarry Smith jcnt++; 87602594712SBarry Smith } else { 87702594712SBarry Smith value = 0.0; 87802594712SBarry Smith } 879aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 88068f1ed48SBarry Smith if (realonly) { 8819566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e ",(double)PetscRealPart(value))); 88268f1ed48SBarry Smith } else { 8839566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",(double)PetscRealPart(value),(double)PetscImaginaryPart(value))); 88468f1ed48SBarry Smith } 88502594712SBarry Smith #else 8869566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," %7.5e ",(double)value)); 88702594712SBarry Smith #endif 88802594712SBarry Smith } 8899566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 89002594712SBarry Smith } 8919566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 8923c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 893150b93efSMatthew G. Knepley PetscInt fshift=1; 8949566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 8953c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 8969566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate complex general\n")); 8973c215bfdSMatthew Knepley #else 8989566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate real general\n")); 8993c215bfdSMatthew Knepley #endif 9009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz)); 9013c215bfdSMatthew Knepley for (i=0; i<m; i++) { 90260e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 9033c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 9049566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i+fshift,a->j[j]+fshift,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 9053c215bfdSMatthew Knepley #else 9069566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i+fshift, a->j[j]+fshift, (double)a->a[j])); 9073c215bfdSMatthew Knepley #endif 9083c215bfdSMatthew Knepley } 9093c215bfdSMatthew Knepley } 9109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 9113a40ed3dSBarry Smith } else { 9129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_FALSE)); 913d5f3da31SBarry Smith if (A->factortype) { 91416cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 9159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 91616cd7e1dSShri Abhyankar /* L part */ 91760e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) 
{ 91816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 91916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 92116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])))); 92316cd7e1dSShri Abhyankar } else { 9249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 92516cd7e1dSShri Abhyankar } 92616cd7e1dSShri Abhyankar #else 9279566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 92816cd7e1dSShri Abhyankar #endif 92916cd7e1dSShri Abhyankar } 93016cd7e1dSShri Abhyankar /* diagonal */ 93116cd7e1dSShri Abhyankar j = a->diag[i]; 93216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 93316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)PetscImaginaryPart(1.0/a->a[j]))); 93516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)(-PetscImaginaryPart(1.0/a->a[j])))); 93716cd7e1dSShri Abhyankar } else { 9389566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(1.0/a->a[j]))); 93916cd7e1dSShri Abhyankar } 94016cd7e1dSShri Abhyankar #else 9419566063dSJacob Faibussowitsch 
PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)(1.0/a->a[j]))); 94216cd7e1dSShri Abhyankar #endif 94316cd7e1dSShri Abhyankar 94416cd7e1dSShri Abhyankar /* U part */ 94560e0710aSBarry Smith for (j=a->diag[i+1]+1; j<a->diag[i]; j++) { 94616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 94716cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 9489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 94916cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 9509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])))); 95116cd7e1dSShri Abhyankar } else { 9529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 95316cd7e1dSShri Abhyankar } 95416cd7e1dSShri Abhyankar #else 9559566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 95616cd7e1dSShri Abhyankar #endif 95716cd7e1dSShri Abhyankar } 9589566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 95916cd7e1dSShri Abhyankar } 96016cd7e1dSShri Abhyankar } else { 96117ab2063SBarry Smith for (i=0; i<m; i++) { 9629566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"row %" PetscInt_FMT ":",i)); 96360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 964aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 96536db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 9669566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]))); 96736db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) 
< 0.0) { 9689566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]))); 9693a40ed3dSBarry Smith } else { 9709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)PetscRealPart(a->a[j]))); 97117ab2063SBarry Smith } 97217ab2063SBarry Smith #else 9739566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer," (%" PetscInt_FMT ", %g) ",a->j[j],(double)a->a[j])); 97417ab2063SBarry Smith #endif 97517ab2063SBarry Smith } 9769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer,"\n")); 97717ab2063SBarry Smith } 97816cd7e1dSShri Abhyankar } 9799566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer,PETSC_TRUE)); 98017ab2063SBarry Smith } 9819566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 9823a40ed3dSBarry Smith PetscFunctionReturn(0); 983416022c9SBarry Smith } 984416022c9SBarry Smith 9859804daf3SBarry Smith #include <petscdraw.h> 986dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 987416022c9SBarry Smith { 988480ef9eaSBarry Smith Mat A = (Mat) Aa; 989416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 990383922c3SLisandro Dalcin PetscInt i,j,m = A->rmap->n; 991383922c3SLisandro Dalcin int color; 992b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 993b0a32e0cSBarry Smith PetscViewer viewer; 994f3ef73ceSBarry Smith PetscViewerFormat format; 995fff043a9SJunchao Zhang const PetscScalar *aa; 996cddf8d76SBarry Smith 9973a40ed3dSBarry Smith PetscFunctionBegin; 9989566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer)); 9999566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer,&format)); 10009566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr)); 1001383922c3SLisandro Dalcin 
1002416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 10039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 1004fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 10055f80ce2aSJacob Faibussowitsch PetscErrorCode ierr; 10069566063dSJacob Faibussowitsch ierr = PetscDrawCollectiveBegin(draw);PetscCall(ierr); 10070513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 1008b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 1009416022c9SBarry Smith for (i=0; i<m; i++) { 1010cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1011bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1012bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1013fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) >= 0.) continue; 10149566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1015cddf8d76SBarry Smith } 1016cddf8d76SBarry Smith } 1017b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 1018cddf8d76SBarry Smith for (i=0; i<m; i++) { 1019cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1020bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1021bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1022fff043a9SJunchao Zhang if (aa[j] != 0.) continue; 10239566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1024cddf8d76SBarry Smith } 1025cddf8d76SBarry Smith } 1026b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 1027cddf8d76SBarry Smith for (i=0; i<m; i++) { 1028cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 1029bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1030bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 1031fff043a9SJunchao Zhang if (PetscRealPart(aa[j]) <= 0.) 
continue; 10329566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 1033416022c9SBarry Smith } 1034416022c9SBarry Smith } 10359566063dSJacob Faibussowitsch ierr = PetscDrawCollectiveEnd(draw);PetscCall(ierr); 10360513a670SBarry Smith } else { 10370513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 10380513a670SBarry Smith /* first determine max of all nonzero values */ 1039b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 1040383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 1041b0a32e0cSBarry Smith PetscDraw popup; 10425f80ce2aSJacob Faibussowitsch PetscErrorCode ierr; 10430513a670SBarry Smith 10440513a670SBarry Smith for (i=0; i<nz; i++) { 1045fff043a9SJunchao Zhang if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]); 10460513a670SBarry Smith } 1047383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 10489566063dSJacob Faibussowitsch PetscCall(PetscDrawGetPopup(draw,&popup)); 10499566063dSJacob Faibussowitsch PetscCall(PetscDrawScalePopup(popup,minv,maxv)); 1050383922c3SLisandro Dalcin 10519566063dSJacob Faibussowitsch ierr = PetscDrawCollectiveBegin(draw);PetscCall(ierr); 10520513a670SBarry Smith for (i=0; i<m; i++) { 1053383922c3SLisandro Dalcin y_l = m - i - 1.0; 1054383922c3SLisandro Dalcin y_r = y_l + 1.0; 1055bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1056383922c3SLisandro Dalcin x_l = a->j[j]; 1057383922c3SLisandro Dalcin x_r = x_l + 1.0; 1058fff043a9SJunchao Zhang color = PetscDrawRealToColor(PetscAbsScalar(aa[count]),minv,maxv); 10599566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color)); 10600513a670SBarry Smith count++; 10610513a670SBarry Smith } 10620513a670SBarry Smith } 10639566063dSJacob Faibussowitsch ierr = PetscDrawCollectiveEnd(draw);PetscCall(ierr); 10640513a670SBarry Smith } 10659566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 
1066480ef9eaSBarry Smith PetscFunctionReturn(0); 1067480ef9eaSBarry Smith } 1068cddf8d76SBarry Smith 10699804daf3SBarry Smith #include <petscdraw.h> 1070dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 1071480ef9eaSBarry Smith { 1072b0a32e0cSBarry Smith PetscDraw draw; 107336db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 1074ace3abfcSBarry Smith PetscBool isnull; 1075480ef9eaSBarry Smith 1076480ef9eaSBarry Smith PetscFunctionBegin; 10779566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer,0,&draw)); 10789566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw,&isnull)); 1079480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1080480ef9eaSBarry Smith 1081d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1082480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 10839566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw,xl,yl,xr,yr)); 10849566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer)); 10859566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A)); 10869566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL)); 10879566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 10883a40ed3dSBarry Smith PetscFunctionReturn(0); 1089416022c9SBarry Smith } 1090416022c9SBarry Smith 1091dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 1092416022c9SBarry Smith { 1093ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1094416022c9SBarry Smith 10953a40ed3dSBarry Smith PetscFunctionBegin; 10969566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii)); 10979566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary)); 10989566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw)); 1099c45a1595SBarry Smith if (iascii) { 11009566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_ASCII(A,viewer)); 11010f5bd95cSBarry Smith } else if (isbinary) { 11029566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Binary(A,viewer)); 11030f5bd95cSBarry Smith } else if (isdraw) { 11049566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Draw(A,viewer)); 110511aeaf0aSBarry Smith } 11069566063dSJacob Faibussowitsch PetscCall(MatView_SeqAIJ_Inode(A,viewer)); 11073a40ed3dSBarry Smith PetscFunctionReturn(0); 110817ab2063SBarry Smith } 110919bcc07fSBarry Smith 1110dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 111117ab2063SBarry Smith { 1112416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1113580bdb30SBarry Smith PetscInt fshift = 0,i,*ai = a->i,*aj = a->j,*imax = a->imax; 1114d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 111554f21887SBarry Smith MatScalar *aa = a->a,*ap; 11163447b6efSHong Zhang PetscReal ratio = 0.6; 111717ab2063SBarry Smith 11183a40ed3dSBarry Smith PetscFunctionBegin; 11193a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 11209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 1121b215bc84SStefano Zampini if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) { 1122b215bc84SStefano Zampini /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */ 11239566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A,mode)); 1124b215bc84SStefano Zampini PetscFunctionReturn(0); 1125b215bc84SStefano Zampini } 112617ab2063SBarry Smith 112743ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most nonzeros */ 112817ab2063SBarry Smith for (i=1; i<m; i++) { 1129416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 113017ab2063SBarry Smith 
fshift += imax[i-1] - ailen[i-1]; 113194a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 113217ab2063SBarry Smith if (fshift) { 1133bfeeae90SHong Zhang ip = aj + ai[i]; 1134bfeeae90SHong Zhang ap = aa + ai[i]; 113517ab2063SBarry Smith N = ailen[i]; 11369566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip-fshift,ip,N)); 1137580bdb30SBarry Smith if (!A->structure_only) { 11389566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap-fshift,ap,N)); 113917ab2063SBarry Smith } 114017ab2063SBarry Smith } 114117ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 114217ab2063SBarry Smith } 114317ab2063SBarry Smith if (m) { 114417ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 114517ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 114617ab2063SBarry Smith } 11477b083b7cSBarry Smith 114817ab2063SBarry Smith /* reset ilen and imax for each row */ 11497b083b7cSBarry Smith a->nonzerorowcnt = 0; 1150396832f4SHong Zhang if (A->structure_only) { 11519566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 11529566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 1153396832f4SHong Zhang } else { /* !A->structure_only */ 115417ab2063SBarry Smith for (i=0; i<m; i++) { 115517ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 11567b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i+1] - ai[i]) > 0); 115717ab2063SBarry Smith } 1158396832f4SHong Zhang } 1159bfeeae90SHong Zhang a->nz = ai[m]; 11602c71b3e2SJacob Faibussowitsch PetscCheckFalse(fshift && a->nounused == -1,PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift); 116117ab2063SBarry Smith 11629566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 11639566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n",m,A->cmap->n,fshift,a->nz)); 11649566063dSJacob Faibussowitsch 
PetscCall(PetscInfo(A,"Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n",a->reallocs)); 11659566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Maximum nonzeros in any row is %" PetscInt_FMT "\n",rmax)); 11662205254eSKarl Rupp 11678e58a170SBarry Smith A->info.mallocs += a->reallocs; 1168dd5f02e7SSatish Balay a->reallocs = 0; 11696712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 117036db0b34SBarry Smith a->rmax = rmax; 11714e220ebcSLois Curfman McInnes 1172396832f4SHong Zhang if (!A->structure_only) { 11739566063dSJacob Faibussowitsch PetscCall(MatCheckCompressedRow(A,a->nonzerorowcnt,&a->compressedrow,a->i,m,ratio)); 1174396832f4SHong Zhang } 11759566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A,mode)); 11763a40ed3dSBarry Smith PetscFunctionReturn(0); 117717ab2063SBarry Smith } 117817ab2063SBarry Smith 117999cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 118099cafbc1SBarry Smith { 118199cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 118299cafbc1SBarry Smith PetscInt i,nz = a->nz; 11832e5835c6SStefano Zampini MatScalar *aa; 118499cafbc1SBarry Smith 118599cafbc1SBarry Smith PetscFunctionBegin; 11869566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 118799cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 11889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 11899566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 119099cafbc1SBarry Smith PetscFunctionReturn(0); 119199cafbc1SBarry Smith } 119299cafbc1SBarry Smith 119399cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 119499cafbc1SBarry Smith { 119599cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 119699cafbc1SBarry Smith PetscInt i,nz = a->nz; 11972e5835c6SStefano Zampini MatScalar *aa; 119899cafbc1SBarry Smith 119999cafbc1SBarry Smith PetscFunctionBegin; 12009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 120199cafbc1SBarry Smith 
for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 12029566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 12039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 120499cafbc1SBarry Smith PetscFunctionReturn(0); 120599cafbc1SBarry Smith } 120699cafbc1SBarry Smith 1207dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 120817ab2063SBarry Smith { 1209fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1210fff043a9SJunchao Zhang MatScalar *aa; 12113a40ed3dSBarry Smith 12123a40ed3dSBarry Smith PetscFunctionBegin; 12139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(A,&aa)); 12149566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(aa,a->i[A->rmap->n])); 12159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(A,&aa)); 12169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 12173a40ed3dSBarry Smith PetscFunctionReturn(0); 121817ab2063SBarry Smith } 1219416022c9SBarry Smith 1220cbc6b225SStefano Zampini PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A) 1221cbc6b225SStefano Zampini { 1222cbc6b225SStefano Zampini Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1223cbc6b225SStefano Zampini 1224cbc6b225SStefano Zampini PetscFunctionBegin; 12259566063dSJacob Faibussowitsch PetscCall(PetscFree(a->perm)); 12269566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jmap)); 1227cbc6b225SStefano Zampini PetscFunctionReturn(0); 1228cbc6b225SStefano Zampini } 1229cbc6b225SStefano Zampini 1230dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 123117ab2063SBarry Smith { 1232416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1233d5d45c9bSBarry Smith 12343a40ed3dSBarry Smith PetscFunctionBegin; 1235aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1236c0aa6a63SJacob Faibussowitsch PetscLogObjectState((PetscObject)A,"Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT,A->rmap->n,A->cmap->n,a->nz); 123717ab2063SBarry Smith #endif 
12389566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i)); 12399566063dSJacob Faibussowitsch PetscCall(MatResetPreallocationCOO_SeqAIJ(A)); 12409566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 12419566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 12429566063dSJacob Faibussowitsch PetscCall(PetscFree(a->diag)); 12439566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ibdiag)); 12449566063dSJacob Faibussowitsch PetscCall(PetscFree(a->imax)); 12459566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ilen)); 12469566063dSJacob Faibussowitsch PetscCall(PetscFree(a->ipre)); 12479566063dSJacob Faibussowitsch PetscCall(PetscFree3(a->idiag,a->mdiag,a->ssor_work)); 12489566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 12499566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 12509566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 12519566063dSJacob Faibussowitsch PetscCall(PetscFree2(a->compressedrow.i,a->compressedrow.rindex)); 12529566063dSJacob Faibussowitsch PetscCall(MatDestroy_SeqAIJ_Inode(A)); 12539566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 1254901853e0SKris Buschelman 12556718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 12566718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 12576718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. 
We free it here to avoid 12586718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 12596718818eSStefano Zampini due to different matrix sizes */ 12609566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A,"__PETSc__ab_dense",NULL)); 12616718818eSStefano Zampini 12629566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A,NULL)); 12639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetColumnIndices_C",NULL)); 12649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL)); 12659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL)); 12669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsbaij_C",NULL)); 12679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqbaij_C",NULL)); 12689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijperm_C",NULL)); 12694222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 12709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcusparse_C",NULL)); 12719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",NULL)); 12729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaijcusparse_C",NULL)); 12734222ddf1SHong Zhang #endif 12743d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 12759566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijkokkos_C",NULL)); 12763d0639e7SStefano Zampini #endif 12779566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcrl_C",NULL)); 1278af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 12799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_elemental_C",NULL)); 1280af8000cdSHong Zhang #endif 1281d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 12829566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_scalapack_C",NULL)); 1283d24d4204SJose E. Roman #endif 128463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 12859566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_hypre_C",NULL)); 12869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",NULL)); 128763c07aadSStefano Zampini #endif 12889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqdense_C",NULL)); 12899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsell_C",NULL)); 12909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_is_C",NULL)); 12919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatIsTranspose_C",NULL)); 12929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",NULL)); 12939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatResetPreallocation_C",NULL)); 12949566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C",NULL)); 12959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatReorderForNonzeroDiagonal_C",NULL)); 12969566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_is_seqaij_C",NULL)); 12979566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqdense_seqaij_C",NULL)); 12989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaij_C",NULL)); 12999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJKron_C",NULL)); 13009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetPreallocationCOO_C",NULL)); 13019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A,"MatSetValuesCOO_C",NULL)); 13023a40ed3dSBarry Smith PetscFunctionReturn(0); 130317ab2063SBarry Smith } 130417ab2063SBarry Smith 1305ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 130617ab2063SBarry Smith { 1307416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 13083a40ed3dSBarry Smith 13093a40ed3dSBarry Smith PetscFunctionBegin; 1310a65d3064SKris Buschelman switch (op) { 1311a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 13124e0d8c25SBarry Smith a->roworiented = flg; 1313a65d3064SKris Buschelman break; 1314a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 1315a9817697SBarry Smith a->keepnonzeropattern = flg; 1316a65d3064SKris Buschelman break; 1317512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1318512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 1319a65d3064SKris Buschelman break; 1320a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 13214e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 1322a65d3064SKris Buschelman break; 1323a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 13244e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 1325a65d3064SKris Buschelman break; 132628b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 132728b2fa4aSMatthew Knepley a->nounused = (flg ? 
-1 : 0); 132828b2fa4aSMatthew Knepley break; 1329a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 13304e0d8c25SBarry Smith a->ignorezeroentries = flg; 13310df259c2SBarry Smith break; 13323d472b54SHong Zhang case MAT_SPD: 1333b1646e73SJed Brown case MAT_SYMMETRIC: 1334b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1335b1646e73SJed Brown case MAT_HERMITIAN: 1336b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1337957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 13385021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 13395021d80fSJed Brown break; 13408c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 1341a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1342a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 13439566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Option %s ignored\n",MatOptions[op])); 1344a65d3064SKris Buschelman break; 1345b87ac2d8SJed Brown case MAT_USE_INODES: 13469566063dSJacob Faibussowitsch PetscCall(MatSetOption_SeqAIJ_Inode(A,MAT_USE_INODES,flg)); 1347b87ac2d8SJed Brown break; 1348c10200c1SHong Zhang case MAT_SUBMAT_SINGLEIS: 1349c10200c1SHong Zhang A->submat_singleis = flg; 1350c10200c1SHong Zhang break; 1351071fcb05SBarry Smith case MAT_SORTED_FULL: 1352071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1353071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1354071fcb05SBarry Smith break; 13551a2c6b5cSJunchao Zhang case MAT_FORM_EXPLICIT_TRANSPOSE: 13561a2c6b5cSJunchao Zhang A->form_explicit_transpose = flg; 13571a2c6b5cSJunchao Zhang break; 1358a65d3064SKris Buschelman default: 135998921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 1360a65d3064SKris Buschelman } 13613a40ed3dSBarry Smith PetscFunctionReturn(0); 136217ab2063SBarry Smith } 136317ab2063SBarry Smith 1364dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 136517ab2063SBarry Smith { 1366416022c9SBarry Smith Mat_SeqAIJ *a = 
(Mat_SeqAIJ*)A->data; 1367fdc842d1SBarry Smith PetscInt i,j,n,*ai=a->i,*aj=a->j; 1368c898d852SStefano Zampini PetscScalar *x; 1369c898d852SStefano Zampini const PetscScalar *aa; 137017ab2063SBarry Smith 13713a40ed3dSBarry Smith PetscFunctionBegin; 13729566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 13732c71b3e2SJacob Faibussowitsch PetscCheckFalse(n != A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 13749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 1375d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1376d3e70bfaSHong Zhang PetscInt *diag=a->diag; 13779566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 13782c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 13799566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 13809566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 138135e7444dSHong Zhang PetscFunctionReturn(0); 138235e7444dSHong Zhang } 138335e7444dSHong Zhang 13849566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 138535e7444dSHong Zhang for (i=0; i<n; i++) { 1386fdc842d1SBarry Smith x[i] = 0.0; 138735e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++) { 138835e7444dSHong Zhang if (aj[j] == i) { 138935e7444dSHong Zhang x[i] = aa[j]; 139017ab2063SBarry Smith break; 139117ab2063SBarry Smith } 139217ab2063SBarry Smith } 139317ab2063SBarry Smith } 13949566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 13959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 13963a40ed3dSBarry Smith PetscFunctionReturn(0); 139717ab2063SBarry Smith } 139817ab2063SBarry Smith 1399c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1400dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 140117ab2063SBarry Smith { 1402416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 
14035f22a7b3SSebastian Grimberg const MatScalar *aa; 1404d9ca1df4SBarry Smith PetscScalar *y; 1405d9ca1df4SBarry Smith const PetscScalar *x; 1406d0f46423SBarry Smith PetscInt m = A->rmap->n; 14075c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 14085f22a7b3SSebastian Grimberg const MatScalar *v; 1409a77337e4SBarry Smith PetscScalar alpha; 1410d9ca1df4SBarry Smith PetscInt n,i,j; 1411d9ca1df4SBarry Smith const PetscInt *idx,*ii,*ridx=NULL; 14123447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1413ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 14145c897100SBarry Smith #endif 141517ab2063SBarry Smith 14163a40ed3dSBarry Smith PetscFunctionBegin; 14179566063dSJacob Faibussowitsch if (zz != yy) PetscCall(VecCopy(zz,yy)); 14189566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 14199566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 14209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 14215c897100SBarry Smith 14225c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1423fff043a9SJunchao Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,aa,y); 14245c897100SBarry Smith #else 14253447b6efSHong Zhang if (usecprow) { 14263447b6efSHong Zhang m = cprow.nrows; 14273447b6efSHong Zhang ii = cprow.i; 14287b2bb3b9SHong Zhang ridx = cprow.rindex; 14293447b6efSHong Zhang } else { 14303447b6efSHong Zhang ii = a->i; 14313447b6efSHong Zhang } 143217ab2063SBarry Smith for (i=0; i<m; i++) { 14333447b6efSHong Zhang idx = a->j + ii[i]; 1434fff043a9SJunchao Zhang v = aa + ii[i]; 14353447b6efSHong Zhang n = ii[i+1] - ii[i]; 14363447b6efSHong Zhang if (usecprow) { 14377b2bb3b9SHong Zhang alpha = x[ridx[i]]; 14383447b6efSHong Zhang } else { 143917ab2063SBarry Smith alpha = x[i]; 14403447b6efSHong Zhang } 144104fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 144217ab2063SBarry Smith } 14435c897100SBarry Smith #endif 14449566063dSJacob Faibussowitsch 
PetscCall(PetscLogFlops(2.0*a->nz)); 14459566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 14469566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 14479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 14483a40ed3dSBarry Smith PetscFunctionReturn(0); 144917ab2063SBarry Smith } 145017ab2063SBarry Smith 1451dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 14525c897100SBarry Smith { 14535c897100SBarry Smith PetscFunctionBegin; 14549566063dSJacob Faibussowitsch PetscCall(VecSet(yy,0.0)); 14559566063dSJacob Faibussowitsch PetscCall(MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy)); 14565c897100SBarry Smith PetscFunctionReturn(0); 14575c897100SBarry Smith } 14585c897100SBarry Smith 1459c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 146078b84d54SShri Abhyankar 1461dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 146217ab2063SBarry Smith { 1463416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1464d9fead3dSBarry Smith PetscScalar *y; 146554f21887SBarry Smith const PetscScalar *x; 1466fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1467003131ecSBarry Smith PetscInt m=A->rmap->n; 14680298fd71SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 14697b083b7cSBarry Smith PetscInt n,i; 1470362ced78SSatish Balay PetscScalar sum; 1471ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 147217ab2063SBarry Smith 1473b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 147497952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1475fee21e36SBarry Smith #endif 1476fee21e36SBarry Smith 14773a40ed3dSBarry Smith PetscFunctionBegin; 1478b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 14799566063dSJacob Faibussowitsch PetscCall(MatMult_SeqAIJ_Inode(A,xx,yy)); 1480b215bc84SStefano Zampini PetscFunctionReturn(0); 1481b215bc84SStefano Zampini } 14829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 
14839566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 14849566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 1485416022c9SBarry Smith ii = a->i; 14864eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 14879566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(y,m)); 148897952fefSHong Zhang m = a->compressedrow.nrows; 148997952fefSHong Zhang ii = a->compressedrow.i; 149097952fefSHong Zhang ridx = a->compressedrow.rindex; 149197952fefSHong Zhang for (i=0; i<m; i++) { 149297952fefSHong Zhang n = ii[i+1] - ii[i]; 149397952fefSHong Zhang aj = a->j + ii[i]; 1494fff043a9SJunchao Zhang aa = a_a + ii[i]; 149597952fefSHong Zhang sum = 0.0; 1496003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 1497003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 149897952fefSHong Zhang y[*ridx++] = sum; 149997952fefSHong Zhang } 150097952fefSHong Zhang } else { /* do not use compressed row format */ 1501b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 15023d3eaba7SBarry Smith aj = a->j; 1503fff043a9SJunchao Zhang aa = a_a; 1504b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1505b05257ddSBarry Smith #else 150617ab2063SBarry Smith for (i=0; i<m; i++) { 1507003131ecSBarry Smith n = ii[i+1] - ii[i]; 1508003131ecSBarry Smith aj = a->j + ii[i]; 1509fff043a9SJunchao Zhang aa = a_a + ii[i]; 151017ab2063SBarry Smith sum = 0.0; 1511003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 151217ab2063SBarry Smith y[i] = sum; 151317ab2063SBarry Smith } 15148d195f9aSBarry Smith #endif 1515b05257ddSBarry Smith } 15169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz - a->nonzerorowcnt)); 15179566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 15189566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 15199566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 15203a40ed3dSBarry Smith PetscFunctionReturn(0); 152117ab2063SBarry Smith } 
152217ab2063SBarry Smith 1523b434eb95SMatthew G. Knepley PetscErrorCode MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy) 1524b434eb95SMatthew G. Knepley { 1525b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1526b434eb95SMatthew G. Knepley PetscScalar *y; 1527b434eb95SMatthew G. Knepley const PetscScalar *x; 1528fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1529b434eb95SMatthew G. Knepley PetscInt m=A->rmap->n; 1530b434eb95SMatthew G. Knepley const PetscInt *aj,*ii,*ridx=NULL; 1531b434eb95SMatthew G. Knepley PetscInt n,i,nonzerorow=0; 1532b434eb95SMatthew G. Knepley PetscScalar sum; 1533b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1534b434eb95SMatthew G. Knepley 1535b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1536b434eb95SMatthew G. Knepley #pragma disjoint(*x,*y,*aa) 1537b434eb95SMatthew G. Knepley #endif 1538b434eb95SMatthew G. Knepley 1539b434eb95SMatthew G. Knepley PetscFunctionBegin; 15409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 15419566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 15429566063dSJacob Faibussowitsch PetscCall(VecGetArray(yy,&y)); 1543b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1544b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1545b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1546b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1547b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1548b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1549b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1550fff043a9SJunchao Zhang aa = a_a + ii[i]; 1551b434eb95SMatthew G. Knepley sum = 0.0; 1552b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1553b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1554b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1555b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1556b434eb95SMatthew G. Knepley } 1557b434eb95SMatthew G. 
Knepley } else { /* do not use compressed row format */ 15583d3eaba7SBarry Smith ii = a->i; 1559b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1560b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1561b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1562fff043a9SJunchao Zhang aa = a_a + ii[i]; 1563b434eb95SMatthew G. Knepley sum = 0.0; 1564b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1565b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1566b434eb95SMatthew G. Knepley y[i] = sum; 1567b434eb95SMatthew G. Knepley } 1568b434eb95SMatthew G. Knepley } 15699566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz - nonzerorow)); 15709566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 15719566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(yy,&y)); 15729566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 1573b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1574b434eb95SMatthew G. Knepley } 1575b434eb95SMatthew G. Knepley 1576b434eb95SMatthew G. Knepley PetscErrorCode MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 1577b434eb95SMatthew G. Knepley { 1578b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1579b434eb95SMatthew G. Knepley PetscScalar *y,*z; 1580b434eb95SMatthew G. Knepley const PetscScalar *x; 1581fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1582b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n,*aj,*ii; 1583b434eb95SMatthew G. Knepley PetscInt n,i,*ridx=NULL; 1584b434eb95SMatthew G. Knepley PetscScalar sum; 1585b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1586b434eb95SMatthew G. Knepley 1587b434eb95SMatthew G. Knepley PetscFunctionBegin; 15889566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 15899566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 15909566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy,zz,&y,&z)); 1591b434eb95SMatthew G. 
Knepley if (usecprow) { /* use compressed row format */ 1592b434eb95SMatthew G. Knepley if (zz != yy) { 15939566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(z,y,m)); 1594b434eb95SMatthew G. Knepley } 1595b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1596b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1597b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1598b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1599b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1600b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1601fff043a9SJunchao Zhang aa = a_a + ii[i]; 1602b434eb95SMatthew G. Knepley sum = y[*ridx]; 1603b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1604b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1605b434eb95SMatthew G. Knepley } 1606b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 16073d3eaba7SBarry Smith ii = a->i; 1608b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1609b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1610b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1611fff043a9SJunchao Zhang aa = a_a + ii[i]; 1612b434eb95SMatthew G. Knepley sum = y[i]; 1613b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1614b434eb95SMatthew G. Knepley z[i] = sum; 1615b434eb95SMatthew G. Knepley } 1616b434eb95SMatthew G. Knepley } 16179566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 16189566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 16199566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy,zz,&y,&z)); 16209566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 1621b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1622b434eb95SMatthew G. Knepley } 1623b434eb95SMatthew G. 
Knepley 1624c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1625dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 162617ab2063SBarry Smith { 1627416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1628f15663dcSBarry Smith PetscScalar *y,*z; 1629f15663dcSBarry Smith const PetscScalar *x; 1630fff043a9SJunchao Zhang const MatScalar *aa,*a_a; 1631d9ca1df4SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 1632d9ca1df4SBarry Smith PetscInt m = A->rmap->n,n,i; 1633362ced78SSatish Balay PetscScalar sum; 1634ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 16359ea0dfa2SSatish Balay 16363a40ed3dSBarry Smith PetscFunctionBegin; 1637b215bc84SStefano Zampini if (a->inode.use && a->inode.checked) { 16389566063dSJacob Faibussowitsch PetscCall(MatMultAdd_SeqAIJ_Inode(A,xx,yy,zz)); 1639b215bc84SStefano Zampini PetscFunctionReturn(0); 1640b215bc84SStefano Zampini } 16419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&a_a)); 16429566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(xx,&x)); 16439566063dSJacob Faibussowitsch PetscCall(VecGetArrayPair(yy,zz,&y,&z)); 16444eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 16454eb6d288SHong Zhang if (zz != yy) { 16469566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(z,y,m)); 16474eb6d288SHong Zhang } 164897952fefSHong Zhang m = a->compressedrow.nrows; 164997952fefSHong Zhang ii = a->compressedrow.i; 165097952fefSHong Zhang ridx = a->compressedrow.rindex; 165197952fefSHong Zhang for (i=0; i<m; i++) { 165297952fefSHong Zhang n = ii[i+1] - ii[i]; 165397952fefSHong Zhang aj = a->j + ii[i]; 1654fff043a9SJunchao Zhang aa = a_a + ii[i]; 165597952fefSHong Zhang sum = y[*ridx]; 1656f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 165797952fefSHong Zhang z[*ridx++] = sum; 165897952fefSHong Zhang } 165997952fefSHong Zhang } else { /* do not use compressed row format */ 16603d3eaba7SBarry Smith ii = a->i; 1661f15663dcSBarry 
Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 16623d3eaba7SBarry Smith aj = a->j; 1663fff043a9SJunchao Zhang aa = a_a; 1664f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1665f15663dcSBarry Smith #else 166617ab2063SBarry Smith for (i=0; i<m; i++) { 1667f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1668f15663dcSBarry Smith aj = a->j + ii[i]; 1669fff043a9SJunchao Zhang aa = a_a + ii[i]; 167017ab2063SBarry Smith sum = y[i]; 1671f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 167217ab2063SBarry Smith z[i] = sum; 167317ab2063SBarry Smith } 167402ab625aSSatish Balay #endif 1675f15663dcSBarry Smith } 16769566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 16779566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(xx,&x)); 16789566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayPair(yy,zz,&y,&z)); 16799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&a_a)); 16803a40ed3dSBarry Smith PetscFunctionReturn(0); 168117ab2063SBarry Smith } 168217ab2063SBarry Smith 168317ab2063SBarry Smith /* 168417ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
168517ab2063SBarry Smith */ 1686dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 168717ab2063SBarry Smith { 1688416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1689d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 1690c0c07093SJunchao Zhang PetscBool alreadySet = PETSC_TRUE; 169117ab2063SBarry Smith 16923a40ed3dSBarry Smith PetscFunctionBegin; 169309f38230SBarry Smith if (!a->diag) { 16949566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&a->diag)); 16959566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A, m*sizeof(PetscInt))); 1696c0c07093SJunchao Zhang alreadySet = PETSC_FALSE; 169709f38230SBarry Smith } 1698d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 1699c0c07093SJunchao Zhang /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */ 1700c0c07093SJunchao Zhang if (alreadySet) { 1701c0c07093SJunchao Zhang PetscInt pos = a->diag[i]; 1702c0c07093SJunchao Zhang if (pos >= a->i[i] && pos < a->i[i+1] && a->j[pos] == i) continue; 1703c0c07093SJunchao Zhang } 1704c0c07093SJunchao Zhang 170509f38230SBarry Smith a->diag[i] = a->i[i+1]; 1706bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1707bfeeae90SHong Zhang if (a->j[j] == i) { 170809f38230SBarry Smith a->diag[i] = j; 170917ab2063SBarry Smith break; 171017ab2063SBarry Smith } 171117ab2063SBarry Smith } 171217ab2063SBarry Smith } 17133a40ed3dSBarry Smith PetscFunctionReturn(0); 171417ab2063SBarry Smith } 171517ab2063SBarry Smith 171661ecd0c6SBarry Smith PetscErrorCode MatShift_SeqAIJ(Mat A,PetscScalar v) 171761ecd0c6SBarry Smith { 171861ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 171961ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt*)a->diag; 172061ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt*) a->i; 172161ecd0c6SBarry Smith PetscInt i,*mdiag = NULL; 172261ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 172361ecd0c6SBarry Smith 
172461ecd0c6SBarry Smith PetscFunctionBegin; 172561ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 17269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(A,1,NULL)); 17279566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A,v)); 172861ecd0c6SBarry Smith PetscFunctionReturn(0); 172961ecd0c6SBarry Smith } 173061ecd0c6SBarry Smith 173161ecd0c6SBarry Smith if (a->diagonaldense) { 173261ecd0c6SBarry Smith cnt = 0; 173361ecd0c6SBarry Smith } else { 17349566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n,&mdiag)); 173561ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 1736*349d3b71SJunchao Zhang if (i < A->cmap->n && diag[i] >= ii[i+1]) { /* 'out of range' rows never have diagonals */ 173761ecd0c6SBarry Smith cnt++; 173861ecd0c6SBarry Smith mdiag[i] = 1; 173961ecd0c6SBarry Smith } 174061ecd0c6SBarry Smith } 174161ecd0c6SBarry Smith } 174261ecd0c6SBarry Smith if (!cnt) { 17439566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(A,v)); 174461ecd0c6SBarry Smith } else { 1745b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1746b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 174761ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc,free_a = a->free_a,free_ij = a->free_ij; 174861ecd0c6SBarry Smith 174961ecd0c6SBarry Smith a->a = NULL; 175061ecd0c6SBarry Smith a->j = NULL; 175161ecd0c6SBarry Smith a->i = NULL; 175261ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 1753*349d3b71SJunchao Zhang for (i=0; i<PetscMin(A->rmap->n,A->cmap->n); i++) { 175461ecd0c6SBarry Smith a->imax[i] += mdiag[i]; 175561ecd0c6SBarry Smith } 17569566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A,0,a->imax)); 175761ecd0c6SBarry Smith 175861ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 175961ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 
17609566063dSJacob Faibussowitsch PetscCall(MatSetValues(A,1,&i,a->imax[i] - mdiag[i],&oldj[oldi[i]],&olda[oldi[i]],ADD_VALUES)); 1761447d62f5SStefano Zampini if (i < A->cmap->n) { 17629566063dSJacob Faibussowitsch PetscCall(MatSetValue(A,i,i,v,ADD_VALUES)); 176361ecd0c6SBarry Smith } 1764447d62f5SStefano Zampini } 17659566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY)); 17669566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY)); 176761ecd0c6SBarry Smith if (singlemalloc) { 17689566063dSJacob Faibussowitsch PetscCall(PetscFree3(olda,oldj,oldi)); 176961ecd0c6SBarry Smith } else { 17709566063dSJacob Faibussowitsch if (free_a) PetscCall(PetscFree(olda)); 17719566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldj)); 17729566063dSJacob Faibussowitsch if (free_ij) PetscCall(PetscFree(oldi)); 177361ecd0c6SBarry Smith } 177461ecd0c6SBarry Smith } 17759566063dSJacob Faibussowitsch PetscCall(PetscFree(mdiag)); 177661ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 177761ecd0c6SBarry Smith PetscFunctionReturn(0); 177861ecd0c6SBarry Smith } 177961ecd0c6SBarry Smith 1780be5855fcSBarry Smith /* 1781be5855fcSBarry Smith Checks for missing diagonals 1782be5855fcSBarry Smith */ 1783ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1784be5855fcSBarry Smith { 1785be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 17867734d3b5SMatthew G. Knepley PetscInt *diag,*ii = a->i,i; 1787be5855fcSBarry Smith 1788be5855fcSBarry Smith PetscFunctionBegin; 178909f38230SBarry Smith *missing = PETSC_FALSE; 17907734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 179109f38230SBarry Smith *missing = PETSC_TRUE; 179209f38230SBarry Smith if (d) *d = 0; 17939566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n")); 179409f38230SBarry Smith } else { 179501445905SHong Zhang PetscInt n; 179601445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1797f1e2ffcdSBarry Smith diag = a->diag; 179801445905SHong Zhang for (i=0; i<n; i++) { 17997734d3b5SMatthew G. Knepley if (diag[i] >= ii[i+1]) { 180009f38230SBarry Smith *missing = PETSC_TRUE; 180109f38230SBarry Smith if (d) *d = i; 18029566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Matrix is missing diagonal number %" PetscInt_FMT "\n",i)); 1803358d2f5dSShri Abhyankar break; 180409f38230SBarry Smith } 1805be5855fcSBarry Smith } 1806be5855fcSBarry Smith } 1807be5855fcSBarry Smith PetscFunctionReturn(0); 1808be5855fcSBarry Smith } 1809be5855fcSBarry Smith 18100da83c2eSBarry Smith #include <petscblaslapack.h> 18110da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 18120da83c2eSBarry Smith 18130da83c2eSBarry Smith /* 18140da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 18150da83c2eSBarry Smith */ 18160da83c2eSBarry Smith PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt *bsizes,PetscScalar *diag) 18170da83c2eSBarry Smith { 18180da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx,j,bsizemax = 0,*v_pivots; 18190da83c2eSBarry Smith PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 18200da83c2eSBarry Smith const PetscReal shift = 0.0; 18210da83c2eSBarry Smith PetscInt ipvt[5]; 18220da83c2eSBarry Smith PetscScalar work[25],*v_work; 18230da83c2eSBarry Smith 18240da83c2eSBarry Smith PetscFunctionBegin; 18250da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 18260da83c2eSBarry Smith for (i=0; i<nblocks; i++) ncnt += bsizes[i]; 18272c71b3e2SJacob Faibussowitsch 
PetscCheckFalse(ncnt != n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT,ncnt,n); 18280da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 18290da83c2eSBarry Smith bsizemax = PetscMax(bsizemax,bsizes[i]); 18300da83c2eSBarry Smith } 18319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bsizemax,&indx)); 18320da83c2eSBarry Smith if (bsizemax > 7) { 18339566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(bsizemax,&v_work,bsizemax,&v_pivots)); 18340da83c2eSBarry Smith } 18350da83c2eSBarry Smith ncnt = 0; 18360da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 18370da83c2eSBarry Smith for (j=0; j<bsizes[i]; j++) indx[j] = ncnt+j; 18389566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,bsizes[i],indx,bsizes[i],indx,diag)); 18390da83c2eSBarry Smith switch (bsizes[i]) { 18400da83c2eSBarry Smith case 1: 18410da83c2eSBarry Smith *diag = 1.0/(*diag); 18420da83c2eSBarry Smith break; 18430da83c2eSBarry Smith case 2: 18449566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected)); 18450da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18469566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 18470da83c2eSBarry Smith break; 18480da83c2eSBarry Smith case 3: 18499566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected)); 18500da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18519566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 18520da83c2eSBarry Smith break; 18530da83c2eSBarry Smith case 4: 18549566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected)); 18550da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18569566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 18570da83c2eSBarry Smith break; 18580da83c2eSBarry Smith case 5: 18599566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected)); 18600da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18619566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 18620da83c2eSBarry Smith break; 18630da83c2eSBarry Smith case 6: 18649566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected)); 18650da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18669566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 18670da83c2eSBarry Smith break; 18680da83c2eSBarry Smith case 7: 18699566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected)); 18700da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18719566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 18720da83c2eSBarry Smith break; 18730da83c2eSBarry Smith default: 18749566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i],diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected)); 18750da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18769566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag,bsizes[i])); 18770da83c2eSBarry Smith } 18780da83c2eSBarry Smith ncnt += bsizes[i]; 18790da83c2eSBarry Smith diag += bsizes[i]*bsizes[i]; 18800da83c2eSBarry Smith } 18810da83c2eSBarry Smith if (bsizemax > 7) { 18829566063dSJacob Faibussowitsch PetscCall(PetscFree2(v_work,v_pivots)); 18830da83c2eSBarry Smith } 18849566063dSJacob Faibussowitsch PetscCall(PetscFree(indx)); 18850da83c2eSBarry Smith PetscFunctionReturn(0); 
18860da83c2eSBarry Smith } 18870da83c2eSBarry Smith 1888422a814eSBarry Smith /* 1889422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1890422a814eSBarry Smith */ 18917087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 189271f1c65dSBarry Smith { 189371f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 1894d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 18952e5835c6SStefano Zampini const MatScalar *v; 189654f21887SBarry Smith PetscScalar *idiag,*mdiag; 189771f1c65dSBarry Smith 189871f1c65dSBarry Smith PetscFunctionBegin; 189971f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 19009566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 190171f1c65dSBarry Smith diag = a->diag; 190271f1c65dSBarry Smith if (!a->idiag) { 19039566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(m,&a->idiag,m,&a->mdiag,m,&a->ssor_work)); 19049566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,3*m*sizeof(PetscScalar))); 190571f1c65dSBarry Smith } 19062e5835c6SStefano Zampini 190771f1c65dSBarry Smith mdiag = a->mdiag; 190871f1c65dSBarry Smith idiag = a->idiag; 19099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&v)); 1910422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 191171f1c65dSBarry Smith for (i=0; i<m; i++) { 191271f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1913899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1914899639b0SHong Zhang if (PetscRealPart(fshift)) { 19159566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Zero diagonal on row %" PetscInt_FMT "\n",i)); 19167b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 19177b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 19187b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 191998921bdaSJacob Faibussowitsch } else 
SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %" PetscInt_FMT,i); 1920899639b0SHong Zhang } 192171f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 192271f1c65dSBarry Smith } 19239566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(m)); 192471f1c65dSBarry Smith } else { 192571f1c65dSBarry Smith for (i=0; i<m; i++) { 192671f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 192771f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 192871f1c65dSBarry Smith } 19299566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*m)); 193071f1c65dSBarry Smith } 193171f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 19329566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&v)); 193371f1c65dSBarry Smith PetscFunctionReturn(0); 193471f1c65dSBarry Smith } 193571f1c65dSBarry Smith 1936c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 193741f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 193817ab2063SBarry Smith { 1939416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1940e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 19412e5835c6SStefano Zampini const MatScalar *v,*idiag=NULL,*mdiag,*aa; 194254f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 19433d3eaba7SBarry Smith PetscInt n,m = A->rmap->n,i; 194497f1f81fSBarry Smith const PetscInt *idx,*diag; 194517ab2063SBarry Smith 19463a40ed3dSBarry Smith PetscFunctionBegin; 1947b215bc84SStefano Zampini if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) { 19489566063dSJacob Faibussowitsch PetscCall(MatSOR_SeqAIJ_Inode(A,bb,omega,flag,fshift,its,lits,xx)); 1949b215bc84SStefano Zampini PetscFunctionReturn(0); 1950b215bc84SStefano Zampini } 1951b965ef7fSBarry Smith its = its*lits; 195291723122SBarry Smith 195371f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 19549566063dSJacob 
Faibussowitsch if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A,omega,fshift)); 195571f1c65dSBarry Smith a->fshift = fshift; 195671f1c65dSBarry Smith a->omega = omega; 1957ed480e8bSBarry Smith 195871f1c65dSBarry Smith diag = a->diag; 195971f1c65dSBarry Smith t = a->ssor_work; 1960ed480e8bSBarry Smith idiag = a->idiag; 196171f1c65dSBarry Smith mdiag = a->mdiag; 1962ed480e8bSBarry Smith 19639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 19649566063dSJacob Faibussowitsch PetscCall(VecGetArray(xx,&x)); 19659566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(bb,&b)); 1966ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 196717ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 196817ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1969ed480e8bSBarry Smith bs = b; 197017ab2063SBarry Smith for (i=0; i<m; i++) { 197171f1c65dSBarry Smith d = fshift + mdiag[i]; 1972416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1973ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 19742e5835c6SStefano Zampini v = aa + diag[i] + 1; 197517ab2063SBarry Smith sum = b[i]*d/omega; 1976003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 197717ab2063SBarry Smith x[i] = sum; 197817ab2063SBarry Smith } 19799566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 19809566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 19819566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 19829566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 19833a40ed3dSBarry Smith PetscFunctionReturn(0); 198417ab2063SBarry Smith } 1985c783ea89SBarry Smith 19862c71b3e2SJacob Faibussowitsch PetscCheckFalse(flag == SOR_APPLY_LOWER,PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 19872205254eSKarl Rupp else if (flag & SOR_EISENSTAT) { 19884c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 
1989887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 199017ab2063SBarry Smith 199117ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 199217ab2063SBarry Smith 1993887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 199417ab2063SBarry Smith */ 199517ab2063SBarry Smith scale = (2.0/omega) - 1.0; 199617ab2063SBarry Smith 199717ab2063SBarry Smith /* x = (E + U)^{-1} b */ 199817ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1999416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 2000ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20012e5835c6SStefano Zampini v = aa + diag[i] + 1; 200217ab2063SBarry Smith sum = b[i]; 2003e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2004ed480e8bSBarry Smith x[i] = sum*idiag[i]; 200517ab2063SBarry Smith } 200617ab2063SBarry Smith 200717ab2063SBarry Smith /* t = b - (2*E - D)x */ 20082e5835c6SStefano Zampini v = aa; 20092205254eSKarl Rupp for (i=0; i<m; i++) t[i] = b[i] - scale*(v[*diag++])*x[i]; 201017ab2063SBarry Smith 201117ab2063SBarry Smith /* t = (E + L)^{-1}t */ 2012ed480e8bSBarry Smith ts = t; 2013416022c9SBarry Smith diag = a->diag; 201417ab2063SBarry Smith for (i=0; i<m; i++) { 2015416022c9SBarry Smith n = diag[i] - a->i[i]; 2016ed480e8bSBarry Smith idx = a->j + a->i[i]; 20172e5835c6SStefano Zampini v = aa + a->i[i]; 201817ab2063SBarry Smith sum = t[i]; 2019003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 2020ed480e8bSBarry Smith t[i] = sum*idiag[i]; 2021733d66baSBarry Smith /* x = x + t */ 2022733d66baSBarry Smith x[i] += t[i]; 202317ab2063SBarry Smith } 202417ab2063SBarry Smith 20259566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(6.0*m-1 + 2.0*a->nz)); 20269566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 20279566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 20283a40ed3dSBarry Smith PetscFunctionReturn(0); 202917ab2063SBarry Smith } 203017ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 203117ab2063SBarry Smith if 
(flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 203217ab2063SBarry Smith for (i=0; i<m; i++) { 2033416022c9SBarry Smith n = diag[i] - a->i[i]; 2034ed480e8bSBarry Smith idx = a->j + a->i[i]; 20352e5835c6SStefano Zampini v = aa + a->i[i]; 203617ab2063SBarry Smith sum = b[i]; 2037e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 20385c99c7daSBarry Smith t[i] = sum; 2039ed480e8bSBarry Smith x[i] = sum*idiag[i]; 204017ab2063SBarry Smith } 20415c99c7daSBarry Smith xb = t; 20429566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 20433a40ed3dSBarry Smith } else xb = b; 204417ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 204517ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2046416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 2047ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 20482e5835c6SStefano Zampini v = aa + diag[i] + 1; 204917ab2063SBarry Smith sum = xb[i]; 2050e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 20515c99c7daSBarry Smith if (xb == b) { 2052ed480e8bSBarry Smith x[i] = sum*idiag[i]; 20535c99c7daSBarry Smith } else { 2054b19a5dc2SMark Adams x[i] = (1-omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 205517ab2063SBarry Smith } 20565c99c7daSBarry Smith } 20579566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 205817ab2063SBarry Smith } 205917ab2063SBarry Smith its--; 206017ab2063SBarry Smith } 206117ab2063SBarry Smith while (its--) { 206217ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 206317ab2063SBarry Smith for (i=0; i<m; i++) { 2064b19a5dc2SMark Adams /* lower */ 2065b19a5dc2SMark Adams n = diag[i] - a->i[i]; 2066ed480e8bSBarry Smith idx = a->j + a->i[i]; 20672e5835c6SStefano Zampini v = aa + a->i[i]; 206817ab2063SBarry Smith sum = b[i]; 2069e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2070b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 
2071b19a5dc2SMark Adams /* upper */ 2072b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 2073b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20742e5835c6SStefano Zampini v = aa + diag[i] + 1; 2075b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 2076b19a5dc2SMark Adams x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 207717ab2063SBarry Smith } 2078b19a5dc2SMark Adams xb = t; 20799566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 2080b19a5dc2SMark Adams } else xb = b; 208117ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 208217ab2063SBarry Smith for (i=m-1; i>=0; i--) { 2083b19a5dc2SMark Adams sum = xb[i]; 2084b19a5dc2SMark Adams if (xb == b) { 2085b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 2086416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 2087ed480e8bSBarry Smith idx = a->j + a->i[i]; 20882e5835c6SStefano Zampini v = aa + a->i[i]; 2089e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 2090ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 2091b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 2092b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 2093b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 20942e5835c6SStefano Zampini v = aa + diag[i] + 1; 2095b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 2096b19a5dc2SMark Adams x[i] = (1. 
- omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 209717ab2063SBarry Smith } 2098b19a5dc2SMark Adams } 2099b19a5dc2SMark Adams if (xb == b) { 21009566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 2101b19a5dc2SMark Adams } else { 21029566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */ 2103b19a5dc2SMark Adams } 210417ab2063SBarry Smith } 210517ab2063SBarry Smith } 21069566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 21079566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(xx,&x)); 21089566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(bb,&b)); 2109365a8a9eSBarry Smith PetscFunctionReturn(0); 211017ab2063SBarry Smith } 211117ab2063SBarry Smith 2112dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 211317ab2063SBarry Smith { 2114416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 21154e220ebcSLois Curfman McInnes 21163a40ed3dSBarry Smith PetscFunctionBegin; 21174e220ebcSLois Curfman McInnes info->block_size = 1.0; 21183966268fSBarry Smith info->nz_allocated = a->maxnz; 21193966268fSBarry Smith info->nz_used = a->nz; 21203966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 21213966268fSBarry Smith info->assemblies = A->num_ass; 21223966268fSBarry Smith info->mallocs = A->info.mallocs; 21237adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 2124d5f3da31SBarry Smith if (A->factortype) { 21254e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 21264e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 21274e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 21284e220ebcSLois Curfman McInnes } else { 21294e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 21304e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 21314e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 21324e220ebcSLois Curfman McInnes } 21333a40ed3dSBarry 
Smith PetscFunctionReturn(0); 213417ab2063SBarry Smith } 213517ab2063SBarry Smith 21362b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 213717ab2063SBarry Smith { 2138416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2139c7da8527SEric Chamberland PetscInt i,m = A->rmap->n - 1; 214097b48c8fSBarry Smith const PetscScalar *xx; 21412e5835c6SStefano Zampini PetscScalar *bb,*aa; 2142c7da8527SEric Chamberland PetscInt d = 0; 214317ab2063SBarry Smith 21443a40ed3dSBarry Smith PetscFunctionBegin; 214597b48c8fSBarry Smith if (x && b) { 21469566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x,&xx)); 21479566063dSJacob Faibussowitsch PetscCall(VecGetArray(b,&bb)); 214897b48c8fSBarry Smith for (i=0; i<N; i++) { 21492c71b3e2SJacob Faibussowitsch PetscCheckFalse(rows[i] < 0 || rows[i] > m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 2150447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 215197b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 215297b48c8fSBarry Smith } 21539566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x,&xx)); 21549566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b,&bb)); 215597b48c8fSBarry Smith } 215697b48c8fSBarry Smith 21579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 2158a9817697SBarry Smith if (a->keepnonzeropattern) { 2159f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 21602c71b3e2SJacob Faibussowitsch PetscCheckFalse(rows[i] < 0 || rows[i] > m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 21619566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]],a->ilen[rows[i]])); 2162f1e2ffcdSBarry Smith } 2163f4df32b1SMatthew Knepley if (diag != 0.0) { 2164c7da8527SEric Chamberland for (i=0; i<N; i++) { 2165c7da8527SEric Chamberland d = rows[i]; 2166447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21672c71b3e2SJacob 
Faibussowitsch PetscCheckFalse(a->diag[d] >= a->i[d+1],PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT,d); 2168c7da8527SEric Chamberland } 2169f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2170447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 21712e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 2172f1e2ffcdSBarry Smith } 2173f1e2ffcdSBarry Smith } 2174f1e2ffcdSBarry Smith } else { 2175f4df32b1SMatthew Knepley if (diag != 0.0) { 217617ab2063SBarry Smith for (i=0; i<N; i++) { 21772c71b3e2SJacob Faibussowitsch PetscCheckFalse(rows[i] < 0 || rows[i] > m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 21787ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2179447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2180447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2181447d62f5SStefano Zampini } else { 2182416022c9SBarry Smith a->ilen[rows[i]] = 1; 21832e5835c6SStefano Zampini aa[a->i[rows[i]]] = diag; 2184bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2185447d62f5SStefano Zampini } 2186447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 21879566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES)); 218817ab2063SBarry Smith } 218917ab2063SBarry Smith } 21903a40ed3dSBarry Smith } else { 219117ab2063SBarry Smith for (i=0; i<N; i++) { 21922c71b3e2SJacob Faibussowitsch PetscCheckFalse(rows[i] < 0 || rows[i] > m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 2193416022c9SBarry Smith a->ilen[rows[i]] = 0; 219417ab2063SBarry Smith } 219517ab2063SBarry Smith } 2196e56f5c9eSBarry Smith A->nonzerostate++; 2197f1e2ffcdSBarry Smith } 21989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 21999566063dSJacob Faibussowitsch PetscCall((*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY)); 22003a40ed3dSBarry Smith 
PetscFunctionReturn(0); 220117ab2063SBarry Smith } 220217ab2063SBarry Smith 22036e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 22046e169961SBarry Smith { 22056e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 22066e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 22072b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 22086e169961SBarry Smith const PetscScalar *xx; 22092e5835c6SStefano Zampini PetscScalar *bb,*aa; 22106e169961SBarry Smith 22116e169961SBarry Smith PetscFunctionBegin; 22122e5835c6SStefano Zampini if (!N) PetscFunctionReturn(0); 22139566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&aa)); 22146e169961SBarry Smith if (x && b) { 22159566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x,&xx)); 22169566063dSJacob Faibussowitsch PetscCall(VecGetArray(b,&bb)); 22172b40b63fSBarry Smith vecs = PETSC_TRUE; 22186e169961SBarry Smith } 22199566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n,&zeroed)); 22206e169961SBarry Smith for (i=0; i<N; i++) { 22212c71b3e2SJacob Faibussowitsch PetscCheckFalse(rows[i] < 0 || rows[i] > m,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %" PetscInt_FMT " out of range", rows[i]); 22229566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(&aa[a->i[rows[i]]],a->ilen[rows[i]])); 22232205254eSKarl Rupp 22246e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 22256e169961SBarry Smith } 22266e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 22276e169961SBarry Smith if (!zeroed[i]) { 22286e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 22294cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 22302e5835c6SStefano Zampini if (vecs) bb[i] -= aa[j]*xx[a->j[j]]; 22312e5835c6SStefano Zampini aa[j] = 0.0; 22326e169961SBarry Smith } 22336e169961SBarry Smith } 22344cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag*xx[i]; 22356e169961SBarry Smith } 
22366e169961SBarry Smith if (x && b) { 22379566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x,&xx)); 22389566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b,&bb)); 22396e169961SBarry Smith } 22409566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 22416e169961SBarry Smith if (diag != 0.0) { 22429566063dSJacob Faibussowitsch PetscCall(MatMissingDiagonal_SeqAIJ(A,&missing,&d)); 22431d5a398dSstefano_zampini if (missing) { 22441d5a398dSstefano_zampini for (i=0; i<N; i++) { 22454cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 22462c71b3e2SJacob Faibussowitsch PetscCheckFalse(a->nonew && rows[i] >= d,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")",d,rows[i]); 22479566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES)); 22481d5a398dSstefano_zampini } 22491d5a398dSstefano_zampini } else { 22506e169961SBarry Smith for (i=0; i<N; i++) { 22512e5835c6SStefano Zampini aa[a->diag[rows[i]]] = diag; 22526e169961SBarry Smith } 22536e169961SBarry Smith } 22541d5a398dSstefano_zampini } 22559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&aa)); 22569566063dSJacob Faibussowitsch PetscCall((*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY)); 22576e169961SBarry Smith PetscFunctionReturn(0); 22586e169961SBarry Smith } 22596e169961SBarry Smith 2260a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 226117ab2063SBarry Smith { 2262fff043a9SJunchao Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2263fff043a9SJunchao Zhang const PetscScalar *aa; 2264fff043a9SJunchao Zhang PetscInt *itmp; 226517ab2063SBarry Smith 22663a40ed3dSBarry Smith PetscFunctionBegin; 22679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 2268416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 22692e5835c6SStefano Zampini if (v) *v = (PetscScalar*)(aa + a->i[row]); 
227017ab2063SBarry Smith if (idx) { 2271bfeeae90SHong Zhang itmp = a->j + a->i[row]; 227226fbe8dcSKarl Rupp if (*nz) *idx = itmp; 2273f4259b30SLisandro Dalcin else *idx = NULL; 227417ab2063SBarry Smith } 22759566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 22763a40ed3dSBarry Smith PetscFunctionReturn(0); 227717ab2063SBarry Smith } 227817ab2063SBarry Smith 2279a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 228017ab2063SBarry Smith { 22813a40ed3dSBarry Smith PetscFunctionBegin; 2282cb4a9cd9SHong Zhang if (nz) *nz = 0; 22832e5835c6SStefano Zampini if (idx) *idx = NULL; 22842e5835c6SStefano Zampini if (v) *v = NULL; 22853a40ed3dSBarry Smith PetscFunctionReturn(0); 228617ab2063SBarry Smith } 228717ab2063SBarry Smith 2288dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 228917ab2063SBarry Smith { 2290416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 22912e5835c6SStefano Zampini const MatScalar *v; 229236db0b34SBarry Smith PetscReal sum = 0.0; 229397f1f81fSBarry Smith PetscInt i,j; 229417ab2063SBarry Smith 22953a40ed3dSBarry Smith PetscFunctionBegin; 22969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&v)); 229717ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2298570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2299570b7f6dSBarry Smith PetscBLASInt one = 1,nz = a->nz; 230073cf7048SBarry Smith PetscStackCallBLAS("BLASnrm2",*nrm = BLASnrm2_(&nz,v,&one)); 2301570b7f6dSBarry Smith #else 2302416022c9SBarry Smith for (i=0; i<a->nz; i++) { 230336db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 230417ab2063SBarry Smith } 23058f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2306570b7f6dSBarry Smith #endif 23079566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(2.0*a->nz)); 23083a40ed3dSBarry Smith } else if (type == NORM_1) { 230936db0b34SBarry Smith PetscReal *tmp; 231097f1f81fSBarry Smith 
PetscInt *jj = a->j; 23119566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->cmap->n+1,&tmp)); 2312064f8208SBarry Smith *nrm = 0.0; 2313416022c9SBarry Smith for (j=0; j<a->nz; j++) { 2314bfeeae90SHong Zhang tmp[*jj++] += PetscAbsScalar(*v); v++; 231517ab2063SBarry Smith } 2316d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 2317064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 231817ab2063SBarry Smith } 23199566063dSJacob Faibussowitsch PetscCall(PetscFree(tmp)); 23209566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz-1,0))); 23213a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2322064f8208SBarry Smith *nrm = 0.0; 2323d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 23242e5835c6SStefano Zampini const PetscScalar *v2 = v + a->i[j]; 232517ab2063SBarry Smith sum = 0.0; 2326416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 23272e5835c6SStefano Zampini sum += PetscAbsScalar(*v2); v2++; 232817ab2063SBarry Smith } 2329064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 233017ab2063SBarry Smith } 23319566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(PetscMax(a->nz-1,0))); 2332f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 23339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&v)); 23343a40ed3dSBarry Smith PetscFunctionReturn(0); 233517ab2063SBarry Smith } 233617ab2063SBarry Smith 23374e938277SHong Zhang /* Merged from MatGetSymbolicTranspose_SeqAIJ() - replace MatGetSymbolicTranspose_SeqAIJ()? 
*/ 23384e938277SHong Zhang PetscErrorCode MatTransposeSymbolic_SeqAIJ(Mat A,Mat *B) 23394e938277SHong Zhang { 23404e938277SHong Zhang PetscInt i,j,anzj; 23414e938277SHong Zhang Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data,*b; 23424e938277SHong Zhang PetscInt an=A->cmap->N,am=A->rmap->N; 23434e938277SHong Zhang PetscInt *ati,*atj,*atfill,*ai=a->i,*aj=a->j; 23444e938277SHong Zhang 23454e938277SHong Zhang PetscFunctionBegin; 23464e938277SHong Zhang /* Allocate space for symbolic transpose info and work array */ 23479566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(an+1,&ati)); 23489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ai[am],&atj)); 23499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(an,&atfill)); 23504e938277SHong Zhang 23514e938277SHong Zhang /* Walk through aj and count ## of non-zeros in each row of A^T. */ 23524e938277SHong Zhang /* Note: offset by 1 for fast conversion into csr format. */ 235326fbe8dcSKarl Rupp for (i=0;i<ai[am];i++) ati[aj[i]+1] += 1; 23544e938277SHong Zhang /* Form ati for csr format of A^T. */ 235526fbe8dcSKarl Rupp for (i=0;i<an;i++) ati[i+1] += ati[i]; 23564e938277SHong Zhang 23574e938277SHong Zhang /* Copy ati into atfill so we have locations of the next free space in atj */ 23589566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(atfill,ati,an)); 23594e938277SHong Zhang 23604e938277SHong Zhang /* Walk through A row-wise and mark nonzero entries of A^T. */ 23614e938277SHong Zhang for (i=0;i<am;i++) { 23624e938277SHong Zhang anzj = ai[i+1] - ai[i]; 23634e938277SHong Zhang for (j=0;j<anzj;j++) { 23644e938277SHong Zhang atj[atfill[*aj]] = i; 23654e938277SHong Zhang atfill[*aj++] += 1; 23664e938277SHong Zhang } 23674e938277SHong Zhang } 23684e938277SHong Zhang 23694e938277SHong Zhang /* Clean up temporary space and complete requests. 
*/ 23709566063dSJacob Faibussowitsch PetscCall(PetscFree(atfill)); 23719566063dSJacob Faibussowitsch PetscCall(MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),an,am,ati,atj,NULL,B)); 23729566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(*B,PetscAbs(A->cmap->bs),PetscAbs(A->rmap->bs))); 23739566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 2374a2f3521dSMark F. Adams 23754e938277SHong Zhang b = (Mat_SeqAIJ*)((*B)->data); 23764e938277SHong Zhang b->free_a = PETSC_FALSE; 23774e938277SHong Zhang b->free_ij = PETSC_TRUE; 23784e938277SHong Zhang b->nonew = 0; 23794e938277SHong Zhang PetscFunctionReturn(0); 23804e938277SHong Zhang } 23814e938277SHong Zhang 23827087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 2383cd0d46ebSvictorle { 23843d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 238554f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 23862e5835c6SStefano Zampini const MatScalar *va,*vb; 238797f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 2388cd0d46ebSvictorle 2389cd0d46ebSvictorle PetscFunctionBegin; 23909566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&ma,&na)); 23919566063dSJacob Faibussowitsch PetscCall(MatGetSize(B,&mb,&nb)); 23925485867bSBarry Smith if (ma!=nb || na!=mb) { 23935485867bSBarry Smith *f = PETSC_FALSE; 23945485867bSBarry Smith PetscFunctionReturn(0); 23955485867bSBarry Smith } 23969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&va)); 23979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&vb)); 2398cd0d46ebSvictorle aii = aij->i; bii = bij->i; 2399cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 24009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma,&aptr)); 24019566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb,&bptr)); 2402cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 2403cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 
2404cd0d46ebSvictorle 2405cd0d46ebSvictorle *f = PETSC_TRUE; 2406cd0d46ebSvictorle for (i=0; i<ma; i++) { 2407cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 240897f1f81fSBarry Smith PetscInt idc,idr; 24095485867bSBarry Smith PetscScalar vc,vr; 2410cd0d46ebSvictorle /* column/row index/value */ 24115485867bSBarry Smith idc = adx[aptr[i]]; 24125485867bSBarry Smith idr = bdx[bptr[idc]]; 24135485867bSBarry Smith vc = va[aptr[i]]; 24145485867bSBarry Smith vr = vb[bptr[idc]]; 24155485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 24165485867bSBarry Smith *f = PETSC_FALSE; 24175485867bSBarry Smith goto done; 2418cd0d46ebSvictorle } else { 24195485867bSBarry Smith aptr[i]++; 24205485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 2421cd0d46ebSvictorle } 2422cd0d46ebSvictorle } 2423cd0d46ebSvictorle } 2424cd0d46ebSvictorle done: 24259566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24269566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&va)); 24289566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&vb)); 2429cd0d46ebSvictorle PetscFunctionReturn(0); 2430cd0d46ebSvictorle } 2431cd0d46ebSvictorle 24327087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 24331cbb95d3SBarry Smith { 24343d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 243554f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 243654f21887SBarry Smith MatScalar *va,*vb; 24371cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 24381cbb95d3SBarry Smith 24391cbb95d3SBarry Smith PetscFunctionBegin; 24409566063dSJacob Faibussowitsch PetscCall(MatGetSize(A,&ma,&na)); 24419566063dSJacob Faibussowitsch PetscCall(MatGetSize(B,&mb,&nb)); 24421cbb95d3SBarry Smith if (ma!=nb || na!=mb) { 24431cbb95d3SBarry Smith *f = PETSC_FALSE; 24441cbb95d3SBarry Smith PetscFunctionReturn(0); 24451cbb95d3SBarry Smith } 
24461cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 24471cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 24481cbb95d3SBarry Smith va = aij->a; vb = bij->a; 24499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ma,&aptr)); 24509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mb,&bptr)); 24511cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 24521cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 24531cbb95d3SBarry Smith 24541cbb95d3SBarry Smith *f = PETSC_TRUE; 24551cbb95d3SBarry Smith for (i=0; i<ma; i++) { 24561cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 24571cbb95d3SBarry Smith PetscInt idc,idr; 24581cbb95d3SBarry Smith PetscScalar vc,vr; 24591cbb95d3SBarry Smith /* column/row index/value */ 24601cbb95d3SBarry Smith idc = adx[aptr[i]]; 24611cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 24621cbb95d3SBarry Smith vc = va[aptr[i]]; 24631cbb95d3SBarry Smith vr = vb[bptr[idc]]; 24641cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) > tol) { 24651cbb95d3SBarry Smith *f = PETSC_FALSE; 24661cbb95d3SBarry Smith goto done; 24671cbb95d3SBarry Smith } else { 24681cbb95d3SBarry Smith aptr[i]++; 24691cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 24701cbb95d3SBarry Smith } 24711cbb95d3SBarry Smith } 24721cbb95d3SBarry Smith } 24731cbb95d3SBarry Smith done: 24749566063dSJacob Faibussowitsch PetscCall(PetscFree(aptr)); 24759566063dSJacob Faibussowitsch PetscCall(PetscFree(bptr)); 24761cbb95d3SBarry Smith PetscFunctionReturn(0); 24771cbb95d3SBarry Smith } 24781cbb95d3SBarry Smith 2479ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 24809e29f15eSvictorle { 24819e29f15eSvictorle PetscFunctionBegin; 24829566063dSJacob Faibussowitsch PetscCall(MatIsTranspose_SeqAIJ(A,A,tol,f)); 24839e29f15eSvictorle PetscFunctionReturn(0); 24849e29f15eSvictorle } 24859e29f15eSvictorle 2486ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 24871cbb95d3SBarry Smith { 
24881cbb95d3SBarry Smith PetscFunctionBegin; 24899566063dSJacob Faibussowitsch PetscCall(MatIsHermitianTranspose_SeqAIJ(A,A,tol,f)); 24901cbb95d3SBarry Smith PetscFunctionReturn(0); 24911cbb95d3SBarry Smith } 24921cbb95d3SBarry Smith 2493dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 249417ab2063SBarry Smith { 2495416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2496fff8e43fSBarry Smith const PetscScalar *l,*r; 2497fff8e43fSBarry Smith PetscScalar x; 249854f21887SBarry Smith MatScalar *v; 2499fff8e43fSBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz; 2500fff8e43fSBarry Smith const PetscInt *jj; 250117ab2063SBarry Smith 25023a40ed3dSBarry Smith PetscFunctionBegin; 250317ab2063SBarry Smith if (ll) { 25043ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 25053ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 25069566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(ll,&m)); 25072c71b3e2SJacob Faibussowitsch PetscCheckFalse(m != A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 25089566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(ll,&l)); 25099566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&v)); 251017ab2063SBarry Smith for (i=0; i<m; i++) { 251117ab2063SBarry Smith x = l[i]; 2512416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 25132205254eSKarl Rupp for (j=0; j<M; j++) (*v++) *= x; 251417ab2063SBarry Smith } 25159566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(ll,&l)); 25169566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 25179566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&v)); 251817ab2063SBarry Smith } 251917ab2063SBarry Smith if (rr) { 25209566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(rr,&n)); 25212c71b3e2SJacob Faibussowitsch PetscCheckFalse(n != A->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 25229566063dSJacob Faibussowitsch 
PetscCall(VecGetArrayRead(rr,&r)); 25239566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&v)); 25242e5835c6SStefano Zampini jj = a->j; 25252205254eSKarl Rupp for (i=0; i<nz; i++) (*v++) *= r[*jj++]; 25269566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&v)); 25279566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(rr,&r)); 25289566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(nz)); 252917ab2063SBarry Smith } 25309566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 25313a40ed3dSBarry Smith PetscFunctionReturn(0); 253217ab2063SBarry Smith } 253317ab2063SBarry Smith 25347dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 253517ab2063SBarry Smith { 2536db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 2537d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 253897f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 25395d0c19d7SBarry Smith const PetscInt *irow,*icol; 25402e5835c6SStefano Zampini const PetscScalar *aa; 25415d0c19d7SBarry Smith PetscInt nrows,ncols; 254297f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 254354f21887SBarry Smith MatScalar *a_new,*mat_a; 2544416022c9SBarry Smith Mat C; 2545cdc6f3adSToby Isaac PetscBool stride; 254617ab2063SBarry Smith 25473a40ed3dSBarry Smith PetscFunctionBegin; 25489566063dSJacob Faibussowitsch PetscCall(ISGetIndices(isrow,&irow)); 25499566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(isrow,&nrows)); 25509566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(iscol,&ncols)); 255117ab2063SBarry Smith 25529566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&stride)); 2553ff718158SBarry Smith if (stride) { 25549566063dSJacob Faibussowitsch PetscCall(ISStrideGetInfo(iscol,&first,&step)); 2555ff718158SBarry Smith } else { 2556ff718158SBarry 
Smith first = 0; 2557ff718158SBarry Smith step = 0; 2558ff718158SBarry Smith } 2559fee21e36SBarry Smith if (stride && step == 1) { 256002834360SBarry Smith /* special case of contiguous rows */ 25619566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(nrows,&lens,nrows,&starts)); 256202834360SBarry Smith /* loop over new rows determining lens and starting points */ 256302834360SBarry Smith for (i=0; i<nrows; i++) { 2564bfeeae90SHong Zhang kstart = ai[irow[i]]; 2565a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2566a91a9bebSLisandro Dalcin starts[i] = kstart; 256702834360SBarry Smith for (k=kstart; k<kend; k++) { 2568bfeeae90SHong Zhang if (aj[k] >= first) { 256902834360SBarry Smith starts[i] = k; 257002834360SBarry Smith break; 257102834360SBarry Smith } 257202834360SBarry Smith } 2573a2744918SBarry Smith sum = 0; 257402834360SBarry Smith while (k < kend) { 2575bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2576a2744918SBarry Smith sum++; 257702834360SBarry Smith } 2578a2744918SBarry Smith lens[i] = sum; 257902834360SBarry Smith } 258002834360SBarry Smith /* create submatrix */ 2581cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 258297f1f81fSBarry Smith PetscInt n_cols,n_rows; 25839566063dSJacob Faibussowitsch PetscCall(MatGetSize(*B,&n_rows,&n_cols)); 25842c71b3e2SJacob Faibussowitsch PetscCheckFalse(n_rows != nrows || n_cols != ncols,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 25859566063dSJacob Faibussowitsch PetscCall(MatZeroEntries(*B)); 258608480c60SBarry Smith C = *B; 25873a40ed3dSBarry Smith } else { 25883bef6203SJed Brown PetscInt rbs,cbs; 25899566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),&C)); 25909566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE)); 25919566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow,&rbs)); 25929566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol,&cbs)); 25939566063dSJacob Faibussowitsch 
PetscCall(MatSetBlockSizes(C,rbs,cbs)); 25949566063dSJacob Faibussowitsch PetscCall(MatSetType(C,((PetscObject)A)->type_name)); 25959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens)); 259608480c60SBarry Smith } 2597db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2598db02288aSLois Curfman McInnes 259902834360SBarry Smith /* loop over rows inserting into submatrix */ 2600db02288aSLois Curfman McInnes a_new = c->a; 2601db02288aSLois Curfman McInnes j_new = c->j; 2602db02288aSLois Curfman McInnes i_new = c->i; 26039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 260402834360SBarry Smith for (i=0; i<nrows; i++) { 2605a2744918SBarry Smith ii = starts[i]; 2606a2744918SBarry Smith lensi = lens[i]; 2607a2744918SBarry Smith for (k=0; k<lensi; k++) { 2608a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 260902834360SBarry Smith } 26109566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a_new,aa + starts[i],lensi)); 2611a2744918SBarry Smith a_new += lensi; 2612a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2613a2744918SBarry Smith c->ilen[i] = lensi; 261402834360SBarry Smith } 26159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 26169566063dSJacob Faibussowitsch PetscCall(PetscFree2(lens,starts)); 26173a40ed3dSBarry Smith } else { 26189566063dSJacob Faibussowitsch PetscCall(ISGetIndices(iscol,&icol)); 26199566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(oldcols,&smap)); 26209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(1+nrows,&lens)); 26214dcab191SBarry Smith for (i=0; i<ncols; i++) { 26226bdcaf15SBarry Smith PetscCheck(icol[i] < oldcols,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT,i,icol[i],oldcols); 26234dcab191SBarry Smith smap[icol[i]] = i+1; 26244dcab191SBarry Smith } 26254dcab191SBarry Smith 262602834360SBarry Smith /* determine lens of each row */ 
262702834360SBarry Smith for (i=0; i<nrows; i++) { 2628bfeeae90SHong Zhang kstart = ai[irow[i]]; 262902834360SBarry Smith kend = kstart + a->ilen[irow[i]]; 263002834360SBarry Smith lens[i] = 0; 263102834360SBarry Smith for (k=kstart; k<kend; k++) { 2632bfeeae90SHong Zhang if (smap[aj[k]]) { 263302834360SBarry Smith lens[i]++; 263402834360SBarry Smith } 263502834360SBarry Smith } 263602834360SBarry Smith } 263717ab2063SBarry Smith /* Create and fill new matrix */ 2638a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2639ace3abfcSBarry Smith PetscBool equal; 26400f5bd95cSBarry Smith 264199141d43SSatish Balay c = (Mat_SeqAIJ*)((*B)->data); 26422c71b3e2SJacob Faibussowitsch PetscCheckFalse((*B)->rmap->n != nrows || (*B)->cmap->n != ncols,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 26439566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(c->ilen,lens,(*B)->rmap->n,&equal)); 264428b400f6SJacob Faibussowitsch PetscCheck(equal,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. 
wrong no of nonzeros"); 26459566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->ilen,(*B)->rmap->n)); 264608480c60SBarry Smith C = *B; 26473a40ed3dSBarry Smith } else { 26483bef6203SJed Brown PetscInt rbs,cbs; 26499566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),&C)); 26509566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE)); 26519566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(isrow,&rbs)); 26529566063dSJacob Faibussowitsch PetscCall(ISGetBlockSize(iscol,&cbs)); 26539566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizes(C,rbs,cbs)); 26549566063dSJacob Faibussowitsch PetscCall(MatSetType(C,((PetscObject)A)->type_name)); 26559566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens)); 265608480c60SBarry Smith } 26579566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 265899141d43SSatish Balay c = (Mat_SeqAIJ*)(C->data); 265917ab2063SBarry Smith for (i=0; i<nrows; i++) { 266099141d43SSatish Balay row = irow[i]; 2661bfeeae90SHong Zhang kstart = ai[row]; 266299141d43SSatish Balay kend = kstart + a->ilen[row]; 2663bfeeae90SHong Zhang mat_i = c->i[i]; 266499141d43SSatish Balay mat_j = c->j + mat_i; 266599141d43SSatish Balay mat_a = c->a + mat_i; 266699141d43SSatish Balay mat_ilen = c->ilen + i; 266717ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2668bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2669ed480e8bSBarry Smith *mat_j++ = tcol - 1; 26702e5835c6SStefano Zampini *mat_a++ = aa[k]; 267199141d43SSatish Balay (*mat_ilen)++; 267299141d43SSatish Balay 267317ab2063SBarry Smith } 267417ab2063SBarry Smith } 267517ab2063SBarry Smith } 26769566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 267702834360SBarry Smith /* Free work space */ 26789566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(iscol,&icol)); 26799566063dSJacob Faibussowitsch PetscCall(PetscFree(smap)); 26809566063dSJacob Faibussowitsch 
PetscCall(PetscFree(lens)); 2681cdc6f3adSToby Isaac /* sort */ 2682cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2683cdc6f3adSToby Isaac PetscInt ilen; 2684cdc6f3adSToby Isaac 2685cdc6f3adSToby Isaac mat_i = c->i[i]; 2686cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2687cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2688cdc6f3adSToby Isaac ilen = c->ilen[i]; 26899566063dSJacob Faibussowitsch PetscCall(PetscSortIntWithScalarArray(ilen,mat_j,mat_a)); 2690cdc6f3adSToby Isaac } 269102834360SBarry Smith } 26928c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 26939566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(C,A->boundtocpu)); 2694305c6ccfSStefano Zampini #endif 26959566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY)); 26969566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY)); 269717ab2063SBarry Smith 26989566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(isrow,&irow)); 2699416022c9SBarry Smith *B = C; 27003a40ed3dSBarry Smith PetscFunctionReturn(0); 270117ab2063SBarry Smith } 270217ab2063SBarry Smith 2703fc08c53fSHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat *subMat) 270482d44351SHong Zhang { 270582d44351SHong Zhang Mat B; 270682d44351SHong Zhang 270782d44351SHong Zhang PetscFunctionBegin; 2708c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 27099566063dSJacob Faibussowitsch PetscCall(MatCreate(subComm,&B)); 27109566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n)); 27119566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B,mat,mat)); 27129566063dSJacob Faibussowitsch PetscCall(MatSetType(B,MATSEQAIJ)); 27139566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE)); 271482d44351SHong Zhang *subMat = B; 2715c2d650bdSHong Zhang } else { 27169566063dSJacob Faibussowitsch PetscCall(MatCopy_SeqAIJ(mat,*subMat,SAME_NONZERO_PATTERN)); 
2717c2d650bdSHong Zhang } 271882d44351SHong Zhang PetscFunctionReturn(0); 271982d44351SHong Zhang } 272082d44351SHong Zhang 27219a625307SHong Zhang PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2722a871dcd8SBarry Smith { 272363b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 272463b91edcSBarry Smith Mat outA; 2725ace3abfcSBarry Smith PetscBool row_identity,col_identity; 272663b91edcSBarry Smith 27273a40ed3dSBarry Smith PetscFunctionBegin; 27282c71b3e2SJacob Faibussowitsch PetscCheckFalse(info->levels != 0,PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 27291df811f5SHong Zhang 27309566063dSJacob Faibussowitsch PetscCall(ISIdentity(row,&row_identity)); 27319566063dSJacob Faibussowitsch PetscCall(ISIdentity(col,&col_identity)); 2732a871dcd8SBarry Smith 273363b91edcSBarry Smith outA = inA; 2734d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 27359566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 27369566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype)); 27372205254eSKarl Rupp 27389566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 27399566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 27402205254eSKarl Rupp 2741c3122656SLisandro Dalcin a->row = row; 27422205254eSKarl Rupp 27439566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)col)); 27449566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 27452205254eSKarl Rupp 2746c3122656SLisandro Dalcin a->col = col; 274763b91edcSBarry Smith 274836db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 27499566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 27509566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(col,PETSC_DECIDE,&a->icol)); 27519566063dSJacob Faibussowitsch PetscCall(PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol)); 2752f0ec6fceSSatish 
Balay 275394a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 27549566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(inA->rmap->n+1,&a->solve_work)); 27559566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)inA, (inA->rmap->n+1)*sizeof(PetscScalar))); 275694a9d846SBarry Smith } 275763b91edcSBarry Smith 27589566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(inA)); 2759137fb511SHong Zhang if (row_identity && col_identity) { 27609566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info)); 2761137fb511SHong Zhang } else { 27629566063dSJacob Faibussowitsch PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info)); 2763137fb511SHong Zhang } 27643a40ed3dSBarry Smith PetscFunctionReturn(0); 2765a871dcd8SBarry Smith } 2766a871dcd8SBarry Smith 2767f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2768f0b747eeSBarry Smith { 2769f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2770dfa0f9e5SStefano Zampini PetscScalar *v; 2771c5df96a5SBarry Smith PetscBLASInt one = 1,bnz; 27723a40ed3dSBarry Smith 27733a40ed3dSBarry Smith PetscFunctionBegin; 27749566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(inA,&v)); 27759566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(a->nz,&bnz)); 2776dfa0f9e5SStefano Zampini PetscStackCallBLAS("BLASscal",BLASscal_(&bnz,&alpha,v,&one)); 27779566063dSJacob Faibussowitsch PetscCall(PetscLogFlops(a->nz)); 27789566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(inA,&v)); 27799566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(inA)); 27803a40ed3dSBarry Smith PetscFunctionReturn(0); 2781f0b747eeSBarry Smith } 2782f0b747eeSBarry Smith 2783f68bb481SHong Zhang PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 278416b64355SHong Zhang { 278516b64355SHong Zhang PetscInt i; 278616b64355SHong Zhang 278716b64355SHong Zhang PetscFunctionBegin; 
278816b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 27899566063dSJacob Faibussowitsch PetscCall(PetscFree4(submatj->sbuf1,submatj->ptr,submatj->tmp,submatj->ctr)); 279016b64355SHong Zhang 279116b64355SHong Zhang for (i=0; i<submatj->nrqr; ++i) { 27929566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->sbuf2[i])); 279316b64355SHong Zhang } 27949566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->sbuf2,submatj->req_size,submatj->req_source1)); 279516b64355SHong Zhang 279616b64355SHong Zhang if (submatj->rbuf1) { 27979566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1[0])); 27989566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf1)); 279916b64355SHong Zhang } 280016b64355SHong Zhang 280116b64355SHong Zhang for (i=0; i<submatj->nrqs; ++i) { 28029566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rbuf3[i])); 280316b64355SHong Zhang } 28049566063dSJacob Faibussowitsch PetscCall(PetscFree3(submatj->req_source2,submatj->rbuf2,submatj->rbuf3)); 28059566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->pa)); 280616b64355SHong Zhang } 280716b64355SHong Zhang 280816b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 28099566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable*)&submatj->rmap)); 28109566063dSJacob Faibussowitsch if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc)); 28119566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap_loc)); 281216b64355SHong Zhang #else 28139566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->rmap)); 281416b64355SHong Zhang #endif 281516b64355SHong Zhang 281616b64355SHong Zhang if (!submatj->allcolumns) { 281716b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 28189566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy((PetscTable*)&submatj->cmap)); 281916b64355SHong Zhang #else 28209566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->cmap)); 282116b64355SHong Zhang #endif 282216b64355SHong Zhang } 
28239566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj->row2proc)); 282416b64355SHong Zhang 28259566063dSJacob Faibussowitsch PetscCall(PetscFree(submatj)); 282616b64355SHong Zhang PetscFunctionReturn(0); 282716b64355SHong Zhang } 282816b64355SHong Zhang 28290fb991dcSHong Zhang PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 283016b64355SHong Zhang { 283116b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data; 28325c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 283316b64355SHong Zhang 283416b64355SHong Zhang PetscFunctionBegin; 28359566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28369566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 283716b64355SHong Zhang PetscFunctionReturn(0); 283816b64355SHong Zhang } 283916b64355SHong Zhang 28402d033e1fSHong Zhang PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat *mat[]) 28412d033e1fSHong Zhang { 28422d033e1fSHong Zhang PetscInt i; 28430fb991dcSHong Zhang Mat C; 28440fb991dcSHong Zhang Mat_SeqAIJ *c; 28450fb991dcSHong Zhang Mat_SubSppt *submatj; 28462d033e1fSHong Zhang 28472d033e1fSHong Zhang PetscFunctionBegin; 28482d033e1fSHong Zhang for (i=0; i<n; i++) { 28490fb991dcSHong Zhang C = (*mat)[i]; 28500fb991dcSHong Zhang c = (Mat_SeqAIJ*)C->data; 28510fb991dcSHong Zhang submatj = c->submatis1; 28522d033e1fSHong Zhang if (submatj) { 2853682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 28549566063dSJacob Faibussowitsch PetscCall((*submatj->destroy)(C)); 28559566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrix_Private(submatj)); 28569566063dSJacob Faibussowitsch PetscCall(PetscFree(C->defaultvectype)); 28579566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->rmap)); 28589566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&C->cmap)); 28599566063dSJacob Faibussowitsch PetscCall(PetscHeaderDestroy(&C)); 2860682e4c99SStefano Zampini } 28612d033e1fSHong Zhang } else { 28629566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 
28632d033e1fSHong Zhang } 28642d033e1fSHong Zhang } 286586e85357SHong Zhang 286663a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 28679566063dSJacob Faibussowitsch PetscCall(MatDestroySubMatrices_Dummy(n,mat)); 286863a75b2aSHong Zhang 28699566063dSJacob Faibussowitsch PetscCall(PetscFree(*mat)); 28702d033e1fSHong Zhang PetscFunctionReturn(0); 28712d033e1fSHong Zhang } 28722d033e1fSHong Zhang 28737dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2874cddf8d76SBarry Smith { 287597f1f81fSBarry Smith PetscInt i; 2876cddf8d76SBarry Smith 28773a40ed3dSBarry Smith PetscFunctionBegin; 2878cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 28799566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(n+1,B)); 2880cddf8d76SBarry Smith } 2881cddf8d76SBarry Smith 2882cddf8d76SBarry Smith for (i=0; i<n; i++) { 28839566063dSJacob Faibussowitsch PetscCall(MatCreateSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i])); 2884cddf8d76SBarry Smith } 28853a40ed3dSBarry Smith PetscFunctionReturn(0); 2886cddf8d76SBarry Smith } 2887cddf8d76SBarry Smith 288897f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 28894dcbc457SBarry Smith { 2890e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 28915d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 28925d0c19d7SBarry Smith const PetscInt *idx; 289397f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2894f1af5d2fSBarry Smith PetscBT table; 2895bbd702dbSSatish Balay 28963a40ed3dSBarry Smith PetscFunctionBegin; 2897d0f46423SBarry Smith m = A->rmap->n; 2898e4d965acSSatish Balay ai = a->i; 2899bfeeae90SHong Zhang aj = a->j; 29008a047759SSatish Balay 29012c71b3e2SJacob Faibussowitsch PetscCheckFalse(ov < 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 290206763907SSatish Balay 29039566063dSJacob Faibussowitsch 
PetscCall(PetscMalloc1(m+1,&nidx)); 29049566063dSJacob Faibussowitsch PetscCall(PetscBTCreate(m,&table)); 290506763907SSatish Balay 2906e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2907b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2908e4d965acSSatish Balay isz = 0; 29099566063dSJacob Faibussowitsch PetscCall(PetscBTMemzero(m,table)); 2910e4d965acSSatish Balay 2911e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 29129566063dSJacob Faibussowitsch PetscCall(ISGetIndices(is[i],&idx)); 29139566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(is[i],&n)); 2914e4d965acSSatish Balay 2915dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */ 2916e4d965acSSatish Balay for (j=0; j<n; ++j) { 29172205254eSKarl Rupp if (!PetscBTLookupSet(table,idx[j])) nidx[isz++] = idx[j]; 29184dcbc457SBarry Smith } 29199566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(is[i],&idx)); 29209566063dSJacob Faibussowitsch PetscCall(ISDestroy(&is[i])); 2921e4d965acSSatish Balay 292204a348a9SBarry Smith k = 0; 292304a348a9SBarry Smith for (j=0; j<ov; j++) { /* for each overlap */ 292404a348a9SBarry Smith n = isz; 292506763907SSatish Balay for (; k<n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2926e4d965acSSatish Balay row = nidx[k]; 2927e4d965acSSatish Balay start = ai[row]; 2928e4d965acSSatish Balay end = ai[row+1]; 292904a348a9SBarry Smith for (l = start; l<end; l++) { 2930efb16452SHong Zhang val = aj[l]; 29312205254eSKarl Rupp if (!PetscBTLookupSet(table,val)) nidx[isz++] = val; 2932e4d965acSSatish Balay } 2933e4d965acSSatish Balay } 2934e4d965acSSatish Balay } 29359566063dSJacob Faibussowitsch PetscCall(ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i))); 2936e4d965acSSatish Balay } 29379566063dSJacob Faibussowitsch PetscCall(PetscBTDestroy(&table)); 29389566063dSJacob Faibussowitsch PetscCall(PetscFree(nidx)); 
29393a40ed3dSBarry Smith PetscFunctionReturn(0); 29404dcbc457SBarry Smith } 294117ab2063SBarry Smith 29420513a670SBarry Smith /* -------------------------------------------------------------- */ 2943dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 29440513a670SBarry Smith { 29450513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29463b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 29475d0c19d7SBarry Smith const PetscInt *row,*col; 29485d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 294956cd22aeSBarry Smith IS icolp,irowp; 29500298fd71SBarry Smith PetscInt *cwork = NULL; 29510298fd71SBarry Smith PetscScalar *vwork = NULL; 29520513a670SBarry Smith 29533a40ed3dSBarry Smith PetscFunctionBegin; 29549566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(rowp,PETSC_DECIDE,&irowp)); 29559566063dSJacob Faibussowitsch PetscCall(ISGetIndices(irowp,&row)); 29569566063dSJacob Faibussowitsch PetscCall(ISInvertPermutation(colp,PETSC_DECIDE,&icolp)); 29579566063dSJacob Faibussowitsch PetscCall(ISGetIndices(icolp,&col)); 29580513a670SBarry Smith 29590513a670SBarry Smith /* determine lengths of permuted rows */ 29609566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&lens)); 29612205254eSKarl Rupp for (i=0; i<m; i++) lens[row[i]] = a->i[i+1] - a->i[i]; 29629566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),B)); 29639566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B,m,n,m,n)); 29649566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B,A,A)); 29659566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 29669566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens)); 29679566063dSJacob Faibussowitsch PetscCall(PetscFree(lens)); 29680513a670SBarry Smith 29699566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(n,&cnew)); 29700513a670SBarry Smith for (i=0; i<m; i++) { 29719566063dSJacob Faibussowitsch 
PetscCall(MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork)); 29722205254eSKarl Rupp for (j=0; j<nz; j++) cnew[j] = col[cwork[j]]; 29739566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES)); 29749566063dSJacob Faibussowitsch PetscCall(MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork)); 29750513a670SBarry Smith } 29769566063dSJacob Faibussowitsch PetscCall(PetscFree(cnew)); 29772205254eSKarl Rupp 29783c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 29792205254eSKarl Rupp 29808c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE) 29819566063dSJacob Faibussowitsch PetscCall(MatBindToCPU(*B,A->boundtocpu)); 29829fe5e383SStefano Zampini #endif 29839566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY)); 29849566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY)); 29859566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(irowp,&row)); 29869566063dSJacob Faibussowitsch PetscCall(ISRestoreIndices(icolp,&col)); 29879566063dSJacob Faibussowitsch PetscCall(ISDestroy(&irowp)); 29889566063dSJacob Faibussowitsch PetscCall(ISDestroy(&icolp)); 29896768869dSprj- if (rowp == colp) { 29909566063dSJacob Faibussowitsch PetscCall(MatPropagateSymmetryOptions(A,*B)); 29916768869dSprj- } 29923a40ed3dSBarry Smith PetscFunctionReturn(0); 29930513a670SBarry Smith } 29940513a670SBarry Smith 2995dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 2996cb5b572fSBarry Smith { 2997cb5b572fSBarry Smith PetscFunctionBegin; 299833f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 299933f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 3000be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3001be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 30022e5835c6SStefano Zampini const PetscScalar *aa; 3003be6bf707SBarry Smith 30049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 30052c71b3e2SJacob Faibussowitsch PetscCheckFalse(a->i[A->rmap->n] != b->i[B->rmap->n],PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT,a->i[A->rmap->n],b->i[B->rmap->n]); 30069566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a,aa,a->i[A->rmap->n])); 30079566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 30089566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 3009cb5b572fSBarry Smith } else { 30109566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A,B,str)); 3011cb5b572fSBarry Smith } 3012cb5b572fSBarry Smith PetscFunctionReturn(0); 3013cb5b572fSBarry Smith } 3014cb5b572fSBarry Smith 30154994cf47SJed Brown PetscErrorCode MatSetUp_SeqAIJ(Mat A) 3016273d9f13SBarry Smith { 3017273d9f13SBarry Smith PetscFunctionBegin; 30189566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,NULL)); 3019273d9f13SBarry Smith PetscFunctionReturn(0); 3020273d9f13SBarry Smith } 3021273d9f13SBarry Smith 3022f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 30236c0721eeSBarry Smith { 30246c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 30256e111a19SKarl Rupp 30266c0721eeSBarry Smith PetscFunctionBegin; 30276c0721eeSBarry Smith *array = a->a; 30286c0721eeSBarry Smith PetscFunctionReturn(0); 30296c0721eeSBarry Smith } 30306c0721eeSBarry Smith 3031f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 30326c0721eeSBarry Smith { 
30336c0721eeSBarry Smith PetscFunctionBegin; 3034f38c1e66SStefano Zampini *array = NULL; 30356c0721eeSBarry Smith PetscFunctionReturn(0); 30366c0721eeSBarry Smith } 3037273d9f13SBarry Smith 30388229c054SShri Abhyankar /* 30398229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 30408229c054SShri Abhyankar have different nonzero structure. 30418229c054SShri Abhyankar */ 3042b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt *xi,const PetscInt *xj,const PetscInt *yi,const PetscInt *yj,PetscInt *nnz) 3043ec7775f6SShri Abhyankar { 3044b264fe52SHong Zhang PetscInt i,j,k,nzx,nzy; 3045ec7775f6SShri Abhyankar 3046ec7775f6SShri Abhyankar PetscFunctionBegin; 3047ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 3048ec7775f6SShri Abhyankar for (i=0; i<m; i++) { 3049b264fe52SHong Zhang const PetscInt *xjj = xj+xi[i],*yjj = yj+yi[i]; 3050b264fe52SHong Zhang nzx = xi[i+1] - xi[i]; 3051b264fe52SHong Zhang nzy = yi[i+1] - yi[i]; 30528af7cee1SJed Brown nnz[i] = 0; 30538af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 3054b264fe52SHong Zhang for (; k<nzy && yjj[k]<xjj[j]; k++) nnz[i]++; /* Catch up to X */ 3055b264fe52SHong Zhang if (k<nzy && yjj[k]==xjj[j]) k++; /* Skip duplicate */ 30568af7cee1SJed Brown nnz[i]++; 30578af7cee1SJed Brown } 30588af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 3059ec7775f6SShri Abhyankar } 3060ec7775f6SShri Abhyankar PetscFunctionReturn(0); 3061ec7775f6SShri Abhyankar } 3062ec7775f6SShri Abhyankar 3063b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt *nnz) 3064b264fe52SHong Zhang { 3065b264fe52SHong Zhang PetscInt m = Y->rmap->N; 3066b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 3067b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 3068b264fe52SHong Zhang 3069b264fe52SHong Zhang PetscFunctionBegin; 3070b264fe52SHong Zhang /* Set the number of nonzeros in the new 
matrix */ 30719566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(m,x->i,x->j,y->i,y->j,nnz)); 3072b264fe52SHong Zhang PetscFunctionReturn(0); 3073b264fe52SHong Zhang } 3074b264fe52SHong Zhang 3075f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 3076ac90fabeSBarry Smith { 3077ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data,*y = (Mat_SeqAIJ*)Y->data; 3078ac90fabeSBarry Smith 3079ac90fabeSBarry Smith PetscFunctionBegin; 3080134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 3081134adf20SPierre Jolivet PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE; 3082134adf20SPierre Jolivet if (e) { 30839566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i,y->i,Y->rmap->n+1,&e)); 308481fa06acSBarry Smith if (e) { 30859566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j,y->j,y->nz,&e)); 3086134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 308781fa06acSBarry Smith } 308881fa06acSBarry Smith } 308954c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"MatStructure is not SAME_NONZERO_PATTERN"); 309081fa06acSBarry Smith } 3091ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 30922e5835c6SStefano Zampini const PetscScalar *xa; 30932e5835c6SStefano Zampini PetscScalar *ya,alpha = a; 309481fa06acSBarry Smith PetscBLASInt one = 1,bnz; 309581fa06acSBarry Smith 30969566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz,&bnz)); 30979566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(Y,&ya)); 30989566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(X,&xa)); 30992e5835c6SStefano Zampini PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,xa,&one,ya,&one)); 31009566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(X,&xa)); 31019566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(Y,&ya)); 31029566063dSJacob 
Faibussowitsch PetscCall(PetscLogFlops(2.0*bnz)); 31039566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(Y)); 31049566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 3105ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 31069566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y,a,X,str)); 3107ac90fabeSBarry Smith } else { 31088229c054SShri Abhyankar Mat B; 31098229c054SShri Abhyankar PetscInt *nnz; 31109566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N,&nnz)); 31119566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y),&B)); 31129566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name)); 31139566063dSJacob Faibussowitsch PetscCall(MatSetLayouts(B,Y->rmap,Y->cmap)); 31149566063dSJacob Faibussowitsch PetscCall(MatSetType(B,((PetscObject)Y)->type_name)); 31159566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz)); 31169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B,0,nnz)); 31179566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B,Y,a,X,str)); 31189566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y,&B)); 31199566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 3120ac90fabeSBarry Smith } 3121ac90fabeSBarry Smith PetscFunctionReturn(0); 3122ac90fabeSBarry Smith } 3123ac90fabeSBarry Smith 31242726fb6dSPierre Jolivet PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3125354c94deSBarry Smith { 3126354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3127354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3128354c94deSBarry Smith PetscInt i,nz; 3129354c94deSBarry Smith PetscScalar *a; 3130354c94deSBarry Smith 3131354c94deSBarry Smith PetscFunctionBegin; 3132354c94deSBarry Smith nz = aij->nz; 31339566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(mat,&a)); 31342205254eSKarl Rupp for (i=0; i<nz; i++) 
a[i] = PetscConj(a[i]); 31359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(mat,&a)); 3136354c94deSBarry Smith #else 3137354c94deSBarry Smith PetscFunctionBegin; 3138354c94deSBarry Smith #endif 3139354c94deSBarry Smith PetscFunctionReturn(0); 3140354c94deSBarry Smith } 3141354c94deSBarry Smith 3142985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3143e34fafa9SBarry Smith { 3144e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3145d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3146e34fafa9SBarry Smith PetscReal atmp; 3147985db425SBarry Smith PetscScalar *x; 3148ce496241SStefano Zampini const MatScalar *aa,*av; 3149e34fafa9SBarry Smith 3150e34fafa9SBarry Smith PetscFunctionBegin; 315128b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 31529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3153ce496241SStefano Zampini aa = av; 3154e34fafa9SBarry Smith ai = a->i; 3155e34fafa9SBarry Smith aj = a->j; 3156e34fafa9SBarry Smith 31579566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 31589566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 31599566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 31602c71b3e2SJacob Faibussowitsch PetscCheckFalse(n != A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3161e34fafa9SBarry Smith for (i=0; i<m; i++) { 3162e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 3163e34fafa9SBarry Smith for (j=0; j<ncols; j++) { 3164985db425SBarry Smith atmp = PetscAbsScalar(*aa); 3165985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3166985db425SBarry Smith aa++; aj++; 3167985db425SBarry Smith } 3168985db425SBarry Smith } 31699566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 31709566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 
3171985db425SBarry Smith PetscFunctionReturn(0); 3172985db425SBarry Smith } 3173985db425SBarry Smith 3174985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3175985db425SBarry Smith { 3176985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3177d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3178985db425SBarry Smith PetscScalar *x; 3179ce496241SStefano Zampini const MatScalar *aa,*av; 3180985db425SBarry Smith 3181985db425SBarry Smith PetscFunctionBegin; 318228b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 31839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3184ce496241SStefano Zampini aa = av; 3185985db425SBarry Smith ai = a->i; 3186985db425SBarry Smith aj = a->j; 3187985db425SBarry Smith 31889566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 31899566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 31909566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 31912c71b3e2SJacob Faibussowitsch PetscCheckFalse(n != A->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3192985db425SBarry Smith for (i=0; i<m; i++) { 3193985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3194d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3195985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3196985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3197985db425SBarry Smith x[i] = 0.0; 3198985db425SBarry Smith if (idx) { 3199985db425SBarry Smith for (j=0; j<ncols; j++) { /* find first implicit 0.0 in the row */ 3200985db425SBarry Smith if (aj[j] > j) { 3201985db425SBarry Smith idx[i] = j; 3202985db425SBarry Smith break; 3203985db425SBarry Smith } 3204985db425SBarry Smith } 32051a254869SHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 32061a254869SHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = 
j; 3207985db425SBarry Smith } 3208985db425SBarry Smith } 3209985db425SBarry Smith for (j=0; j<ncols; j++) { 3210985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3211985db425SBarry Smith aa++; aj++; 3212985db425SBarry Smith } 3213985db425SBarry Smith } 32149566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 32159566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3216985db425SBarry Smith PetscFunctionReturn(0); 3217985db425SBarry Smith } 3218985db425SBarry Smith 3219c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3220c87e5d42SMatthew Knepley { 3221c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3222c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3223ce496241SStefano Zampini PetscScalar *x; 3224ce496241SStefano Zampini const MatScalar *aa,*av; 3225c87e5d42SMatthew Knepley 3226c87e5d42SMatthew Knepley PetscFunctionBegin; 32279566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3228ce496241SStefano Zampini aa = av; 3229c87e5d42SMatthew Knepley ai = a->i; 3230c87e5d42SMatthew Knepley aj = a->j; 3231c87e5d42SMatthew Knepley 32329566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32339566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32349566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 32352c71b3e2SJacob Faibussowitsch PetscCheckFalse(n != m,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector, %" PetscInt_FMT " vs. 
%" PetscInt_FMT " rows", m, n); 3236c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 3237c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 3238f07e67edSHong Zhang if (ncols == A->cmap->n) { /* row is dense */ 3239f07e67edSHong Zhang x[i] = *aa; if (idx) idx[i] = 0; 3240f07e67edSHong Zhang } else { /* row is sparse so already KNOW minimum is 0.0 or higher */ 3241f07e67edSHong Zhang x[i] = 0.0; 3242f07e67edSHong Zhang if (idx) { /* find first implicit 0.0 in the row */ 3243289a08f5SMatthew Knepley for (j=0; j<ncols; j++) { 3244f07e67edSHong Zhang if (aj[j] > j) { 3245f07e67edSHong Zhang idx[i] = j; 32462205254eSKarl Rupp break; 32472205254eSKarl Rupp } 3248289a08f5SMatthew Knepley } 3249f07e67edSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3250f07e67edSHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3251f07e67edSHong Zhang } 3252289a08f5SMatthew Knepley } 3253c87e5d42SMatthew Knepley for (j=0; j<ncols; j++) { 3254f07e67edSHong Zhang if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3255c87e5d42SMatthew Knepley aa++; aj++; 3256c87e5d42SMatthew Knepley } 3257c87e5d42SMatthew Knepley } 32589566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 32599566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3260c87e5d42SMatthew Knepley PetscFunctionReturn(0); 3261c87e5d42SMatthew Knepley } 3262c87e5d42SMatthew Knepley 3263985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3264985db425SBarry Smith { 3265985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3266d9ca1df4SBarry Smith PetscInt i,j,m = A->rmap->n,ncols,n; 3267d9ca1df4SBarry Smith const PetscInt *ai,*aj; 3268985db425SBarry Smith PetscScalar *x; 3269ce496241SStefano Zampini const MatScalar *aa,*av; 3270985db425SBarry Smith 3271985db425SBarry Smith PetscFunctionBegin; 327228b400f6SJacob Faibussowitsch 
PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 32739566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&av)); 3274ce496241SStefano Zampini aa = av; 3275985db425SBarry Smith ai = a->i; 3276985db425SBarry Smith aj = a->j; 3277985db425SBarry Smith 32789566063dSJacob Faibussowitsch PetscCall(VecSet(v,0.0)); 32799566063dSJacob Faibussowitsch PetscCall(VecGetArrayWrite(v,&x)); 32809566063dSJacob Faibussowitsch PetscCall(VecGetLocalSize(v,&n)); 32812c71b3e2SJacob Faibussowitsch PetscCheckFalse(n != m,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3282985db425SBarry Smith for (i=0; i<m; i++) { 3283985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3284d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3285985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3286985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3287985db425SBarry Smith x[i] = 0.0; 3288985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3289985db425SBarry Smith for (j=0; j<ncols; j++) { 3290985db425SBarry Smith if (aj[j] > j) { 3291985db425SBarry Smith idx[i] = j; 3292985db425SBarry Smith break; 3293985db425SBarry Smith } 3294985db425SBarry Smith } 3295fa213d2fSHong Zhang /* in case first implicit 0.0 in the row occurs at ncols-th column */ 3296fa213d2fSHong Zhang if (j==ncols && j < A->cmap->n) idx[i] = j; 3297985db425SBarry Smith } 3298985db425SBarry Smith } 3299985db425SBarry Smith for (j=0; j<ncols; j++) { 3300985db425SBarry Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3301985db425SBarry Smith aa++; aj++; 3302e34fafa9SBarry Smith } 3303e34fafa9SBarry Smith } 33049566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayWrite(v,&x)); 33059566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&av)); 3306e34fafa9SBarry Smith PetscFunctionReturn(0); 3307e34fafa9SBarry Smith } 3308bbead8a2SBarry 
Smith 3309713ccfa9SJed Brown PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar **values) 3310bbead8a2SBarry Smith { 3311bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 331233d57670SJed Brown PetscInt i,bs = PetscAbs(A->rmap->bs),mbs = A->rmap->n/bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 3313bbead8a2SBarry Smith MatScalar *diag,work[25],*v_work; 33140da83c2eSBarry Smith const PetscReal shift = 0.0; 33151a9391e3SHong Zhang PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 3316bbead8a2SBarry Smith 3317bbead8a2SBarry Smith PetscFunctionBegin; 3318a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 33194a0d0026SBarry Smith if (a->ibdiagvalid) { 33204a0d0026SBarry Smith if (values) *values = a->ibdiag; 33214a0d0026SBarry Smith PetscFunctionReturn(0); 33224a0d0026SBarry Smith } 33239566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqAIJ(A)); 3324bbead8a2SBarry Smith if (!a->ibdiag) { 33259566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2*mbs,&a->ibdiag)); 33269566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)A,bs2*mbs*sizeof(PetscScalar))); 3327bbead8a2SBarry Smith } 3328bbead8a2SBarry Smith diag = a->ibdiag; 3329bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3330bbead8a2SBarry Smith /* factor and invert each block */ 3331bbead8a2SBarry Smith switch (bs) { 3332bbead8a2SBarry Smith case 1: 3333bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 33349566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,1,&i,1,&i,diag+i)); 3335ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) { 3336ec1892c8SHong Zhang if (allowzeropivot) { 33377b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33387b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 33397b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 33409566063dSJacob Faibussowitsch PetscCall(PetscInfo(A,"Zero pivot, row %" PetscInt_FMT " pivot %g tolerance 
%g\n",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON)); 334198921bdaSJacob Faibussowitsch } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON); 3342ec1892c8SHong Zhang } 3343bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3344bbead8a2SBarry Smith } 3345bbead8a2SBarry Smith break; 3346bbead8a2SBarry Smith case 2: 3347bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3348bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 33499566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,2,ij,2,ij,diag)); 33509566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected)); 33517b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33529566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_2(diag)); 3353bbead8a2SBarry Smith diag += 4; 3354bbead8a2SBarry Smith } 3355bbead8a2SBarry Smith break; 3356bbead8a2SBarry Smith case 3: 3357bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3358bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 33599566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,3,ij,3,ij,diag)); 33609566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected)); 33617b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33629566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_3(diag)); 3363bbead8a2SBarry Smith diag += 9; 3364bbead8a2SBarry Smith } 3365bbead8a2SBarry Smith break; 3366bbead8a2SBarry Smith case 4: 3367bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3368bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 33699566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,4,ij,4,ij,diag)); 33709566063dSJacob Faibussowitsch 
PetscCall(PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected)); 33717b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33729566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_4(diag)); 3373bbead8a2SBarry Smith diag += 16; 3374bbead8a2SBarry Smith } 3375bbead8a2SBarry Smith break; 3376bbead8a2SBarry Smith case 5: 3377bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3378bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 33799566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,5,ij,5,ij,diag)); 33809566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected)); 33817b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33829566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_5(diag)); 3383bbead8a2SBarry Smith diag += 25; 3384bbead8a2SBarry Smith } 3385bbead8a2SBarry Smith break; 3386bbead8a2SBarry Smith case 6: 3387bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3388bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 33899566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,6,ij,6,ij,diag)); 33909566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected)); 33917b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 33929566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_6(diag)); 3393bbead8a2SBarry Smith diag += 36; 3394bbead8a2SBarry Smith } 3395bbead8a2SBarry Smith break; 3396bbead8a2SBarry Smith case 7: 3397bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3398bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 33999566063dSJacob Faibussowitsch 
PetscCall(MatGetValues(A,7,ij,7,ij,diag)); 34009566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected)); 34017b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34029566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_7(diag)); 3403bbead8a2SBarry Smith diag += 49; 3404bbead8a2SBarry Smith } 3405bbead8a2SBarry Smith break; 3406bbead8a2SBarry Smith default: 34079566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs,&v_work,bs,&v_pivots,bs,&IJ)); 3408bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3409bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3410bbead8a2SBarry Smith IJ[j] = bs*i + j; 3411bbead8a2SBarry Smith } 34129566063dSJacob Faibussowitsch PetscCall(MatGetValues(A,bs,IJ,bs,IJ,diag)); 34139566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_inverse_A(bs,diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected)); 34147b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 34159566063dSJacob Faibussowitsch PetscCall(PetscKernel_A_gets_transpose_A_N(diag,bs)); 3416bbead8a2SBarry Smith diag += bs2; 3417bbead8a2SBarry Smith } 34189566063dSJacob Faibussowitsch PetscCall(PetscFree3(v_work,v_pivots,IJ)); 3419bbead8a2SBarry Smith } 3420bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3421bbead8a2SBarry Smith PetscFunctionReturn(0); 3422bbead8a2SBarry Smith } 3423bbead8a2SBarry Smith 342473a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx) 342573a71a0fSBarry Smith { 342673a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3427fff043a9SJunchao Zhang PetscScalar a,*aa; 342873a71a0fSBarry Smith PetscInt m,n,i,j,col; 342973a71a0fSBarry Smith 343073a71a0fSBarry Smith PetscFunctionBegin; 343173a71a0fSBarry Smith if (!x->assembled) { 34329566063dSJacob Faibussowitsch PetscCall(MatGetSize(x,&m,&n)); 343373a71a0fSBarry Smith for (i=0; i<m; i++) { 343473a71a0fSBarry Smith for 
(j=0; j<aij->imax[i]; j++) { 34359566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx,&a)); 343673a71a0fSBarry Smith col = (PetscInt)(n*PetscRealPart(a)); 34379566063dSJacob Faibussowitsch PetscCall(MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES)); 343873a71a0fSBarry Smith } 343973a71a0fSBarry Smith } 3440e2ce353bSJunchao Zhang } else { 34419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayWrite(x,&aa)); 34429566063dSJacob Faibussowitsch for (i=0; i<aij->nz; i++) PetscCall(PetscRandomGetValue(rctx,aa+i)); 34439566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayWrite(x,&aa)); 3444e2ce353bSJunchao Zhang } 34459566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY)); 34469566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY)); 344773a71a0fSBarry Smith PetscFunctionReturn(0); 344873a71a0fSBarry Smith } 344973a71a0fSBarry Smith 3450679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3451679944adSJunchao Zhang PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx) 3452679944adSJunchao Zhang { 3453679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3454679944adSJunchao Zhang PetscScalar a; 3455679944adSJunchao Zhang PetscInt m,n,i,j,col,nskip; 3456679944adSJunchao Zhang 3457679944adSJunchao Zhang PetscFunctionBegin; 3458679944adSJunchao Zhang nskip = high - low; 34599566063dSJacob Faibussowitsch PetscCall(MatGetSize(x,&m,&n)); 3460679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3461679944adSJunchao Zhang for (i=0; i<m; i++) { 3462679944adSJunchao Zhang for (j=0; j<aij->imax[i]; j++) { 34639566063dSJacob Faibussowitsch PetscCall(PetscRandomGetValue(rctx,&a)); 3464679944adSJunchao Zhang col = (PetscInt)(n*PetscRealPart(a)); 3465679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 34669566063dSJacob 
Faibussowitsch PetscCall(MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES)); 3467679944adSJunchao Zhang } 3468e2ce353bSJunchao Zhang } 34699566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY)); 34709566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY)); 3471679944adSJunchao Zhang PetscFunctionReturn(0); 3472679944adSJunchao Zhang } 3473679944adSJunchao Zhang 3474682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 34750a6ffc59SBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqAIJ, 3476cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3477cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3478cb5b572fSBarry Smith MatMult_SeqAIJ, 347997304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 34807c922b88SBarry Smith MatMultTranspose_SeqAIJ, 34817c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3482f4259b30SLisandro Dalcin NULL, 3483f4259b30SLisandro Dalcin NULL, 3484f4259b30SLisandro Dalcin NULL, 3485f4259b30SLisandro Dalcin /* 10*/ NULL, 3486cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3487f4259b30SLisandro Dalcin NULL, 348841f059aeSBarry Smith MatSOR_SeqAIJ, 348991e9d3e2SHong Zhang MatTranspose_SeqAIJ, 349097304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3491cb5b572fSBarry Smith MatEqual_SeqAIJ, 3492cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3493cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3494cb5b572fSBarry Smith MatNorm_SeqAIJ, 3495f4259b30SLisandro Dalcin /* 20*/ NULL, 3496cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3497cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3498cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3499d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 3500f4259b30SLisandro Dalcin NULL, 3501f4259b30SLisandro Dalcin NULL, 3502f4259b30SLisandro Dalcin NULL, 3503f4259b30SLisandro Dalcin NULL, 35044994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3505f4259b30SLisandro Dalcin NULL, 3506f4259b30SLisandro Dalcin NULL, 3507f4259b30SLisandro Dalcin NULL, 3508f4259b30SLisandro Dalcin NULL, 
3509d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3510f4259b30SLisandro Dalcin NULL, 3511f4259b30SLisandro Dalcin NULL, 3512cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3513f4259b30SLisandro Dalcin NULL, 3514d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 35157dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3516cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3517cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3518cb5b572fSBarry Smith MatCopy_SeqAIJ, 3519d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3520cb5b572fSBarry Smith MatScale_SeqAIJ, 35217d68702bSBarry Smith MatShift_SeqAIJ, 352279299369SBarry Smith MatDiagonalSet_SeqAIJ, 35236e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 352473a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 35253b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 35263b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 35273b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3528a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 352993dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3530f4259b30SLisandro Dalcin NULL, 3531f4259b30SLisandro Dalcin NULL, 3532cda55fadSBarry Smith MatPermute_SeqAIJ, 3533f4259b30SLisandro Dalcin NULL, 3534f4259b30SLisandro Dalcin /* 59*/ NULL, 3535b9b97703SBarry Smith MatDestroy_SeqAIJ, 3536b9b97703SBarry Smith MatView_SeqAIJ, 3537f4259b30SLisandro Dalcin NULL, 3538f4259b30SLisandro Dalcin NULL, 3539f4259b30SLisandro Dalcin /* 64*/ NULL, 3540321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3541f4259b30SLisandro Dalcin NULL, 3542f4259b30SLisandro Dalcin NULL, 3543f4259b30SLisandro Dalcin NULL, 3544d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3545c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3546f4259b30SLisandro Dalcin NULL, 3547f4259b30SLisandro Dalcin NULL, 3548f4259b30SLisandro Dalcin NULL, 3549f4259b30SLisandro Dalcin /* 74*/ NULL, 35503acb8795SBarry Smith MatFDColoringApply_AIJ, 3551f4259b30SLisandro Dalcin NULL, 3552f4259b30SLisandro Dalcin NULL, 3553f4259b30SLisandro Dalcin NULL, 
35546ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 3555f4259b30SLisandro Dalcin NULL, 3556f4259b30SLisandro Dalcin NULL, 3557f4259b30SLisandro Dalcin NULL, 3558bc011b1eSHong Zhang MatLoad_SeqAIJ, 3559d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 35601cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 3561f4259b30SLisandro Dalcin NULL, 3562f4259b30SLisandro Dalcin NULL, 3563f4259b30SLisandro Dalcin NULL, 3564f4259b30SLisandro Dalcin /* 89*/ NULL, 3565f4259b30SLisandro Dalcin NULL, 356626be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 3567f4259b30SLisandro Dalcin NULL, 3568f4259b30SLisandro Dalcin NULL, 35698fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 3570f4259b30SLisandro Dalcin NULL, 3571f4259b30SLisandro Dalcin NULL, 35726fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 3573f4259b30SLisandro Dalcin NULL, 35744222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3575f4259b30SLisandro Dalcin NULL, 3576f4259b30SLisandro Dalcin NULL, 357787d4246cSBarry Smith MatConjugate_SeqAIJ, 3578f4259b30SLisandro Dalcin NULL, 3579d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 358099cafbc1SBarry Smith MatRealPart_SeqAIJ, 3581f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3582f4259b30SLisandro Dalcin NULL, 3583f4259b30SLisandro Dalcin NULL, 3584cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3585f4259b30SLisandro Dalcin NULL, 35862af78befSBarry Smith MatGetRowMin_SeqAIJ, 3587f4259b30SLisandro Dalcin NULL, 3588599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3589f4259b30SLisandro Dalcin /*114*/ NULL, 3590f4259b30SLisandro Dalcin NULL, 3591f4259b30SLisandro Dalcin NULL, 3592f4259b30SLisandro Dalcin NULL, 3593f4259b30SLisandro Dalcin NULL, 3594f4259b30SLisandro Dalcin /*119*/ NULL, 3595f4259b30SLisandro Dalcin NULL, 3596f4259b30SLisandro Dalcin NULL, 3597f4259b30SLisandro Dalcin NULL, 3598b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 35990716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3600a873a8cdSSam Reynolds 
MatGetColumnReductions_SeqAIJ, 360137868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 36020da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 3603f4259b30SLisandro Dalcin NULL, 3604f4259b30SLisandro Dalcin /*129*/ NULL, 3605f4259b30SLisandro Dalcin NULL, 3606f4259b30SLisandro Dalcin NULL, 360775648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3608b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3609b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 36102b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 3611f4259b30SLisandro Dalcin NULL, 3612f4259b30SLisandro Dalcin NULL, 36133964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 3614f4259b30SLisandro Dalcin /*139*/NULL, 3615f4259b30SLisandro Dalcin NULL, 3616f4259b30SLisandro Dalcin NULL, 36173a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 36189c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 36194222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 36204222ddf1SHong Zhang /*145*/MatDestroySubMatrices_SeqAIJ, 3621f4259b30SLisandro Dalcin NULL, 3622f4259b30SLisandro Dalcin NULL 36239e29f15eSvictorle }; 362417ab2063SBarry Smith 36257087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3626bef8e0ddSBarry Smith { 3627bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 362897f1f81fSBarry Smith PetscInt i,nz,n; 3629bef8e0ddSBarry Smith 3630bef8e0ddSBarry Smith PetscFunctionBegin; 3631bef8e0ddSBarry Smith nz = aij->maxnz; 3632d0f46423SBarry Smith n = mat->rmap->n; 3633bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3634bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3635bef8e0ddSBarry Smith } 3636bef8e0ddSBarry Smith aij->nz = nz; 3637bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3638bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3639bef8e0ddSBarry Smith } 3640bef8e0ddSBarry Smith PetscFunctionReturn(0); 3641bef8e0ddSBarry Smith } 3642bef8e0ddSBarry Smith 3643a3bb6f32SFande Kong /* 3644ddea5d60SJunchao Zhang * 
Given a sparse matrix with global column indices, compact it by using a local column space. 3645ddea5d60SJunchao Zhang * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3646ddea5d60SJunchao Zhang */ 3647a3bb6f32SFande Kong PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3648a3bb6f32SFande Kong { 3649a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3650a3bb6f32SFande Kong PetscTable gid1_lid1; 3651a3bb6f32SFande Kong PetscTablePosition tpos; 365225b670f0SStefano Zampini PetscInt gid,lid,i,ec,nz = aij->nz; 365325b670f0SStefano Zampini PetscInt *garray,*jj = aij->j; 3654a3bb6f32SFande Kong 3655a3bb6f32SFande Kong PetscFunctionBegin; 3656a3bb6f32SFande Kong PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3657a3bb6f32SFande Kong PetscValidPointer(mapping,2); 3658a3bb6f32SFande Kong /* use a table */ 36599566063dSJacob Faibussowitsch PetscCall(PetscTableCreate(mat->rmap->n,mat->cmap->N+1,&gid1_lid1)); 3660a3bb6f32SFande Kong ec = 0; 366125b670f0SStefano Zampini for (i=0; i<nz; i++) { 366225b670f0SStefano Zampini PetscInt data,gid1 = jj[i] + 1; 36639566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1,gid1,&data)); 3664a3bb6f32SFande Kong if (!data) { 3665a3bb6f32SFande Kong /* one based table */ 36669566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES)); 3667a3bb6f32SFande Kong } 3668a3bb6f32SFande Kong } 3669a3bb6f32SFande Kong /* form array of columns we need */ 36709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(ec,&garray)); 36719566063dSJacob Faibussowitsch PetscCall(PetscTableGetHeadPosition(gid1_lid1,&tpos)); 3672a3bb6f32SFande Kong while (tpos) { 36739566063dSJacob Faibussowitsch PetscCall(PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid)); 3674a3bb6f32SFande Kong gid--; 3675a3bb6f32SFande Kong lid--; 3676a3bb6f32SFande Kong garray[lid] = gid; 3677a3bb6f32SFande Kong } 36789566063dSJacob Faibussowitsch 
PetscCall(PetscSortInt(ec,garray)); /* sort, and rebuild */ 36799566063dSJacob Faibussowitsch PetscCall(PetscTableRemoveAll(gid1_lid1)); 3680a3bb6f32SFande Kong for (i=0; i<ec; i++) { 36819566063dSJacob Faibussowitsch PetscCall(PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES)); 3682a3bb6f32SFande Kong } 3683a3bb6f32SFande Kong /* compact out the extra columns in B */ 368425b670f0SStefano Zampini for (i=0; i<nz; i++) { 368525b670f0SStefano Zampini PetscInt gid1 = jj[i] + 1; 36869566063dSJacob Faibussowitsch PetscCall(PetscTableFind(gid1_lid1,gid1,&lid)); 3687a3bb6f32SFande Kong lid--; 368825b670f0SStefano Zampini jj[i] = lid; 3689a3bb6f32SFande Kong } 36909566063dSJacob Faibussowitsch PetscCall(PetscLayoutDestroy(&mat->cmap)); 36919566063dSJacob Faibussowitsch PetscCall(PetscTableDestroy(&gid1_lid1)); 36929566063dSJacob Faibussowitsch PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat),ec,ec,1,&mat->cmap)); 36939566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,mat->cmap->bs,mat->cmap->n,garray,PETSC_OWN_POINTER,mapping)); 36949566063dSJacob Faibussowitsch PetscCall(ISLocalToGlobalMappingSetType(*mapping,ISLOCALTOGLOBALMAPPINGHASH)); 3695a3bb6f32SFande Kong PetscFunctionReturn(0); 3696a3bb6f32SFande Kong } 3697a3bb6f32SFande Kong 3698bef8e0ddSBarry Smith /*@ 3699bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3700bef8e0ddSBarry Smith in the matrix. 
3701bef8e0ddSBarry Smith 3702bef8e0ddSBarry Smith Input Parameters: 3703bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3704bef8e0ddSBarry Smith - indices - the column indices 3705bef8e0ddSBarry Smith 370615091d37SBarry Smith Level: advanced 370715091d37SBarry Smith 3708bef8e0ddSBarry Smith Notes: 3709bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3710bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3711bef8e0ddSBarry Smith of the MatSetValues() operation. 3712bef8e0ddSBarry Smith 3713bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3714d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 3715bef8e0ddSBarry Smith 3716bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3717bef8e0ddSBarry Smith 3718b9617806SBarry Smith The indices should start with zero, not one. 3719b9617806SBarry Smith 3720bef8e0ddSBarry Smith @*/ 37217087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3722bef8e0ddSBarry Smith { 3723bef8e0ddSBarry Smith PetscFunctionBegin; 37240700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3725dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices,2); 3726cac4c232SBarry Smith PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices)); 3727bef8e0ddSBarry Smith PetscFunctionReturn(0); 3728bef8e0ddSBarry Smith } 3729bef8e0ddSBarry Smith 3730be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3731be6bf707SBarry Smith 37327087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3733be6bf707SBarry Smith { 3734be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3735d0f46423SBarry Smith size_t nz = aij->i[mat->rmap->n]; 3736be6bf707SBarry Smith 3737be6bf707SBarry Smith PetscFunctionBegin; 373828b400f6SJacob Faibussowitsch 
PetscCheck(aij->nonew,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3739be6bf707SBarry Smith 3740be6bf707SBarry Smith /* allocate space for values if not already there */ 3741be6bf707SBarry Smith if (!aij->saved_values) { 37429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz+1,&aij->saved_values)); 37439566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)mat,(nz+1)*sizeof(PetscScalar))); 3744be6bf707SBarry Smith } 3745be6bf707SBarry Smith 3746be6bf707SBarry Smith /* copy values over */ 37479566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values,aij->a,nz)); 3748be6bf707SBarry Smith PetscFunctionReturn(0); 3749be6bf707SBarry Smith } 3750be6bf707SBarry Smith 3751be6bf707SBarry Smith /*@ 3752be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3753be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3754be6bf707SBarry Smith nonlinear portion. 3755be6bf707SBarry Smith 3756be6bf707SBarry Smith Collect on Mat 3757be6bf707SBarry Smith 3758be6bf707SBarry Smith Input Parameters: 37590e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3760be6bf707SBarry Smith 376115091d37SBarry Smith Level: advanced 376215091d37SBarry Smith 3763be6bf707SBarry Smith Common Usage, with SNESSolve(): 3764be6bf707SBarry Smith $ Create Jacobian matrix 3765be6bf707SBarry Smith $ Set linear terms into matrix 3766be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3767be6bf707SBarry Smith $ final nonzero structure (i.e. 
setting the nonlinear terms and applying 3768be6bf707SBarry Smith $ boundary conditions again will not change the nonzero structure 3769512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3770be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3771be6bf707SBarry Smith $ Call SNESSetJacobian() with matrix 3772be6bf707SBarry Smith $ In your Jacobian routine 3773be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3774be6bf707SBarry Smith $ Set nonlinear terms in matrix 3775be6bf707SBarry Smith 3776be6bf707SBarry Smith Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself: 3777be6bf707SBarry Smith $ // build linear portion of Jacobian 3778512a5fc5SBarry Smith $ ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); 3779be6bf707SBarry Smith $ ierr = MatStoreValues(mat); 3780be6bf707SBarry Smith $ loop over nonlinear iterations 3781be6bf707SBarry Smith $ ierr = MatRetrieveValues(mat); 3782be6bf707SBarry Smith $ // call MatSetValues(mat,...) to set nonliner portion of Jacobian 3783be6bf707SBarry Smith $ // call MatAssemblyBegin/End() on matrix 3784be6bf707SBarry Smith $ Solve linear system with Jacobian 3785be6bf707SBarry Smith $ endloop 3786be6bf707SBarry Smith 3787be6bf707SBarry Smith Notes: 3788be6bf707SBarry Smith Matrix must already be assemblied before calling this routine 3789512a5fc5SBarry Smith Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before 3790be6bf707SBarry Smith calling this routine. 3791be6bf707SBarry Smith 37920c468ba9SBarry Smith When this is called multiple times it overwrites the previous set of stored values 37930c468ba9SBarry Smith and does not allocated additional space. 
37940c468ba9SBarry Smith 3795be6bf707SBarry Smith .seealso: MatRetrieveValues() 3796be6bf707SBarry Smith 3797be6bf707SBarry Smith @*/ 37987087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3799be6bf707SBarry Smith { 3800be6bf707SBarry Smith PetscFunctionBegin; 38010700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 380228b400f6SJacob Faibussowitsch PetscCheck(mat->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 380328b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3804cac4c232SBarry Smith PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat)); 3805be6bf707SBarry Smith PetscFunctionReturn(0); 3806be6bf707SBarry Smith } 3807be6bf707SBarry Smith 38087087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3809be6bf707SBarry Smith { 3810be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3811d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3812be6bf707SBarry Smith 3813be6bf707SBarry Smith PetscFunctionBegin; 381428b400f6SJacob Faibussowitsch PetscCheck(aij->nonew,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 381528b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values,PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3816be6bf707SBarry Smith /* copy values over */ 38179566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a,aij->saved_values,nz)); 3818be6bf707SBarry Smith PetscFunctionReturn(0); 3819be6bf707SBarry Smith } 3820be6bf707SBarry Smith 3821be6bf707SBarry Smith /*@ 3822be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3823be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3824be6bf707SBarry Smith nonlinear portion. 
3825be6bf707SBarry Smith 3826be6bf707SBarry Smith Collect on Mat 3827be6bf707SBarry Smith 3828be6bf707SBarry Smith Input Parameters: 3829386f7cf9SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3830be6bf707SBarry Smith 383115091d37SBarry Smith Level: advanced 383215091d37SBarry Smith 3833be6bf707SBarry Smith .seealso: MatStoreValues() 3834be6bf707SBarry Smith 3835be6bf707SBarry Smith @*/ 38367087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3837be6bf707SBarry Smith { 3838be6bf707SBarry Smith PetscFunctionBegin; 38390700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 384028b400f6SJacob Faibussowitsch PetscCheck(mat->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 384128b400f6SJacob Faibussowitsch PetscCheck(!mat->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3842cac4c232SBarry Smith PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat)); 3843be6bf707SBarry Smith PetscFunctionReturn(0); 3844be6bf707SBarry Smith } 3845be6bf707SBarry Smith 3846be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 384717ab2063SBarry Smith /*@C 3848682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 38490d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 38506e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 385151c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 38522bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 385317ab2063SBarry Smith 3854d083f849SBarry Smith Collective 3855db81eaa0SLois Curfman McInnes 385617ab2063SBarry Smith Input Parameters: 3857db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 385817ab2063SBarry Smith . 
m - number of rows 385917ab2063SBarry Smith . n - number of columns 386017ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 386151c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38620298fd71SBarry Smith (possibly different for each row) or NULL 386317ab2063SBarry Smith 386417ab2063SBarry Smith Output Parameter: 3865416022c9SBarry Smith . A - the matrix 386617ab2063SBarry Smith 3867175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3868f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 3869175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3870175b88e8SBarry Smith 3871b259b22eSLois Curfman McInnes Notes: 387249a6f317SBarry Smith If nnz is given then nz is ignored 387349a6f317SBarry Smith 387417ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 387517ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 38760002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 387744cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 387817ab2063SBarry Smith 387917ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 38800298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 38813d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 38826da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 388317ab2063SBarry Smith 3884682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38854fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. 
We 3886682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38876c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38886c7ebb05SLois Curfman McInnes 38896c7ebb05SLois Curfman McInnes Options Database Keys: 3890698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 38919db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 389217ab2063SBarry Smith 3893027ccd11SLois Curfman McInnes Level: intermediate 3894027ccd11SLois Curfman McInnes 389569b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 389636db0b34SBarry Smith 389717ab2063SBarry Smith @*/ 38987087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 389917ab2063SBarry Smith { 39003a40ed3dSBarry Smith PetscFunctionBegin; 39019566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,A)); 39029566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A,m,n,m,n)); 39039566063dSJacob Faibussowitsch PetscCall(MatSetType(*A,MATSEQAIJ)); 39049566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz)); 3905273d9f13SBarry Smith PetscFunctionReturn(0); 3906273d9f13SBarry Smith } 3907273d9f13SBarry Smith 3908273d9f13SBarry Smith /*@C 3909273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3910273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3911273d9f13SBarry Smith (or the array nnz). By setting these parameters accurately, performance 3912273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3913273d9f13SBarry Smith 3914d083f849SBarry Smith Collective 3915273d9f13SBarry Smith 3916273d9f13SBarry Smith Input Parameters: 39171c4f3114SJed Brown + B - The matrix 3918273d9f13SBarry Smith . 
nz - number of nonzeros per row (same for all rows) 3919273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 39200298fd71SBarry Smith (possibly different for each row) or NULL 3921273d9f13SBarry Smith 3922273d9f13SBarry Smith Notes: 392349a6f317SBarry Smith If nnz is given then nz is ignored 392449a6f317SBarry Smith 3925273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3926273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3927273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3928273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3929273d9f13SBarry Smith 3930273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 39310298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 3932273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3933273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3934273d9f13SBarry Smith 3935aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3936aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3937aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3938aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 3939aa95bbe8SBarry Smith 3940a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3941a96a251dSBarry Smith entries or columns indices 3942a96a251dSBarry Smith 3943273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3944273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. 
We 3945273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3946273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3947273d9f13SBarry Smith 3948273d9f13SBarry Smith Options Database Keys: 3949698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 395047b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3951273d9f13SBarry Smith 3952273d9f13SBarry Smith Level: intermediate 3953273d9f13SBarry Smith 395419b08ed1SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays(), MatGetInfo(), 395519b08ed1SBarry Smith MatSeqAIJSetTotalPreallocation() 3956273d9f13SBarry Smith 3957273d9f13SBarry Smith @*/ 39587087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3959273d9f13SBarry Smith { 3960a23d5eceSKris Buschelman PetscFunctionBegin; 39616ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 39626ba663aaSJed Brown PetscValidType(B,1); 3963cac4c232SBarry Smith PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz)); 3964a23d5eceSKris Buschelman PetscFunctionReturn(0); 3965a23d5eceSKris Buschelman } 3966a23d5eceSKris Buschelman 39677087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3968a23d5eceSKris Buschelman { 3969273d9f13SBarry Smith Mat_SeqAIJ *b; 39702576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE,realalloc = PETSC_FALSE; 397197f1f81fSBarry Smith PetscInt i; 3972273d9f13SBarry Smith 3973273d9f13SBarry Smith PetscFunctionBegin; 39742576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3975a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3976c461c341SBarry Smith skipallocation = PETSC_TRUE; 3977c461c341SBarry Smith nz = 0; 3978c461c341SBarry Smith } 39799566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 39809566063dSJacob 
Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 3981899cda47SBarry Smith 3982435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 39832c71b3e2SJacob Faibussowitsch PetscCheckFalse(nz < 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %" PetscInt_FMT,nz); 3984cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3985d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 39862c71b3e2SJacob Faibussowitsch PetscCheckFalse(nnz[i] < 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT,i,nnz[i]); 39872c71b3e2SJacob Faibussowitsch PetscCheckFalse(nnz[i] > B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT,i,nnz[i],B->cmap->n); 3988b73539f3SBarry Smith } 3989b73539f3SBarry Smith } 3990b73539f3SBarry Smith 3991273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39922205254eSKarl Rupp 3993273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 3994273d9f13SBarry Smith 3995ab93d7beSBarry Smith if (!skipallocation) { 39962ee49352SLisandro Dalcin if (!b->imax) { 39979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&b->imax)); 39989566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 3999071fcb05SBarry Smith } 4000071fcb05SBarry Smith if (!b->ilen) { 4001071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 40029566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(B->rmap->n,&b->ilen)); 40039566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 4004071fcb05SBarry Smith } else { 40059566063dSJacob Faibussowitsch PetscCall(PetscMemzero(b->ilen,B->rmap->n*sizeof(PetscInt))); 40062ee49352SLisandro Dalcin } 4007846b4da1SFande Kong if (!b->ipre) { 40089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&b->ipre)); 40099566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt))); 4010846b4da1SFande Kong } 4011273d9f13SBarry Smith if (!nnz) { 4012435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 4013c62bd62aSJed Brown else if (nz < 0) nz = 1; 40145d2a9ed1SStefano Zampini nz = PetscMin(nz,B->cmap->n); 4015d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 4016d0f46423SBarry Smith nz = nz*B->rmap->n; 4017273d9f13SBarry Smith } else { 4018c73702f5SBarry Smith PetscInt64 nz64 = 0; 4019c73702f5SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz64 += nnz[i];} 40209566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64,&nz)); 4021273d9f13SBarry Smith } 4022ab93d7beSBarry Smith 4023273d9f13SBarry Smith /* allocate the matrix space */ 402453dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 40259566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i)); 4026396832f4SHong Zhang if (B->structure_only) { 40279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz,&b->j)); 40289566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n+1,&b->i)); 40299566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*sizeof(PetscInt))); 4030396832f4SHong Zhang } else { 40319566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(nz,&b->a,nz,&b->j,B->rmap->n+1,&b->i)); 40329566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)))); 4033396832f4SHong Zhang } 4034bfeeae90SHong Zhang b->i[0] = 0; 4035d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 40365da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 40375da197adSKris Buschelman } 4038396832f4SHong Zhang if (B->structure_only) { 4039396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 4040396832f4SHong Zhang b->free_a = PETSC_FALSE; 4041396832f4SHong Zhang } else { 4042273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 4043e6b907acSBarry Smith b->free_a = PETSC_TRUE; 4044396832f4SHong Zhang } 4045e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 4046c461c341SBarry Smith } else { 4047e6b907acSBarry Smith b->free_a = PETSC_FALSE; 4048e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 4049c461c341SBarry Smith } 4050273d9f13SBarry Smith 4051846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 4052846b4da1SFande Kong /* reserve user-requested sparsity */ 40539566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->ipre,b->imax,B->rmap->n)); 4054846b4da1SFande Kong } 4055846b4da1SFande Kong 4056273d9f13SBarry Smith b->nz = 0; 4057273d9f13SBarry Smith b->maxnz = nz; 4058273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 40592205254eSKarl Rupp if (realalloc) { 40609566063dSJacob Faibussowitsch 
PetscCall(MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE)); 40612205254eSKarl Rupp } 4062cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 4063cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 4064273d9f13SBarry Smith PetscFunctionReturn(0); 4065273d9f13SBarry Smith } 4066273d9f13SBarry Smith 4067846b4da1SFande Kong PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 4068846b4da1SFande Kong { 4069846b4da1SFande Kong Mat_SeqAIJ *a; 4070a5bbaf83SFande Kong PetscInt i; 4071846b4da1SFande Kong 4072846b4da1SFande Kong PetscFunctionBegin; 4073846b4da1SFande Kong PetscValidHeaderSpecific(A,MAT_CLASSID,1); 407414d0e64fSAlex Lindsay 407514d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 407614d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 407714d0e64fSAlex Lindsay 4078846b4da1SFande Kong a = (Mat_SeqAIJ*)A->data; 40792c814fdeSFande Kong /* if no saved info, we error out */ 408028b400f6SJacob Faibussowitsch PetscCheck(a->ipre,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"No saved preallocation info "); 40812c814fdeSFande Kong 40822c71b3e2SJacob Faibussowitsch PetscCheckFalse(!a->i || !a->j || !a->a || !a->imax || !a->ilen,PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Memory info is incomplete, and can not reset preallocation "); 40832c814fdeSFande Kong 40849566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->imax,a->ipre,A->rmap->n)); 40859566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(a->ilen,A->rmap->n)); 4086846b4da1SFande Kong a->i[0] = 0; 4087846b4da1SFande Kong for (i=1; i<A->rmap->n+1; i++) { 4088846b4da1SFande Kong a->i[i] = a->i[i-1] + a->imax[i-1]; 4089846b4da1SFande Kong } 4090846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4091846b4da1SFande Kong a->nz = 0; 4092846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4093846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4094846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4095846b4da1SFande Kong A->assembled = PETSC_FALSE; 4096846b4da1SFande Kong PetscFunctionReturn(0); 
4097846b4da1SFande Kong } 4098846b4da1SFande Kong 409958d36128SBarry Smith /*@ 4100a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 4101a1661176SMatthew Knepley 4102a1661176SMatthew Knepley Input Parameters: 4103a1661176SMatthew Knepley + B - the matrix 4104a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4105a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4106a1661176SMatthew Knepley - v - optional values in the matrix 4107a1661176SMatthew Knepley 4108a1661176SMatthew Knepley Level: developer 4109a1661176SMatthew Knepley 41106a9b8d82SBarry Smith Notes: 411158d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 411258d36128SBarry Smith 41136a9b8d82SBarry Smith This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero 41146a9b8d82SBarry Smith structure will be the union of all the previous nonzero structures. 41156a9b8d82SBarry Smith 41166a9b8d82SBarry Smith Developer Notes: 41176a9b8d82SBarry Smith An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and 41186a9b8d82SBarry Smith then just copies the v values directly with PetscMemcpy(). 41196a9b8d82SBarry Smith 41206a9b8d82SBarry Smith This routine could also take a PetscCopyMode argument to allow sharing the values instead of always copying them. 
41216a9b8d82SBarry Smith 41226a9b8d82SBarry Smith .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatSeqAIJSetPreallocation(), MatCreateSeqAIJ(), MATSEQAIJ, MatResetPreallocation() 4123a1661176SMatthew Knepley @*/ 4124a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 4125a1661176SMatthew Knepley { 4126a1661176SMatthew Knepley PetscFunctionBegin; 41270700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 41286ba663aaSJed Brown PetscValidType(B,1); 4129cac4c232SBarry Smith PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v)); 4130a1661176SMatthew Knepley PetscFunctionReturn(0); 4131a1661176SMatthew Knepley } 4132a1661176SMatthew Knepley 41337087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 4134a1661176SMatthew Knepley { 4135a1661176SMatthew Knepley PetscInt i; 4136a1661176SMatthew Knepley PetscInt m,n; 4137a1661176SMatthew Knepley PetscInt nz; 41386a9b8d82SBarry Smith PetscInt *nnz; 4139a1661176SMatthew Knepley 4140a1661176SMatthew Knepley PetscFunctionBegin; 41412c71b3e2SJacob Faibussowitsch PetscCheckFalse(Ii[0],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]); 4142779a8d59SSatish Balay 41439566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 41449566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 4145779a8d59SSatish Balay 41469566063dSJacob Faibussowitsch PetscCall(MatGetSize(B, &m, &n)); 41479566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1, &nnz)); 4148a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4149b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 41502c71b3e2SJacob Faibussowitsch PetscCheckFalse(nz < 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, 
nz); 4151a1661176SMatthew Knepley nnz[i] = nz; 4152a1661176SMatthew Knepley } 41539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz)); 41549566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 4155a1661176SMatthew Knepley 4156a1661176SMatthew Knepley for (i = 0; i < m; i++) { 41579566063dSJacob Faibussowitsch PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i+1] - Ii[i], J+Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES)); 4158a1661176SMatthew Knepley } 4159a1661176SMatthew Knepley 41609566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY)); 41619566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY)); 4162a1661176SMatthew Knepley 41639566063dSJacob Faibussowitsch PetscCall(MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE)); 4164a1661176SMatthew Knepley PetscFunctionReturn(0); 4165a1661176SMatthew Knepley } 4166a1661176SMatthew Knepley 4167ad7e164aSPierre Jolivet /*@ 4168ad7e164aSPierre Jolivet MatSeqAIJKron - Computes C, the Kronecker product of A and B. 4169ad7e164aSPierre Jolivet 4170ad7e164aSPierre Jolivet Input Parameters: 4171ad7e164aSPierre Jolivet + A - left-hand side matrix 4172ad7e164aSPierre Jolivet . B - right-hand side matrix 4173ad7e164aSPierre Jolivet - reuse - either MAT_INITIAL_MATRIX or MAT_REUSE_MATRIX 4174ad7e164aSPierre Jolivet 4175ad7e164aSPierre Jolivet Output Parameter: 4176ad7e164aSPierre Jolivet . C - Kronecker product of A and B 4177ad7e164aSPierre Jolivet 4178ad7e164aSPierre Jolivet Level: intermediate 4179ad7e164aSPierre Jolivet 4180ad7e164aSPierre Jolivet Notes: 4181ad7e164aSPierre Jolivet MAT_REUSE_MATRIX can only be used when the nonzero structure of the product matrix has not changed from that last call to MatSeqAIJKron(). 
4182ad7e164aSPierre Jolivet 4183ad7e164aSPierre Jolivet .seealso: MatCreateSeqAIJ(), MATSEQAIJ, MATKAIJ, MatReuse 4184ad7e164aSPierre Jolivet @*/ 4185ad7e164aSPierre Jolivet PetscErrorCode MatSeqAIJKron(Mat A,Mat B,MatReuse reuse,Mat *C) 4186ad7e164aSPierre Jolivet { 4187ad7e164aSPierre Jolivet PetscFunctionBegin; 4188ad7e164aSPierre Jolivet PetscValidHeaderSpecific(A,MAT_CLASSID,1); 4189ad7e164aSPierre Jolivet PetscValidType(A,1); 4190ad7e164aSPierre Jolivet PetscValidHeaderSpecific(B,MAT_CLASSID,2); 4191ad7e164aSPierre Jolivet PetscValidType(B,2); 4192ad7e164aSPierre Jolivet PetscValidPointer(C,4); 4193ad7e164aSPierre Jolivet if (reuse == MAT_REUSE_MATRIX) { 4194ad7e164aSPierre Jolivet PetscValidHeaderSpecific(*C,MAT_CLASSID,4); 4195ad7e164aSPierre Jolivet PetscValidType(*C,4); 4196ad7e164aSPierre Jolivet } 4197cac4c232SBarry Smith PetscTryMethod(A,"MatSeqAIJKron_C",(Mat,Mat,MatReuse,Mat*),(A,B,reuse,C)); 4198ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4199ad7e164aSPierre Jolivet } 4200ad7e164aSPierre Jolivet 4201ad7e164aSPierre Jolivet PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A,Mat B,MatReuse reuse,Mat *C) 4202ad7e164aSPierre Jolivet { 4203ad7e164aSPierre Jolivet Mat newmat; 4204ad7e164aSPierre Jolivet Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 4205ad7e164aSPierre Jolivet Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 4206ad7e164aSPierre Jolivet PetscScalar *v; 4207fff043a9SJunchao Zhang const PetscScalar *aa,*ba; 4208ad7e164aSPierre Jolivet PetscInt *i,*j,m,n,p,q,nnz = 0,am = A->rmap->n,bm = B->rmap->n,an = A->cmap->n, bn = B->cmap->n; 4209ad7e164aSPierre Jolivet PetscBool flg; 4210ad7e164aSPierre Jolivet 4211ad7e164aSPierre Jolivet PetscFunctionBegin; 421228b400f6SJacob Faibussowitsch PetscCheck(!A->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 421328b400f6SJacob Faibussowitsch PetscCheck(A->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 421428b400f6SJacob Faibussowitsch 
PetscCheck(!B->factortype,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 421528b400f6SJacob Faibussowitsch PetscCheck(B->assembled,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 42169566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)B,MATSEQAIJ,&flg)); 421728b400f6SJacob Faibussowitsch PetscCheck(flg,PETSC_COMM_SELF,PETSC_ERR_SUP,"MatType %s",((PetscObject)B)->type_name); 42182c71b3e2SJacob Faibussowitsch PetscCheckFalse(reuse != MAT_INITIAL_MATRIX && reuse != MAT_REUSE_MATRIX,PETSC_COMM_SELF,PETSC_ERR_SUP,"MatReuse %d",(int)reuse); 4219ad7e164aSPierre Jolivet if (reuse == MAT_INITIAL_MATRIX) { 42209566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(am*bm+1,&i,a->i[am]*b->i[bm],&j)); 42219566063dSJacob Faibussowitsch PetscCall(MatCreate(PETSC_COMM_SELF,&newmat)); 42229566063dSJacob Faibussowitsch PetscCall(MatSetSizes(newmat,am*bm,an*bn,am*bm,an*bn)); 42239566063dSJacob Faibussowitsch PetscCall(MatSetType(newmat,MATAIJ)); 4224ad7e164aSPierre Jolivet i[0] = 0; 4225ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4226ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4227ad7e164aSPierre Jolivet i[m*bm + p + 1] = i[m*bm + p] + (a->i[m+1] - a->i[m]) * (b->i[p+1] - b->i[p]); 4228ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m+1]; ++n) { 4229ad7e164aSPierre Jolivet for (q = b->i[p]; q < b->i[p+1]; ++q) { 4230ad7e164aSPierre Jolivet j[nnz++] = a->j[n]*bn + b->j[q]; 4231ad7e164aSPierre Jolivet } 4232ad7e164aSPierre Jolivet } 4233ad7e164aSPierre Jolivet } 4234ad7e164aSPierre Jolivet } 42359566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocationCSR(newmat,i,j,NULL)); 4236ad7e164aSPierre Jolivet *C = newmat; 42379566063dSJacob Faibussowitsch PetscCall(PetscFree2(i,j)); 4238ad7e164aSPierre Jolivet nnz = 0; 4239ad7e164aSPierre Jolivet } 42409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(*C,&v)); 42419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 
42429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&ba)); 4243ad7e164aSPierre Jolivet for (m = 0; m < am; ++m) { 4244ad7e164aSPierre Jolivet for (p = 0; p < bm; ++p) { 4245ad7e164aSPierre Jolivet for (n = a->i[m]; n < a->i[m+1]; ++n) { 4246ad7e164aSPierre Jolivet for (q = b->i[p]; q < b->i[p+1]; ++q) { 4247fff043a9SJunchao Zhang v[nnz++] = aa[n] * ba[q]; 4248ad7e164aSPierre Jolivet } 4249ad7e164aSPierre Jolivet } 4250ad7e164aSPierre Jolivet } 4251ad7e164aSPierre Jolivet } 42529566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(*C,&v)); 42539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 42549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&ba)); 4255ad7e164aSPierre Jolivet PetscFunctionReturn(0); 4256ad7e164aSPierre Jolivet } 4257ad7e164aSPierre Jolivet 4258c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4259af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4260170fe5c8SBarry Smith 4261170fe5c8SBarry Smith /* 4262170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4263170fe5c8SBarry Smith 4264170fe5c8SBarry Smith n p p 42652da392ccSBarry Smith [ ] [ ] [ ] 42662da392ccSBarry Smith m [ A ] * n [ B ] = m [ C ] 42672da392ccSBarry Smith [ ] [ ] [ ] 4268170fe5c8SBarry Smith 4269170fe5c8SBarry Smith */ 4270170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 4271170fe5c8SBarry Smith { 4272170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 4273170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 4274170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 427586214ceeSStefano Zampini PetscInt i,j,n,m,q,p; 4276170fe5c8SBarry Smith const PetscInt *ii,*idx; 4277170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 4278170fe5c8SBarry Smith PetscScalar *c,*c_q; 427986214ceeSStefano Zampini PetscInt clda = sub_c->lda; 428086214ceeSStefano Zampini PetscInt alda = sub_a->lda; 
4281170fe5c8SBarry Smith 4282170fe5c8SBarry Smith PetscFunctionBegin; 4283d0f46423SBarry Smith m = A->rmap->n; 4284d0f46423SBarry Smith n = A->cmap->n; 4285d0f46423SBarry Smith p = B->cmap->n; 4286170fe5c8SBarry Smith a = sub_a->v; 4287170fe5c8SBarry Smith b = sub_b->a; 4288170fe5c8SBarry Smith c = sub_c->v; 428986214ceeSStefano Zampini if (clda == m) { 42909566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c,m*p)); 429186214ceeSStefano Zampini } else { 429286214ceeSStefano Zampini for (j=0;j<p;j++) 429386214ceeSStefano Zampini for (i=0;i<m;i++) 429486214ceeSStefano Zampini c[j*clda + i] = 0.0; 429586214ceeSStefano Zampini } 4296170fe5c8SBarry Smith ii = sub_b->i; 4297170fe5c8SBarry Smith idx = sub_b->j; 4298170fe5c8SBarry Smith for (i=0; i<n; i++) { 4299170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 4300170fe5c8SBarry Smith while (q-->0) { 430186214ceeSStefano Zampini c_q = c + clda*(*idx); 430286214ceeSStefano Zampini a_q = a + alda*i; 4303854c7f52SBarry Smith PetscKernelAXPY(c_q,*b,a_q,m); 4304170fe5c8SBarry Smith idx++; 4305170fe5c8SBarry Smith b++; 4306170fe5c8SBarry Smith } 4307170fe5c8SBarry Smith } 4308170fe5c8SBarry Smith PetscFunctionReturn(0); 4309170fe5c8SBarry Smith } 4310170fe5c8SBarry Smith 43114222ddf1SHong Zhang PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat C) 4312170fe5c8SBarry Smith { 4313d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 431486214ceeSStefano Zampini PetscBool cisdense; 4315170fe5c8SBarry Smith 4316170fe5c8SBarry Smith PetscFunctionBegin; 43172c71b3e2SJacob Faibussowitsch PetscCheckFalse(A->cmap->n != B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT,A->cmap->n,B->rmap->n); 43189566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C,m,n,m,n)); 43199566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C,A,B)); 43209566063dSJacob Faibussowitsch 
PetscCall(PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"")); 432186214ceeSStefano Zampini if (!cisdense) { 43229566063dSJacob Faibussowitsch PetscCall(MatSetType(C,MATDENSE)); 432386214ceeSStefano Zampini } 43249566063dSJacob Faibussowitsch PetscCall(MatSetUp(C)); 4325d73949e8SHong Zhang 43264222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4327170fe5c8SBarry Smith PetscFunctionReturn(0); 4328170fe5c8SBarry Smith } 4329170fe5c8SBarry Smith 4330170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 43310bad9183SKris Buschelman /*MC 4332fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 43330bad9183SKris Buschelman based on compressed sparse row format. 43340bad9183SKris Buschelman 43350bad9183SKris Buschelman Options Database Keys: 43360bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 43370bad9183SKris Buschelman 43380bad9183SKris Buschelman Level: beginner 43390bad9183SKris Buschelman 43400cd7f59aSBarry Smith Notes: 43410cd7f59aSBarry Smith MatSetValues() may be called for this matrix type with a NULL argument for the numerical values, 43420cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 43430cd7f59aSBarry Smith in the matrix 43440cd7f59aSBarry Smith 43450cd7f59aSBarry Smith MatSetOptions(,MAT_STRUCTURE_ONLY,PETSC_TRUE) may be called for this matrix type. 
In this case no 43460cd7f59aSBarry Smith space is allocated for the nonzero entries and any entries passed with MatSetValues() are ignored 43470cd7f59aSBarry Smith 43480cd7f59aSBarry Smith Developer Notes: 43490cd7f59aSBarry Smith It would be nice if all matrix formats supported passing NULL in for the numerical values 43500cd7f59aSBarry Smith 4351ed73aabaSBarry Smith .seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType, MATSELL, MATSEQSELL, MATMPISELL 43520bad9183SKris Buschelman M*/ 43530bad9183SKris Buschelman 4354ccd284c7SBarry Smith /*MC 4355ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 4356ccd284c7SBarry Smith 4357ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJ when constructed with a single process communicator, 4358ccd284c7SBarry Smith and MATMPIAIJ otherwise. As a result, for single process communicators, 4359ed73aabaSBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4360ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4361ccd284c7SBarry Smith the above preallocation routines for simplicity. 4362ccd284c7SBarry Smith 4363ccd284c7SBarry Smith Options Database Keys: 4364ccd284c7SBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to MatSetFromOptions() 4365ccd284c7SBarry Smith 436695452b02SPatrick Sanan Developer Notes: 4367ca9cdca7SRichard Tran Mills Subclasses include MATAIJCUSPARSE, MATAIJPERM, MATAIJSELL, MATAIJMKL, MATAIJCRL, and also automatically switches over to use inodes when 4368ccd284c7SBarry Smith enough exist. 
4369ccd284c7SBarry Smith 4370ccd284c7SBarry Smith Level: beginner 4371ccd284c7SBarry Smith 4372ed73aabaSBarry Smith .seealso: MatCreateAIJ(), MatCreateSeqAIJ(), MATSEQAIJ, MATMPIAIJ, MATSELL, MATSEQSELL, MATMPISELL 4373ccd284c7SBarry Smith M*/ 4374ccd284c7SBarry Smith 4375ccd284c7SBarry Smith /*MC 4376ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4377ccd284c7SBarry Smith 4378ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJCRL when constructed with a single process communicator, 4379ccd284c7SBarry Smith and MATMPIAIJCRL otherwise. As a result, for single process communicators, 4380ccd284c7SBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4381ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4382ccd284c7SBarry Smith the above preallocation routines for simplicity. 4383ccd284c7SBarry Smith 4384ccd284c7SBarry Smith Options Database Keys: 4385ccd284c7SBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to MatSetFromOptions() 4386ccd284c7SBarry Smith 4387ccd284c7SBarry Smith Level: beginner 4388ccd284c7SBarry Smith 4389ccd284c7SBarry Smith .seealso: MatCreateMPIAIJCRL,MATSEQAIJCRL,MATMPIAIJCRL, MATSEQAIJCRL, MATMPIAIJCRL 4390ccd284c7SBarry Smith M*/ 4391ccd284c7SBarry Smith 43927906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*); 43937906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 43947906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat,MatType,MatReuse,Mat*); 43957906f579SHong Zhang #endif 4396d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4397d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat,MatType,MatReuse,Mat*); 4398d24d4204SJose E. 
Roman #endif 43997906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 44007906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A,MatType,MatReuse,Mat*); 44017906f579SHong Zhang #endif 44027906f579SHong Zhang 4403d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat,MatType,MatReuse,Mat*); 4404c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat,MatType,MatReuse,Mat*); 44054222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 44067906f579SHong Zhang 44078c778c55SBarry Smith /*@C 44088f1ea47aSStefano Zampini MatSeqAIJGetArray - gives read/write access to the array where the data for a MATSEQAIJ matrix is stored 44098c778c55SBarry Smith 44108c778c55SBarry Smith Not Collective 44118c778c55SBarry Smith 44128c778c55SBarry Smith Input Parameter: 4413579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 44148c778c55SBarry Smith 44158c778c55SBarry Smith Output Parameter: 44168c778c55SBarry Smith . array - pointer to the data 44178c778c55SBarry Smith 44188c778c55SBarry Smith Level: intermediate 44198c778c55SBarry Smith 4420774cf152SJed Brown .seealso: MatSeqAIJRestoreArray(), MatSeqAIJGetArrayF90() 44218c778c55SBarry Smith @*/ 44228c778c55SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A,PetscScalar **array) 44238c778c55SBarry Smith { 4424d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 44258c778c55SBarry Smith 44268c778c55SBarry Smith PetscFunctionBegin; 4427d67d9f35SJunchao Zhang if (aij->ops->getarray) { 44289566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarray)(A,array)); 4429d67d9f35SJunchao Zhang } else { 4430d67d9f35SJunchao Zhang *array = aij->a; 4431d67d9f35SJunchao Zhang } 4432d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4433d67d9f35SJunchao Zhang } 4434d67d9f35SJunchao Zhang 4435d67d9f35SJunchao Zhang /*@C 4436d67d9f35SJunchao Zhang MatSeqAIJRestoreArray - returns access to the array where the data for a MATSEQAIJ matrix is stored obtained by 
MatSeqAIJGetArray() 4437d67d9f35SJunchao Zhang 4438d67d9f35SJunchao Zhang Not Collective 4439d67d9f35SJunchao Zhang 4440d67d9f35SJunchao Zhang Input Parameters: 4441d67d9f35SJunchao Zhang + mat - a MATSEQAIJ matrix 4442d67d9f35SJunchao Zhang - array - pointer to the data 4443d67d9f35SJunchao Zhang 4444d67d9f35SJunchao Zhang Level: intermediate 4445d67d9f35SJunchao Zhang 4446d67d9f35SJunchao Zhang .seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayF90() 4447d67d9f35SJunchao Zhang @*/ 4448d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJRestoreArray(Mat A,PetscScalar **array) 4449d67d9f35SJunchao Zhang { 4450d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4451d67d9f35SJunchao Zhang 4452d67d9f35SJunchao Zhang PetscFunctionBegin; 4453d67d9f35SJunchao Zhang if (aij->ops->restorearray) { 44549566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearray)(A,array)); 4455d67d9f35SJunchao Zhang } else { 4456d67d9f35SJunchao Zhang *array = NULL; 4457d67d9f35SJunchao Zhang } 44589566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 44599566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 44608c778c55SBarry Smith PetscFunctionReturn(0); 44618c778c55SBarry Smith } 44628c778c55SBarry Smith 446321e72a00SBarry Smith /*@C 44648f1ea47aSStefano Zampini MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a MATSEQAIJ matrix is stored 44658f1ea47aSStefano Zampini 44668f1ea47aSStefano Zampini Not Collective 44678f1ea47aSStefano Zampini 44688f1ea47aSStefano Zampini Input Parameter: 44698f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 44708f1ea47aSStefano Zampini 44718f1ea47aSStefano Zampini Output Parameter: 44728f1ea47aSStefano Zampini . 
array - pointer to the data 44738f1ea47aSStefano Zampini 44748f1ea47aSStefano Zampini Level: intermediate 44758f1ea47aSStefano Zampini 44768f1ea47aSStefano Zampini .seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayRead() 44778f1ea47aSStefano Zampini @*/ 44788f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJGetArrayRead(Mat A,const PetscScalar **array) 44798f1ea47aSStefano Zampini { 4480d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 44818f1ea47aSStefano Zampini 44828f1ea47aSStefano Zampini PetscFunctionBegin; 4483d67d9f35SJunchao Zhang if (aij->ops->getarrayread) { 44849566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarrayread)(A,array)); 4485d67d9f35SJunchao Zhang } else { 4486d67d9f35SJunchao Zhang *array = aij->a; 4487d67d9f35SJunchao Zhang } 44888f1ea47aSStefano Zampini PetscFunctionReturn(0); 44898f1ea47aSStefano Zampini } 44908f1ea47aSStefano Zampini 44918f1ea47aSStefano Zampini /*@C 44928f1ea47aSStefano Zampini MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from MatSeqAIJGetArrayRead 44938f1ea47aSStefano Zampini 44948f1ea47aSStefano Zampini Not Collective 44958f1ea47aSStefano Zampini 44968f1ea47aSStefano Zampini Input Parameter: 44978f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 44988f1ea47aSStefano Zampini 44998f1ea47aSStefano Zampini Output Parameter: 45008f1ea47aSStefano Zampini . 
array - pointer to the data 45018f1ea47aSStefano Zampini 45028f1ea47aSStefano Zampini Level: intermediate 45038f1ea47aSStefano Zampini 45048f1ea47aSStefano Zampini .seealso: MatSeqAIJGetArray(), MatSeqAIJGetArrayRead() 45058f1ea47aSStefano Zampini @*/ 45068f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A,const PetscScalar **array) 45078f1ea47aSStefano Zampini { 4508d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 45098f1ea47aSStefano Zampini 45108f1ea47aSStefano Zampini PetscFunctionBegin; 4511d67d9f35SJunchao Zhang if (aij->ops->restorearrayread) { 45129566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearrayread)(A,array)); 4513d67d9f35SJunchao Zhang } else { 4514d67d9f35SJunchao Zhang *array = NULL; 4515d67d9f35SJunchao Zhang } 4516d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4517d67d9f35SJunchao Zhang } 4518d67d9f35SJunchao Zhang 4519d67d9f35SJunchao Zhang /*@C 4520d67d9f35SJunchao Zhang MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a MATSEQAIJ matrix is stored 4521d67d9f35SJunchao Zhang 4522d67d9f35SJunchao Zhang Not Collective 4523d67d9f35SJunchao Zhang 4524d67d9f35SJunchao Zhang Input Parameter: 4525d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4526d67d9f35SJunchao Zhang 4527d67d9f35SJunchao Zhang Output Parameter: 4528d67d9f35SJunchao Zhang . 
array - pointer to the data 4529d67d9f35SJunchao Zhang 4530d67d9f35SJunchao Zhang Level: intermediate 4531d67d9f35SJunchao Zhang 4532d67d9f35SJunchao Zhang .seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayRead() 4533d67d9f35SJunchao Zhang @*/ 4534d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJGetArrayWrite(Mat A,PetscScalar **array) 4535d67d9f35SJunchao Zhang { 4536d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4537d67d9f35SJunchao Zhang 4538d67d9f35SJunchao Zhang PetscFunctionBegin; 4539d67d9f35SJunchao Zhang if (aij->ops->getarraywrite) { 45409566063dSJacob Faibussowitsch PetscCall((*aij->ops->getarraywrite)(A,array)); 4541d67d9f35SJunchao Zhang } else { 4542d67d9f35SJunchao Zhang *array = aij->a; 4543d67d9f35SJunchao Zhang } 45449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal(A)); 45459566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)A)); 4546d67d9f35SJunchao Zhang PetscFunctionReturn(0); 4547d67d9f35SJunchao Zhang } 4548d67d9f35SJunchao Zhang 4549d67d9f35SJunchao Zhang /*@C 4550d67d9f35SJunchao Zhang MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead 4551d67d9f35SJunchao Zhang 4552d67d9f35SJunchao Zhang Not Collective 4553d67d9f35SJunchao Zhang 4554d67d9f35SJunchao Zhang Input Parameter: 4555d67d9f35SJunchao Zhang . mat - a MATSEQAIJ matrix 4556d67d9f35SJunchao Zhang 4557d67d9f35SJunchao Zhang Output Parameter: 4558d67d9f35SJunchao Zhang . 
array - pointer to the data 4559d67d9f35SJunchao Zhang 4560d67d9f35SJunchao Zhang Level: intermediate 4561d67d9f35SJunchao Zhang 4562d67d9f35SJunchao Zhang .seealso: MatSeqAIJGetArray(), MatSeqAIJGetArrayRead() 4563d67d9f35SJunchao Zhang @*/ 4564d67d9f35SJunchao Zhang PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A,PetscScalar **array) 4565d67d9f35SJunchao Zhang { 4566d67d9f35SJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 4567d67d9f35SJunchao Zhang 4568d67d9f35SJunchao Zhang PetscFunctionBegin; 4569d67d9f35SJunchao Zhang if (aij->ops->restorearraywrite) { 45709566063dSJacob Faibussowitsch PetscCall((*aij->ops->restorearraywrite)(A,array)); 4571d67d9f35SJunchao Zhang } else { 4572d67d9f35SJunchao Zhang *array = NULL; 4573d67d9f35SJunchao Zhang } 45748f1ea47aSStefano Zampini PetscFunctionReturn(0); 45758f1ea47aSStefano Zampini } 45768f1ea47aSStefano Zampini 45778f1ea47aSStefano Zampini /*@C 45787ee59b9bSJunchao Zhang MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the SEQAIJ matrix 45797ee59b9bSJunchao Zhang 45807ee59b9bSJunchao Zhang Not Collective 45817ee59b9bSJunchao Zhang 45827ee59b9bSJunchao Zhang Input Parameter: 45837ee59b9bSJunchao Zhang . mat - a matrix of type MATSEQAIJ or its subclasses 45847ee59b9bSJunchao Zhang 45857ee59b9bSJunchao Zhang Output Parameters: 45867ee59b9bSJunchao Zhang + i - row map array of the matrix 45877ee59b9bSJunchao Zhang . j - column index array of the matrix 45887ee59b9bSJunchao Zhang . a - data array of the matrix 45897ee59b9bSJunchao Zhang - memtype - memory type of the arrays 45907ee59b9bSJunchao Zhang 45917ee59b9bSJunchao Zhang Notes: 45927ee59b9bSJunchao Zhang Any of the output parameters can be NULL, in which case the corresponding value is not returned. 45937ee59b9bSJunchao Zhang If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host. 
45947ee59b9bSJunchao Zhang 45957ee59b9bSJunchao Zhang One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix. 45967ee59b9bSJunchao Zhang If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix. 45977ee59b9bSJunchao Zhang 45987ee59b9bSJunchao Zhang Level: Developer 45997ee59b9bSJunchao Zhang 46007ee59b9bSJunchao Zhang .seealso: MatSeqAIJGetArray(), MatSeqAIJGetArrayRead() 46017ee59b9bSJunchao Zhang @*/ 46027ee59b9bSJunchao Zhang PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat,const PetscInt **i,const PetscInt **j,PetscScalar **a,PetscMemType *mtype) 46037ee59b9bSJunchao Zhang { 46047ee59b9bSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 46057ee59b9bSJunchao Zhang 46067ee59b9bSJunchao Zhang PetscFunctionBegin; 46077ee59b9bSJunchao Zhang PetscCheck(mat->preallocated,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"matrix is not preallocated"); 46087ee59b9bSJunchao Zhang if (aij->ops->getcsrandmemtype) { 46097ee59b9bSJunchao Zhang PetscCall((*aij->ops->getcsrandmemtype)(mat,i,j,a,mtype)); 46107ee59b9bSJunchao Zhang } else { 46117ee59b9bSJunchao Zhang if (i) *i = aij->i; 46127ee59b9bSJunchao Zhang if (j) *j = aij->j; 46137ee59b9bSJunchao Zhang if (a) *a = aij->a; 46147ee59b9bSJunchao Zhang if (mtype) *mtype = PETSC_MEMTYPE_HOST; 46157ee59b9bSJunchao Zhang } 46167ee59b9bSJunchao Zhang PetscFunctionReturn(0); 46177ee59b9bSJunchao Zhang } 46187ee59b9bSJunchao Zhang 46197ee59b9bSJunchao Zhang /*@C 462021e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 462121e72a00SBarry Smith 462221e72a00SBarry Smith Not Collective 462321e72a00SBarry Smith 462421e72a00SBarry Smith Input Parameter: 4625579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 462621e72a00SBarry Smith 462721e72a00SBarry Smith Output Parameter: 462821e72a00SBarry Smith . 
/*
   MatSetPreallocationCOO_SeqAIJ - builds the CSR structure of mat from coo_n (row,column) index pairs
   and records the data needed to later scatter COO values into that structure.

   Input Parameters:
+  mat   - the matrix; any previous COO preallocation is reset first
.  coo_n - number of (row,column) pairs
.  coo_i - row indices, length coo_n (copied, the caller's array is not modified)
-  coo_j - column indices, length coo_n (copied, the caller's array is not modified)

   On return the Mat_SeqAIJ struct holds
+  coo_n - the number of pairs passed in
.  Atot  - the number of pairs kept (those with non-negative row and column index)
.  jmap  - array of length nnz+1; jmap[q]..jmap[q+1] delimits the entries of perm that map to the q-th unique nonzero
-  perm  - for each kept pair, in sorted order, its position in the caller's original COO arrays

   The matrix values are allocated zeroed.

   NOTE(review): rows and columns are not range-checked against M and N in this routine; row is used
   directly as an index into Ai -- confirm that callers guarantee valid indices.
*/
PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, const PetscInt coo_i[], const PetscInt coo_j[])
{
  MPI_Comm                  comm;
  PetscInt                  *i,*j;
  PetscInt                  M,N,row;
  PetscCount                k,p,q,nneg,nnz,start,end; /* Index the coo array, so use PetscCount as their type */
  PetscInt                  *Ai; /* Change to PetscCount once we use it for row pointers */
  PetscInt                  *Aj;
  PetscScalar               *Aa;
  Mat_SeqAIJ                *seqaij = (Mat_SeqAIJ*)(mat->data);
  MatType                   rtype;
  PetscCount                *perm,*jmap;

  PetscFunctionBegin;
  PetscCall(MatResetPreallocationCOO_SeqAIJ(mat));
  PetscCall(PetscObjectGetComm((PetscObject)mat,&comm)); /* comm is fetched here but not referenced again in this routine */
  PetscCall(MatGetSize(mat,&M,&N));
  PetscCall(PetscMalloc2(coo_n,&i,coo_n,&j));
  PetscCall(PetscArraycpy(i,coo_i,coo_n)); /* Make a copy since we'll modify it */
  PetscCall(PetscArraycpy(j,coo_j,coo_n));
  PetscCall(PetscMalloc1(coo_n,&perm));
  for (k=0; k<coo_n; k++) { /* Ignore entries with negative row or col indices */
    if (j[k] < 0) i[k] = -1; /* a negative column marks the row negative too, so the row sort below moves the entry to the front */
    perm[k] = k;             /* start from the identity permutation */
  }

  /* Sort by row */
  PetscCall(PetscSortIntWithIntCountArrayPair(coo_n,i,j,perm));
  for (k=0; k<coo_n; k++) {if (i[k] >= 0) break;} /* Advance k to the first row with a non-negative index */
  nneg = k; /* number of leading entries to be ignored */
  PetscCall(PetscMalloc1(coo_n-nneg+1,&jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
  nnz  = 0; /* Total number of unique nonzeros to be counted */
  jmap++; /* Inc jmap by 1 for convenience */

  PetscCall(PetscCalloc1(M+1,&Ai)); /* CSR of A */
  PetscCall(PetscMalloc1(coo_n-nneg,&Aj)); /* We have at most coo_n-nneg unique nonzeros */

  /* In each row, sort by column, then unique column indices to get row length */
  Ai++; /* Inc by 1 for convenience */
  q = 0; /* q-th unique nonzero, with q starting from 0 */
  while (k<coo_n) {
    row   = i[k];
    start = k; /* [start,end) indices for this row */
    while (k<coo_n && i[k] == row) k++;
    end   = k;
    PetscCall(PetscSortIntWithCountArray(end-start,j+start,perm+start));
    /* Find number of unique col entries in this row */
    Aj[q]   = j[start]; /* Log the first nonzero in this row */
    jmap[q] = 1; /* Number of repeats of this nonzero entry */
    Ai[row] = 1; /* Ai was shifted by one above, so this stores the row length in slot row+1 of the allocation */
    nnz++;

    for (p=start+1; p<end; p++) { /* Scan remaining nonzero in this row */
      if (j[p] != j[p-1]) { /* Meet a new nonzero */
        q++;
        jmap[q] = 1;
        Aj[q]   = j[p];
        Ai[row]++;
        nnz++;
      } else {
        jmap[q]++; /* same column as the previous entry: one more repeat of the current nonzero */
      }
    }
    q++; /* Move to next row and thus next unique nonzero */
  }
  PetscCall(PetscFree2(i,j));

  Ai--; /* Back to the beginning of Ai[] */
  for (k=0; k<M; k++) Ai[k+1] += Ai[k]; /* prefix sum turns row lengths into row pointers */
  jmap--; /* Back to the beginning of jmap[] */
  jmap[0] = 0;
  for (k=0; k<nnz; k++) jmap[k+1] += jmap[k]; /* prefix sum turns repeat counts into offsets into perm */
  if (nnz < coo_n-nneg) { /* Realloc with actual number of unique nonzeros */
    PetscCount *jmap_new;
    PetscInt   *Aj_new;

    PetscCall(PetscMalloc1(nnz+1,&jmap_new));
    PetscCall(PetscArraycpy(jmap_new,jmap,nnz+1));
    PetscCall(PetscFree(jmap));
    jmap = jmap_new;

    PetscCall(PetscMalloc1(nnz,&Aj_new));
    PetscCall(PetscArraycpy(Aj_new,Aj,nnz));
    PetscCall(PetscFree(Aj));
    Aj   = Aj_new;
  }

  if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
    PetscCount *perm_new;

    PetscCall(PetscMalloc1(coo_n-nneg,&perm_new));
    PetscCall(PetscArraycpy(perm_new,perm+nneg,coo_n-nneg));
    PetscCall(PetscFree(perm));
    perm = perm_new;
  }

  PetscCall(MatGetRootType_Private(mat,&rtype));
  PetscCall(PetscCalloc1(nnz,&Aa)); /* Zero the matrix */
  PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF,M,N,Ai,Aj,Aa,rtype,mat));

  seqaij->singlemalloc = PETSC_FALSE; /* Ai, Aj and Aa are not allocated in one big malloc */
  seqaij->free_a       = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
  /* Record COO fields */
  seqaij->coo_n        = coo_n;
  seqaij->Atot         = coo_n-nneg; /* Annz is seqaij->nz, so no need to record that again */
  seqaij->jmap         = jmap; /* of length nnz+1 */
  seqaij->perm         = perm;
  PetscFunctionReturn(0);
}
aseq->perm,*jmap = aseq->jmap; 4758394ed5ebSJunchao Zhang PetscScalar *Aa; 4759394ed5ebSJunchao Zhang 4760394ed5ebSJunchao Zhang PetscFunctionBegin; 47619566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArray(A,&Aa)); 4762394ed5ebSJunchao Zhang for (i=0; i<Annz; i++) { 4763b6c38306SJunchao Zhang PetscScalar sum = 0.0; 4764b6c38306SJunchao Zhang for (j=jmap[i]; j<jmap[i+1]; j++) sum += v[perm[j]]; 4765b6c38306SJunchao Zhang Aa[i] = (imode == INSERT_VALUES? 0.0 : Aa[i]) + sum; 4766394ed5ebSJunchao Zhang } 47679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArray(A,&Aa)); 4768394ed5ebSJunchao Zhang PetscFunctionReturn(0); 4769394ed5ebSJunchao Zhang } 4770394ed5ebSJunchao Zhang 477134b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 47725063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat,MatType,MatReuse,Mat*); 477302fe1965SBarry Smith #endif 47743d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 47755063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat,MatType,MatReuse,Mat*); 47763d0639e7SStefano Zampini #endif 477702fe1965SBarry Smith 47788cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B) 4779273d9f13SBarry Smith { 4780273d9f13SBarry Smith Mat_SeqAIJ *b; 478138baddfdSBarry Smith PetscMPIInt size; 4782273d9f13SBarry Smith 4783273d9f13SBarry Smith PetscFunctionBegin; 47849566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B),&size)); 47852c71b3e2SJacob Faibussowitsch PetscCheckFalse(size > 1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 4786273d9f13SBarry Smith 47879566063dSJacob Faibussowitsch PetscCall(PetscNewLog(B,&b)); 47882205254eSKarl Rupp 4789b0a32e0cSBarry Smith B->data = (void*)b; 47902205254eSKarl Rupp 47919566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps))); 4792071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = 
MatSetValues_SeqAIJ_SortedFull; 47932205254eSKarl Rupp 4794f4259b30SLisandro Dalcin b->row = NULL; 4795f4259b30SLisandro Dalcin b->col = NULL; 4796f4259b30SLisandro Dalcin b->icol = NULL; 4797b810aeb4SBarry Smith b->reallocs = 0; 479836db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4799f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4800416022c9SBarry Smith b->nonew = 0; 4801f4259b30SLisandro Dalcin b->diag = NULL; 4802f4259b30SLisandro Dalcin b->solve_work = NULL; 4803f4259b30SLisandro Dalcin B->spptr = NULL; 4804f4259b30SLisandro Dalcin b->saved_values = NULL; 4805f4259b30SLisandro Dalcin b->idiag = NULL; 4806f4259b30SLisandro Dalcin b->mdiag = NULL; 4807f4259b30SLisandro Dalcin b->ssor_work = NULL; 480871f1c65dSBarry Smith b->omega = 1.0; 480971f1c65dSBarry Smith b->fshift = 0.0; 481071f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4811bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4812a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 481317ab2063SBarry Smith 48149566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ)); 48158c778c55SBarry Smith 4816b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 48179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEnginePut_C",MatlabEnginePut_SeqAIJ)); 48189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEngineGet_C",MatlabEngineGet_SeqAIJ)); 4819b3866ffcSBarry Smith #endif 482017f1a0eaSHong Zhang 48219566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetColumnIndices_C",MatSeqAIJSetColumnIndices_SeqAIJ)); 48229566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqAIJ)); 48239566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqAIJ)); 48249566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsbaij_C",MatConvert_SeqAIJ_SeqSBAIJ)); 48259566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqbaij_C",MatConvert_SeqAIJ_SeqBAIJ)); 48269566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijperm_C",MatConvert_SeqAIJ_SeqAIJPERM)); 48279566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijsell_C",MatConvert_SeqAIJ_SeqAIJSELL)); 48289779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 48299566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijmkl_C",MatConvert_SeqAIJ_SeqAIJMKL)); 4830191b95cbSRichard Tran Mills #endif 483134b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 48329566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcusparse_C",MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 48339566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",MatProductSetFromOptions_SeqAIJ)); 48349566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaijcusparse_C",MatProductSetFromOptions_SeqAIJ)); 483502fe1965SBarry Smith #endif 48363d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 48379566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijkokkos_C",MatConvert_SeqAIJ_SeqAIJKokkos)); 48383d0639e7SStefano Zampini #endif 48399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C",MatConvert_SeqAIJ_SeqAIJCRL)); 4840af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 48419566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_elemental_C",MatConvert_SeqAIJ_Elemental)); 4842af8000cdSHong Zhang #endif 4843d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 48449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_scalapack_C",MatConvert_AIJ_ScaLAPACK)); 4845d24d4204SJose E. Roman #endif 484663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 48479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_hypre_C",MatConvert_AIJ_HYPRE)); 48489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",MatProductSetFromOptions_Transpose_AIJ_AIJ)); 484963c07aadSStefano Zampini #endif 48509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqdense_C",MatConvert_SeqAIJ_SeqDense)); 48519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsell_C",MatConvert_SeqAIJ_SeqSELL)); 48529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_is_C",MatConvert_XAIJ_IS)); 48539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatIsTranspose_C",MatIsTranspose_SeqAIJ)); 48549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatIsHermitianTranspose_C",MatIsTranspose_SeqAIJ)); 48559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",MatSeqAIJSetPreallocation_SeqAIJ)); 48569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatResetPreallocation_C",MatResetPreallocation_SeqAIJ)); 48579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C",MatSeqAIJSetPreallocationCSR_SeqAIJ)); 48589566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatReorderForNonzeroDiagonal_C",MatReorderForNonzeroDiagonal_SeqAIJ)); 48599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_is_seqaij_C",MatProductSetFromOptions_IS_XAIJ)); 48609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqaij_C",MatProductSetFromOptions_SeqDense_SeqAIJ)); 48619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaij_C",MatProductSetFromOptions_SeqAIJ)); 48629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJKron_C",MatSeqAIJKron_SeqAIJ)); 48639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetPreallocationCOO_C",MatSetPreallocationCOO_SeqAIJ)); 48649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B,"MatSetValuesCOO_C",MatSetValuesCOO_SeqAIJ)); 48659566063dSJacob Faibussowitsch PetscCall(MatCreate_SeqAIJ_Inode(B)); 48669566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ)); 48679566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 48683a40ed3dSBarry Smith PetscFunctionReturn(0); 486917ab2063SBarry Smith } 487017ab2063SBarry Smith 4871b24902e0SBarry Smith /* 4872b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 4873b24902e0SBarry Smith */ 4874ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 487517ab2063SBarry Smith { 48762a350339SBarry Smith Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data,*a = (Mat_SeqAIJ*)A->data; 4877071fcb05SBarry Smith PetscInt m = A->rmap->n,i; 487817ab2063SBarry Smith 48793a40ed3dSBarry Smith PetscFunctionBegin; 
48802c71b3e2SJacob Faibussowitsch PetscCheckFalse(!A->assembled && cpvalues!=MAT_DO_NOT_COPY_VALUES,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Cannot duplicate unassembled matrix"); 4881273d9f13SBarry Smith 4882d5f3da31SBarry Smith C->factortype = A->factortype; 4883f4259b30SLisandro Dalcin c->row = NULL; 4884f4259b30SLisandro Dalcin c->col = NULL; 4885f4259b30SLisandro Dalcin c->icol = NULL; 48866ad4291fSHong Zhang c->reallocs = 0; 488717ab2063SBarry Smith 488869272f91SPierre Jolivet C->assembled = A->assembled; 488969272f91SPierre Jolivet C->preallocated = A->preallocated; 489017ab2063SBarry Smith 489169272f91SPierre Jolivet if (A->preallocated) { 48929566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap,&C->rmap)); 48939566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap,&C->cmap)); 4894eec197d1SBarry Smith 48959566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&c->imax)); 48969566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->imax,a->imax,m*sizeof(PetscInt))); 48979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&c->ilen)); 48989566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->ilen,a->ilen,m*sizeof(PetscInt))); 48999566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C, 2*m*sizeof(PetscInt))); 490017ab2063SBarry Smith 490117ab2063SBarry Smith /* allocate the matrix space */ 4902f77e22a1SHong Zhang if (mallocmatspace) { 49039566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(a->i[m],&c->a,a->i[m],&c->j,m+1,&c->i)); 49049566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt))); 49052205254eSKarl Rupp 4906f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 49072205254eSKarl Rupp 49089566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i,a->i,m+1)); 490917ab2063SBarry Smith if (m > 0) { 49109566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->j,a->j,a->i[m])); 4911be6bf707SBarry Smith if (cpvalues 
== MAT_COPY_VALUES) { 49122e5835c6SStefano Zampini const PetscScalar *aa; 49132e5835c6SStefano Zampini 49149566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 49159566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a,aa,a->i[m])); 49169566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 4917be6bf707SBarry Smith } else { 49189566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a,a->i[m])); 491917ab2063SBarry Smith } 492008480c60SBarry Smith } 4921f77e22a1SHong Zhang } 492217ab2063SBarry Smith 49236ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4924416022c9SBarry Smith c->roworiented = a->roworiented; 4925416022c9SBarry Smith c->nonew = a->nonew; 4926416022c9SBarry Smith if (a->diag) { 49279566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m+1,&c->diag)); 49289566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(c->diag,a->diag,m*sizeof(PetscInt))); 49299566063dSJacob Faibussowitsch PetscCall(PetscLogObjectMemory((PetscObject)C,(m+1)*sizeof(PetscInt))); 4930071fcb05SBarry Smith } else c->diag = NULL; 49312205254eSKarl Rupp 4932f4259b30SLisandro Dalcin c->solve_work = NULL; 4933f4259b30SLisandro Dalcin c->saved_values = NULL; 4934f4259b30SLisandro Dalcin c->idiag = NULL; 4935f4259b30SLisandro Dalcin c->ssor_work = NULL; 4936a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4937e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4938e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 49396ad4291fSHong Zhang 4940893ad86cSHong Zhang c->rmax = a->rmax; 4941416022c9SBarry Smith c->nz = a->nz; 49428ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4943754ec7b1SSatish Balay 49446ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 49456ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4946cd6b891eSBarry Smith if (a->compressedrow.use) { 49476ad4291fSHong Zhang i = a->compressedrow.nrows; 49489566063dSJacob Faibussowitsch 
PetscCall(PetscMalloc2(i+1,&c->compressedrow.i,i,&c->compressedrow.rindex)); 49499566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.i,a->compressedrow.i,i+1)); 49509566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->compressedrow.rindex,a->compressedrow.rindex,i)); 495127ea64f8SHong Zhang } else { 495227ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 49530298fd71SBarry Smith c->compressedrow.i = NULL; 49540298fd71SBarry Smith c->compressedrow.rindex = NULL; 49556ad4291fSHong Zhang } 4956ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4957e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 49584846f1f5SKris Buschelman 49599566063dSJacob Faibussowitsch PetscCall(MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C)); 496069272f91SPierre Jolivet } 49619566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist)); 49623a40ed3dSBarry Smith PetscFunctionReturn(0); 496317ab2063SBarry Smith } 496417ab2063SBarry Smith 4965b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 4966b24902e0SBarry Smith { 4967b24902e0SBarry Smith PetscFunctionBegin; 49689566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A),B)); 49699566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n)); 4970cfd3f464SBarry Smith if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) { 49719566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(*B,A,A)); 4972cfd3f464SBarry Smith } 49739566063dSJacob Faibussowitsch PetscCall(MatSetType(*B,((PetscObject)A)->type_name)); 49749566063dSJacob Faibussowitsch PetscCall(MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE)); 4975b24902e0SBarry Smith PetscFunctionReturn(0); 4976b24902e0SBarry Smith } 4977b24902e0SBarry Smith 4978112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4979fbdbba38SShri Abhyankar { 
498052f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 498152f91c60SVaclav Hapla 498252f91c60SVaclav Hapla PetscFunctionBegin; 498352f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 498452f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 4985c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 49869566063dSJacob Faibussowitsch PetscCall(PetscViewerSetUp(viewer)); 49879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary)); 49889566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5)); 498952f91c60SVaclav Hapla if (isbinary) { 49909566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqAIJ_Binary(newMat,viewer)); 499152f91c60SVaclav Hapla } else if (ishdf5) { 499252f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 49939566063dSJacob Faibussowitsch PetscCall(MatLoad_AIJ_HDF5(newMat,viewer)); 499452f91c60SVaclav Hapla #else 499552f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 499652f91c60SVaclav Hapla #endif 499752f91c60SVaclav Hapla } else { 499898921bdaSJacob Faibussowitsch SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 499952f91c60SVaclav Hapla } 500052f91c60SVaclav Hapla PetscFunctionReturn(0); 500152f91c60SVaclav Hapla } 500252f91c60SVaclav Hapla 50033ea6fe3dSLisandro Dalcin PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 500452f91c60SVaclav Hapla { 50053ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ*)mat->data; 50063ea6fe3dSLisandro Dalcin PetscInt header[4],*rowlens,M,N,nz,sum,rows,cols,i; 5007fbdbba38SShri Abhyankar 5008fbdbba38SShri Abhyankar PetscFunctionBegin; 50099566063dSJacob Faibussowitsch 
PetscCall(PetscViewerSetUp(viewer)); 5010bbead8a2SBarry Smith 50113ea6fe3dSLisandro Dalcin /* read in matrix header */ 50129566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT)); 50132c71b3e2SJacob Faibussowitsch PetscCheckFalse(header[0] != MAT_FILE_CLASSID,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file"); 5014fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 50152c71b3e2SJacob Faibussowitsch PetscCheckFalse(M < 0,PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%" PetscInt_FMT ") in file is negative",M); 50162c71b3e2SJacob Faibussowitsch PetscCheckFalse(N < 0,PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%" PetscInt_FMT ") in file is negative",N); 50172c71b3e2SJacob Faibussowitsch PetscCheckFalse(nz < 0,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk, cannot load as SeqAIJ"); 5018fbdbba38SShri Abhyankar 50193ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 50209566063dSJacob Faibussowitsch PetscCall(MatLoad_Binary_BlockSizes(mat,viewer)); 50213ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 50223ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 50233ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 50243ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 50253ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 50269566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->rmap)); 50279566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(mat->cmap)); 50283ea6fe3dSLisandro Dalcin 50293ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 50309566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&rows,&cols)); 50312c71b3e2SJacob Faibussowitsch PetscCheckFalse(M != rows || N != cols,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different 
sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")",M,N,rows,cols); 50323ea6fe3dSLisandro Dalcin 5033fbdbba38SShri Abhyankar /* read in row lengths */ 50349566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(M,&rowlens)); 50359566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,rowlens,M,NULL,PETSC_INT)); 50363ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 50373ea6fe3dSLisandro Dalcin sum = 0; for (i=0; i<M; i++) sum += rowlens[i]; 50382c71b3e2SJacob Faibussowitsch PetscCheckFalse(sum != nz,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT,nz,sum); 50393ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 50409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat,0,rowlens)); 50419566063dSJacob Faibussowitsch PetscCall(MatGetSize(mat,&rows,&cols)); 50422c71b3e2SJacob Faibussowitsch PetscCheckFalse(M != rows || N != cols,PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")",M,N,rows,cols); 50433ea6fe3dSLisandro Dalcin /* store row lengths */ 50449566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->ilen,rowlens,M)); 50459566063dSJacob Faibussowitsch PetscCall(PetscFree(rowlens)); 5046fbdbba38SShri Abhyankar 50473ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 50483ea6fe3dSLisandro Dalcin a->i[0] = 0; for (i=0; i<M; i++) a->i[i+1] = a->i[i] + a->ilen[i]; 50493ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 50509566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,a->j,nz,NULL,PETSC_INT)); 50513ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 50529566063dSJacob Faibussowitsch PetscCall(PetscViewerBinaryRead(viewer,a->a,nz,NULL,PETSC_SCALAR)); 5053fbdbba38SShri Abhyankar 50549566063dSJacob 
Faibussowitsch PetscCall(MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY)); 50559566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY)); 5056fbdbba38SShri Abhyankar PetscFunctionReturn(0); 5057fbdbba38SShri Abhyankar } 5058fbdbba38SShri Abhyankar 5059ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 50607264ac53SSatish Balay { 50617264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*b = (Mat_SeqAIJ*)B->data; 5062fff043a9SJunchao Zhang const PetscScalar *aa,*ba; 5063eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5064eeffb40dSHong Zhang PetscInt k; 5065eeffb40dSHong Zhang #endif 50667264ac53SSatish Balay 50673a40ed3dSBarry Smith PetscFunctionBegin; 5068bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 5069d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 5070ca44d042SBarry Smith *flg = PETSC_FALSE; 5071ca44d042SBarry Smith PetscFunctionReturn(0); 5072bcd2baecSBarry Smith } 50737264ac53SSatish Balay 50747264ac53SSatish Balay /* if the a->i are the same */ 50759566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->i,b->i,A->rmap->n+1,flg)); 5076abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 50777264ac53SSatish Balay 50787264ac53SSatish Balay /* if a->j are the same */ 50799566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(a->j,b->j,a->nz,flg)); 5080abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 5081bcd2baecSBarry Smith 50829566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(A,&aa)); 50839566063dSJacob Faibussowitsch PetscCall(MatSeqAIJGetArrayRead(B,&ba)); 5084bcd2baecSBarry Smith /* if a->a are the same */ 5085eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 5086eeffb40dSHong Zhang for (k=0; k<a->nz; k++) { 5087fff043a9SJunchao Zhang if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) { 5088eeffb40dSHong Zhang *flg = PETSC_FALSE; 
50893a40ed3dSBarry Smith PetscFunctionReturn(0); 5090eeffb40dSHong Zhang } 5091eeffb40dSHong Zhang } 5092eeffb40dSHong Zhang #else 50939566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aa,ba,a->nz,flg)); 5094eeffb40dSHong Zhang #endif 50959566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(A,&aa)); 50969566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRestoreArrayRead(B,&ba)); 5097eeffb40dSHong Zhang PetscFunctionReturn(0); 50987264ac53SSatish Balay } 509936db0b34SBarry Smith 510005869f15SSatish Balay /*@ 510136db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 510236db0b34SBarry Smith provided by the user. 510336db0b34SBarry Smith 5104d083f849SBarry Smith Collective 510536db0b34SBarry Smith 510636db0b34SBarry Smith Input Parameters: 510736db0b34SBarry Smith + comm - must be an MPI communicator of size 1 510836db0b34SBarry Smith . m - number of rows 510936db0b34SBarry Smith . n - number of columns 5110483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 511136db0b34SBarry Smith . j - column indices 511236db0b34SBarry Smith - a - matrix values 511336db0b34SBarry Smith 511436db0b34SBarry Smith Output Parameter: 511536db0b34SBarry Smith . mat - the matrix 511636db0b34SBarry Smith 511736db0b34SBarry Smith Level: intermediate 511836db0b34SBarry Smith 511936db0b34SBarry Smith Notes: 51200551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 5121292fb18eSBarry Smith once the matrix is destroyed and not before 512236db0b34SBarry Smith 512336db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 
512436db0b34SBarry Smith 5125bfeeae90SHong Zhang The i and j indices are 0 based 512636db0b34SBarry Smith 5127a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 5128a4552177SSatish Balay row-major ordering.. i.e for the following matrix, the input data expected is 51298eef79e4SBarry Smith as shown 5130a4552177SSatish Balay 51318eef79e4SBarry Smith $ 1 0 0 51328eef79e4SBarry Smith $ 2 0 3 51338eef79e4SBarry Smith $ 4 5 6 51348eef79e4SBarry Smith $ 51358eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 51368eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 51378eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 5138a4552177SSatish Balay 513969b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateMPIAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 514036db0b34SBarry Smith 514136db0b34SBarry Smith @*/ 5142c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat) 514336db0b34SBarry Smith { 5144cbcfb4deSHong Zhang PetscInt ii; 514536db0b34SBarry Smith Mat_SeqAIJ *aij; 5146cbcfb4deSHong Zhang PetscInt jj; 514736db0b34SBarry Smith 514836db0b34SBarry Smith PetscFunctionBegin; 51492c71b3e2SJacob Faibussowitsch PetscCheckFalse(m > 0 && i[0],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 51509566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,mat)); 51519566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat,m,n,m,n)); 51529566063dSJacob Faibussowitsch /* PetscCall(MatSetBlockSizes(*mat,,)); */ 51539566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat,MATSEQAIJ)); 51549566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,NULL)); 5155ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 51569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m,&aij->imax)); 51579566063dSJacob 
Faibussowitsch PetscCall(PetscMalloc1(m,&aij->ilen)); 5158ab93d7beSBarry Smith 515936db0b34SBarry Smith aij->i = i; 516036db0b34SBarry Smith aij->j = j; 516136db0b34SBarry Smith aij->a = a; 516236db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 516336db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 5164e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 5165e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 516636db0b34SBarry Smith 5167cbc6b225SStefano Zampini for (ii=0,aij->nonzerorowcnt=0,aij->rmax=0; ii<m; ii++) { 516836db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 516976bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 51702c71b3e2SJacob Faibussowitsch PetscCheckFalse(i[ii+1] - i[ii] < 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT,ii,i[ii+1] - i[ii]); 51719985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 51722c71b3e2SJacob Faibussowitsch PetscCheckFalse(j[jj] < j[jj-1],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted",jj-i[ii],j[jj],ii); 51732c71b3e2SJacob Faibussowitsch PetscCheckFalse(j[jj] == j[jj-1],PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry",jj-i[ii],j[jj],ii); 51749985e31cSBarry Smith } 517536db0b34SBarry Smith } 517676bd3646SJed Brown } 517776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 517836db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 51792c71b3e2SJacob Faibussowitsch PetscCheckFalse(j[ii] < 0,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT,ii,j[ii]); 51802c71b3e2SJacob Faibussowitsch PetscCheckFalse(j[ii] > n - 
1,PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT,ii,j[ii]); 518136db0b34SBarry Smith } 518276bd3646SJed Brown } 518336db0b34SBarry Smith 51849566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY)); 51859566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY)); 518636db0b34SBarry Smith PetscFunctionReturn(0); 518736db0b34SBarry Smith } 5188cbc6b225SStefano Zampini 518980ef6e79SMatthew G Knepley /*@C 5190d021a1c5SVictor Minden MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format) 51918a0b0e6bSVictor Minden provided by the user. 51928a0b0e6bSVictor Minden 5193d083f849SBarry Smith Collective 51948a0b0e6bSVictor Minden 51958a0b0e6bSVictor Minden Input Parameters: 51968a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 51978a0b0e6bSVictor Minden . m - number of rows 51988a0b0e6bSVictor Minden . n - number of columns 51998a0b0e6bSVictor Minden . i - row indices 52008a0b0e6bSVictor Minden . j - column indices 52011230e6d1SVictor Minden . a - matrix values 52021230e6d1SVictor Minden . nz - number of nonzeros 52031230e6d1SVictor Minden - idx - 0 or 1 based 52048a0b0e6bSVictor Minden 52058a0b0e6bSVictor Minden Output Parameter: 52068a0b0e6bSVictor Minden . mat - the matrix 52078a0b0e6bSVictor Minden 52088a0b0e6bSVictor Minden Level: intermediate 52098a0b0e6bSVictor Minden 52108a0b0e6bSVictor Minden Notes: 52119e99939fSJunchao Zhang The i and j indices are 0 based. The format which is used for the sparse matrix input, is equivalent to a row-major ordering. 
i.e for the following matrix, 52129e99939fSJunchao Zhang the input data expected is as shown 52139e99939fSJunchao Zhang .vb 52148a0b0e6bSVictor Minden 1 0 0 52158a0b0e6bSVictor Minden 2 0 3 52168a0b0e6bSVictor Minden 4 5 6 52178a0b0e6bSVictor Minden 52188a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 52198a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 52208a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 52219e99939fSJunchao Zhang .ve 52228a0b0e6bSVictor Minden 522369b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateSeqAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 52248a0b0e6bSVictor Minden 52258a0b0e6bSVictor Minden @*/ 5226c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat,PetscInt nz,PetscBool idx) 52278a0b0e6bSVictor Minden { 5228d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1,row,col; 52298a0b0e6bSVictor Minden 52308a0b0e6bSVictor Minden PetscFunctionBegin; 52319566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(m,&nnz)); 52321230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 5233c8d679ebSHong Zhang nnz[i[ii] - !!idx] += 1; 52341230e6d1SVictor Minden } 52359566063dSJacob Faibussowitsch PetscCall(MatCreate(comm,mat)); 52369566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat,m,n,m,n)); 52379566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat,MATSEQAIJ)); 52389566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz)); 52391230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 52401230e6d1SVictor Minden if (idx) { 52411230e6d1SVictor Minden row = i[ii] - 1; 52421230e6d1SVictor Minden col = j[ii] - 1; 52431230e6d1SVictor Minden } else { 52441230e6d1SVictor Minden row = i[ii]; 52451230e6d1SVictor Minden col = j[ii]; 52468a0b0e6bSVictor Minden } 52479566063dSJacob Faibussowitsch PetscCall(MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES)); 52488a0b0e6bSVictor Minden } 52499566063dSJacob Faibussowitsch 
PetscCall(MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY)); 52509566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY)); 52519566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 52528a0b0e6bSVictor Minden PetscFunctionReturn(0); 52538a0b0e6bSVictor Minden } 525436db0b34SBarry Smith 5255acf2f550SJed Brown PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 5256acf2f550SJed Brown { 5257acf2f550SJed Brown Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data; 5258acf2f550SJed Brown 5259acf2f550SJed Brown PetscFunctionBegin; 5260acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 5261acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 52622205254eSKarl Rupp 52639566063dSJacob Faibussowitsch PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A)); 5264acf2f550SJed Brown PetscFunctionReturn(0); 5265acf2f550SJed Brown } 5266acf2f550SJed Brown 52679c8f2541SHong Zhang PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 52689c8f2541SHong Zhang { 52698761c3d6SHong Zhang PetscMPIInt size; 52709c8f2541SHong Zhang 52719c8f2541SHong Zhang PetscFunctionBegin; 52729566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(comm,&size)); 52737bbdc51dSHong Zhang if (size == 1) { 52747bbdc51dSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 52759566063dSJacob Faibussowitsch PetscCall(MatDuplicate(inmat,MAT_COPY_VALUES,outmat)); 52767bbdc51dSHong Zhang } else { 52779566063dSJacob Faibussowitsch PetscCall(MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN)); 52787bbdc51dSHong Zhang } 52798761c3d6SHong Zhang } else { 52809566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm,inmat,n,scall,outmat)); 52818761c3d6SHong Zhang } 52829c8f2541SHong Zhang PetscFunctionReturn(0); 52839c8f2541SHong Zhang } 52849c8f2541SHong Zhang 528581824310SBarry Smith /* 528653dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 
528753dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 528853dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 528953dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 529053dd7562SDmitry Karpeev */ 529153dd7562SDmitry Karpeev PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B) 529253dd7562SDmitry Karpeev { 529353dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 529453dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 529553dd7562SDmitry Karpeev PetscBool seqaij; 529653dd7562SDmitry Karpeev PetscInt m,n,*nz,i,j,count; 529753dd7562SDmitry Karpeev PetscScalar v; 529853dd7562SDmitry Karpeev const PetscInt *rowindices,*colindices; 529953dd7562SDmitry Karpeev 530053dd7562SDmitry Karpeev PetscFunctionBegin; 530153dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 530253dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 53039566063dSJacob Faibussowitsch PetscCall(PetscObjectBaseTypeCompare((PetscObject)B,MATSEQAIJ,&seqaij)); 530428b400f6SJacob Faibussowitsch PetscCheck(seqaij,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is of wrong type"); 530553dd7562SDmitry Karpeev if (rowemb) { 53069566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(rowemb,&m)); 53072c71b3e2SJacob Faibussowitsch PetscCheckFalse(m != B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT,m,B->rmap->n); 530853dd7562SDmitry Karpeev } else { 53092c71b3e2SJacob Faibussowitsch PetscCheckFalse(C->rmap->n != B->rmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is row-incompatible with the target matrix"); 531053dd7562SDmitry Karpeev } 531153dd7562SDmitry Karpeev if (colemb) { 53129566063dSJacob Faibussowitsch PetscCall(ISGetLocalSize(colemb,&n)); 53132c71b3e2SJacob Faibussowitsch PetscCheckFalse(n != B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT,n,B->cmap->n); 531453dd7562SDmitry Karpeev } else { 53152c71b3e2SJacob Faibussowitsch PetscCheckFalse(C->cmap->n != B->cmap->n,PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is col-incompatible with the target matrix"); 531653dd7562SDmitry Karpeev } 531753dd7562SDmitry Karpeev 531853dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ*)(B->data); 531953dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 53209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(B->rmap->n,&nz)); 532153dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 532253dd7562SDmitry Karpeev nz[i] = Baij->i[i+1] - Baij->i[i]; 532353dd7562SDmitry Karpeev } 53249566063dSJacob Faibussowitsch PetscCall(MatSeqAIJSetPreallocation(C,0,nz)); 53259566063dSJacob Faibussowitsch PetscCall(PetscFree(nz)); 532653dd7562SDmitry Karpeev } 532753dd7562SDmitry Karpeev if (pattern == SUBSET_NONZERO_PATTERN) { 53289566063dSJacob Faibussowitsch 
PetscCall(MatZeroEntries(C)); 532953dd7562SDmitry Karpeev } 533053dd7562SDmitry Karpeev count = 0; 533153dd7562SDmitry Karpeev rowindices = NULL; 533253dd7562SDmitry Karpeev colindices = NULL; 533353dd7562SDmitry Karpeev if (rowemb) { 53349566063dSJacob Faibussowitsch PetscCall(ISGetIndices(rowemb,&rowindices)); 533553dd7562SDmitry Karpeev } 533653dd7562SDmitry Karpeev if (colemb) { 53379566063dSJacob Faibussowitsch PetscCall(ISGetIndices(colemb,&colindices)); 533853dd7562SDmitry Karpeev } 533953dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 534053dd7562SDmitry Karpeev PetscInt row; 534153dd7562SDmitry Karpeev row = i; 534253dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 534353dd7562SDmitry Karpeev for (j=Baij->i[i]; j<Baij->i[i+1]; j++) { 534453dd7562SDmitry Karpeev PetscInt col; 534553dd7562SDmitry Karpeev col = Baij->j[count]; 534653dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 534753dd7562SDmitry Karpeev v = Baij->a[count]; 53489566063dSJacob Faibussowitsch PetscCall(MatSetValues(C,1,&row,1,&col,&v,INSERT_VALUES)); 534953dd7562SDmitry Karpeev ++count; 535053dd7562SDmitry Karpeev } 535153dd7562SDmitry Karpeev } 535253dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 535353dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 535453dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 535553dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 535653dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 535753dd7562SDmitry Karpeev PetscFunctionReturn(0); 535853dd7562SDmitry Karpeev } 535953dd7562SDmitry Karpeev 53604099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 53614099cc6bSBarry Smith 53624099cc6bSBarry Smith /*@C 53634099cc6bSBarry Smith MatSeqAIJSetType - Converts a MATSEQAIJ matrix to a subtype 53644099cc6bSBarry Smith 53654099cc6bSBarry Smith Collective on Mat 53664099cc6bSBarry Smith 53674099cc6bSBarry Smith Input Parameters: 53684099cc6bSBarry Smith + mat - the matrix object 53694099cc6bSBarry Smith - matype - matrix type 53704099cc6bSBarry Smith 53714099cc6bSBarry Smith Options Database Key: 53724099cc6bSBarry Smith . -mat_seqai_type <method> - for example seqaijcrl 53734099cc6bSBarry Smith 53744099cc6bSBarry Smith Level: intermediate 53754099cc6bSBarry Smith 53764099cc6bSBarry Smith .seealso: PCSetType(), VecSetType(), MatCreate(), MatType, Mat 53774099cc6bSBarry Smith @*/ 53784099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 53794099cc6bSBarry Smith { 53804099cc6bSBarry Smith PetscBool sametype; 53815f80ce2aSJacob Faibussowitsch PetscErrorCode (*r)(Mat,MatType,MatReuse,Mat*); 53824099cc6bSBarry Smith 53834099cc6bSBarry Smith PetscFunctionBegin; 53844099cc6bSBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 53859566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)mat,matype,&sametype)); 53864099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 53874099cc6bSBarry Smith 53889566063dSJacob Faibussowitsch PetscCall(PetscFunctionListFind(MatSeqAIJList,matype,&r)); 53895f80ce2aSJacob Faibussowitsch PetscCheck(r,PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown Mat type given: %s",matype); 53909566063dSJacob Faibussowitsch PetscCall((*r)(mat,matype,MAT_INPLACE_MATRIX,&mat)); 53914099cc6bSBarry Smith 
PetscFunctionReturn(0); 53924099cc6bSBarry Smith } 53934099cc6bSBarry Smith 53944099cc6bSBarry Smith /*@C 53954099cc6bSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential AIJ matrices 53964099cc6bSBarry Smith 53974099cc6bSBarry Smith Not Collective 53984099cc6bSBarry Smith 53994099cc6bSBarry Smith Input Parameters: 54004099cc6bSBarry Smith + name - name of a new user-defined matrix type, for example MATSEQAIJCRL 54014099cc6bSBarry Smith - function - routine to convert to subtype 54024099cc6bSBarry Smith 54034099cc6bSBarry Smith Notes: 54044099cc6bSBarry Smith MatSeqAIJRegister() may be called multiple times to add several user-defined solvers. 54054099cc6bSBarry Smith 54064099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 54074099cc6bSBarry Smith $ -mat_seqaij_type my_mat 54084099cc6bSBarry Smith 54094099cc6bSBarry Smith Level: advanced 54104099cc6bSBarry Smith 54114099cc6bSBarry Smith .seealso: MatSeqAIJRegisterAll() 54124099cc6bSBarry Smith 54134099cc6bSBarry Smith Level: advanced 54144099cc6bSBarry Smith @*/ 5415388d47a6SSatish Balay PetscErrorCode MatSeqAIJRegister(const char sname[],PetscErrorCode (*function)(Mat,MatType,MatReuse,Mat *)) 54164099cc6bSBarry Smith { 54174099cc6bSBarry Smith PetscFunctionBegin; 54189566063dSJacob Faibussowitsch PetscCall(MatInitializePackage()); 54199566063dSJacob Faibussowitsch PetscCall(PetscFunctionListAdd(&MatSeqAIJList,sname,function)); 54204099cc6bSBarry Smith PetscFunctionReturn(0); 54214099cc6bSBarry Smith } 54224099cc6bSBarry Smith 54234099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 54244099cc6bSBarry Smith 54254099cc6bSBarry Smith /*@C 54264099cc6bSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of SeqAIJ 54274099cc6bSBarry Smith 54284099cc6bSBarry Smith Not Collective 54294099cc6bSBarry Smith 54304099cc6bSBarry Smith Level: advanced 54314099cc6bSBarry Smith 54324099cc6bSBarry Smith 
.seealso: MatRegisterAll(), MatSeqAIJRegister() 54334099cc6bSBarry Smith @*/ 54344099cc6bSBarry Smith PetscErrorCode MatSeqAIJRegisterAll(void) 54354099cc6bSBarry Smith { 54364099cc6bSBarry Smith PetscFunctionBegin; 54374099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 54384099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 54394099cc6bSBarry Smith 54409566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL)); 54419566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM)); 54429566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL)); 54439779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 54449566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL)); 5445485f9817SRichard Tran Mills #endif 54465063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA) 54479566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE)); 54485063d097SStefano Zampini #endif 54495063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS) 54509566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos)); 54515063d097SStefano Zampini #endif 54524099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 54539566063dSJacob Faibussowitsch PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL)); 54544099cc6bSBarry Smith #endif 54554099cc6bSBarry Smith PetscFunctionReturn(0); 54564099cc6bSBarry Smith } 545753dd7562SDmitry Karpeev 545853dd7562SDmitry Karpeev /* 545981824310SBarry Smith Special version for direct calls from Fortran 546081824310SBarry Smith */ 5461af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 546281824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 546381824310SBarry Smith #define 
matsetvaluesseqaij_ MATSETVALUESSEQAIJ 546481824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 546581824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 546681824310SBarry Smith #endif 546781824310SBarry Smith 546881824310SBarry Smith /* Change these macros so can be used in void function */ 546998921bdaSJacob Faibussowitsch 547098921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */ 54719566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */ 54729566063dSJacob Faibussowitsch #undef PetscCall 54739566063dSJacob Faibussowitsch #define PetscCall(...) do { \ 54745f80ce2aSJacob Faibussowitsch PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \ 547598921bdaSJacob Faibussowitsch if (PetscUnlikely(ierr_msv_mpiaij)) { \ 547698921bdaSJacob Faibussowitsch *_ierr = PetscError(PETSC_COMM_SELF,__LINE__,PETSC_FUNCTION_NAME,__FILE__,ierr_msv_mpiaij,PETSC_ERROR_REPEAT," "); \ 547798921bdaSJacob Faibussowitsch return; \ 547898921bdaSJacob Faibussowitsch } \ 547998921bdaSJacob Faibussowitsch } while (0) 548098921bdaSJacob Faibussowitsch 548198921bdaSJacob Faibussowitsch #undef SETERRQ 548298921bdaSJacob Faibussowitsch #define SETERRQ(comm,ierr,...) 
do { \ 548398921bdaSJacob Faibussowitsch *_ierr = PetscError(comm,__LINE__,PETSC_FUNCTION_NAME,__FILE__,ierr,PETSC_ERROR_INITIAL,__VA_ARGS__); \ 548498921bdaSJacob Faibussowitsch return; \ 548598921bdaSJacob Faibussowitsch } while (0) 548681824310SBarry Smith 548719caf8f3SSatish Balay PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 548881824310SBarry Smith { 548981824310SBarry Smith Mat A = *AA; 549081824310SBarry Smith PetscInt m = *mm, n = *nn; 549181824310SBarry Smith InsertMode is = *isis; 549281824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 549381824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 549481824310SBarry Smith PetscInt *imax,*ai,*ailen; 549581824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 549654f21887SBarry Smith MatScalar *ap,value,*aa; 5497ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5498ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 549981824310SBarry Smith 550081824310SBarry Smith PetscFunctionBegin; 55014994cf47SJed Brown MatCheckPreallocated(A,1); 550281824310SBarry Smith imax = a->imax; 550381824310SBarry Smith ai = a->i; 550481824310SBarry Smith ailen = a->ilen; 550581824310SBarry Smith aj = a->j; 550681824310SBarry Smith aa = a->a; 550781824310SBarry Smith 550881824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 550981824310SBarry Smith row = im[k]; 551081824310SBarry Smith if (row < 0) continue; 55115f80ce2aSJacob Faibussowitsch PetscCheck(row < A->rmap->n,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 551281824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 551381824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 551481824310SBarry Smith low = 0; 551581824310SBarry Smith high = nrow; 551681824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 
551781824310SBarry Smith if (in[l] < 0) continue; 55185f80ce2aSJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 551981824310SBarry Smith col = in[l]; 55202205254eSKarl Rupp if (roworiented) value = v[l + k*n]; 55212205254eSKarl Rupp else value = v[k + l*m]; 55222205254eSKarl Rupp 552381824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 552481824310SBarry Smith 55252205254eSKarl Rupp if (col <= lastcol) low = 0; 55262205254eSKarl Rupp else high = nrow; 552781824310SBarry Smith lastcol = col; 552881824310SBarry Smith while (high-low > 5) { 552981824310SBarry Smith t = (low+high)/2; 553081824310SBarry Smith if (rp[t] > col) high = t; 553181824310SBarry Smith else low = t; 553281824310SBarry Smith } 553381824310SBarry Smith for (i=low; i<high; i++) { 553481824310SBarry Smith if (rp[i] > col) break; 553581824310SBarry Smith if (rp[i] == col) { 553681824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 553781824310SBarry Smith else ap[i] = value; 553881824310SBarry Smith goto noinsert; 553981824310SBarry Smith } 554081824310SBarry Smith } 554181824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 554281824310SBarry Smith if (nonew == 1) goto noinsert; 55435f80ce2aSJacob Faibussowitsch PetscCheck(nonew != -1,PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 5544fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 554581824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 554681824310SBarry Smith /* shift up all the later entries in this row */ 554781824310SBarry Smith for (ii=N; ii>=i; ii--) { 554881824310SBarry Smith rp[ii+1] = rp[ii]; 554981824310SBarry Smith ap[ii+1] = ap[ii]; 555081824310SBarry Smith } 555181824310SBarry Smith rp[i] = col; 555281824310SBarry Smith ap[i] = value; 5553e56f5c9eSBarry Smith 
A->nonzerostate++; 555481824310SBarry Smith noinsert:; 555581824310SBarry Smith low = i + 1; 555681824310SBarry Smith } 555781824310SBarry Smith ailen[row] = nrow; 555881824310SBarry Smith } 555981824310SBarry Smith PetscFunctionReturnVoid(); 556081824310SBarry Smith } 556198921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No 556298921bdaSJacob Faibussowitsch * other PETSc functions should be defined past this point, as it is impossible to recover the 556398921bdaSJacob Faibussowitsch * original definitions */ 55649566063dSJacob Faibussowitsch #undef PetscCall 556598921bdaSJacob Faibussowitsch #undef SETERRQ 5566