1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 67c4f633dSBarry Smith 7c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 8c6db04a5SJed Brown #include <petscblaslapack.h> 9c6db04a5SJed Brown #include <petscbt.h> 10af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 110716a85fSBarry Smith 124099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 134099cc6bSBarry Smith { 144099cc6bSBarry Smith PetscErrorCode ierr; 154099cc6bSBarry Smith PetscBool flg; 164099cc6bSBarry Smith char type[256]; 174099cc6bSBarry Smith 184099cc6bSBarry Smith PetscFunctionBegin; 194099cc6bSBarry Smith ierr = PetscObjectOptionsBegin((PetscObject)A); 204099cc6bSBarry Smith ierr = PetscOptionsFList("-mat_seqaij_type","Matrix SeqAIJ type","MatSeqAIJSetType",MatSeqAIJList,"seqaij",type,256,&flg);CHKERRQ(ierr); 214099cc6bSBarry Smith if (flg) { 224099cc6bSBarry Smith ierr = MatSeqAIJSetType(A,type);CHKERRQ(ierr); 234099cc6bSBarry Smith } 244099cc6bSBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 254099cc6bSBarry Smith PetscFunctionReturn(0); 264099cc6bSBarry Smith } 274099cc6bSBarry Smith 280716a85fSBarry Smith PetscErrorCode MatGetColumnNorms_SeqAIJ(Mat A,NormType type,PetscReal *norms) 290716a85fSBarry Smith { 300716a85fSBarry Smith PetscErrorCode ierr; 310716a85fSBarry Smith PetscInt i,m,n; 320716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 330716a85fSBarry Smith 340716a85fSBarry Smith PetscFunctionBegin; 350716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 36580bdb30SBarry Smith ierr = PetscArrayzero(norms,n);CHKERRQ(ierr); 370716a85fSBarry Smith if (type == NORM_2) { 380716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 390716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 400716a85fSBarry Smith } 410716a85fSBarry Smith } 
else if (type == NORM_1) { 420716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 430716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } 450716a85fSBarry Smith } else if (type == NORM_INFINITY) { 460716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 470716a85fSBarry Smith norms[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),norms[aij->j[i]]); 480716a85fSBarry Smith } 490716a85fSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown NormType"); 500716a85fSBarry Smith 510716a85fSBarry Smith if (type == NORM_2) { 528f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 530716a85fSBarry Smith } 540716a85fSBarry Smith PetscFunctionReturn(0); 550716a85fSBarry Smith } 560716a85fSBarry Smith 573a062f41SBarry Smith PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS *is) 583a062f41SBarry Smith { 593a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 603a062f41SBarry Smith PetscInt i,m=A->rmap->n,cnt = 0, bs = A->rmap->bs; 613a062f41SBarry Smith const PetscInt *jj = a->j,*ii = a->i; 623a062f41SBarry Smith PetscInt *rows; 633a062f41SBarry Smith PetscErrorCode ierr; 643a062f41SBarry Smith 653a062f41SBarry Smith PetscFunctionBegin; 663a062f41SBarry Smith for (i=0; i<m; i++) { 673a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 683a062f41SBarry Smith cnt++; 693a062f41SBarry Smith } 703a062f41SBarry Smith } 713a062f41SBarry Smith ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i=0; i<m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 793a062f41SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,is);CHKERRQ(ierr); 803a062f41SBarry Smith 
PetscFunctionReturn(0); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt *nrows,PetscInt **zrows) 846ce1633cSBarry Smith { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 866ce1633cSBarry Smith const MatScalar *aa = a->a; 876ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i,*jj = a->j,*diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith PetscErrorCode ierr; 916ce1633cSBarry Smith 926ce1633cSBarry Smith PetscFunctionBegin; 936ce1633cSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i=0; i<m; i++) { 96b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 976ce1633cSBarry Smith cnt++; 986ce1633cSBarry Smith } 996ce1633cSBarry Smith } 100785e854fSJed Brown ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr); 1016ce1633cSBarry Smith cnt = 0; 1026ce1633cSBarry Smith for (i=0; i<m; i++) { 103b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1046ce1633cSBarry Smith rows[cnt++] = i; 1056ce1633cSBarry Smith } 1066ce1633cSBarry Smith } 107f1f41ecbSJed Brown *nrows = cnt; 108f1f41ecbSJed Brown *zrows = rows; 109f1f41ecbSJed Brown PetscFunctionReturn(0); 110f1f41ecbSJed Brown } 111f1f41ecbSJed Brown 112f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 113f1f41ecbSJed Brown { 114f1f41ecbSJed Brown PetscInt nrows,*rows; 115f1f41ecbSJed Brown PetscErrorCode ierr; 116f1f41ecbSJed Brown 117f1f41ecbSJed Brown PetscFunctionBegin; 1180298fd71SBarry Smith *zrows = NULL; 119f1f41ecbSJed Brown ierr = MatFindZeroDiagonals_SeqAIJ_Private(A,&nrows,&rows);CHKERRQ(ierr); 120ce94432eSBarry Smith ierr = ISCreateGeneral(PetscObjectComm((PetscObject)A),nrows,rows,PETSC_OWN_POINTER,zrows);CHKERRQ(ierr); 1216ce1633cSBarry Smith 
PetscFunctionReturn(0); 1226ce1633cSBarry Smith } 1236ce1633cSBarry Smith 124b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 125b3a44c85SBarry Smith { 126b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 127b3a44c85SBarry Smith const MatScalar *aa; 128b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 129b3a44c85SBarry Smith const PetscInt *ii; 130b3a44c85SBarry Smith PetscInt n,i,j,*rows; 131b3a44c85SBarry Smith PetscErrorCode ierr; 132b3a44c85SBarry Smith 133b3a44c85SBarry Smith PetscFunctionBegin; 134b3a44c85SBarry Smith *keptrows = 0; 135b3a44c85SBarry Smith ii = a->i; 136b3a44c85SBarry Smith for (i=0; i<m; i++) { 137b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 138b3a44c85SBarry Smith if (!n) { 139b3a44c85SBarry Smith cnt++; 140b3a44c85SBarry Smith goto ok1; 141b3a44c85SBarry Smith } 142b3a44c85SBarry Smith aa = a->a + ii[i]; 143b3a44c85SBarry Smith for (j=0; j<n; j++) { 144b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 145b3a44c85SBarry Smith } 146b3a44c85SBarry Smith cnt++; 147b3a44c85SBarry Smith ok1:; 148b3a44c85SBarry Smith } 149b3a44c85SBarry Smith if (!cnt) PetscFunctionReturn(0); 150854ce69bSBarry Smith ierr = PetscMalloc1(A->rmap->n-cnt,&rows);CHKERRQ(ierr); 151b3a44c85SBarry Smith cnt = 0; 152b3a44c85SBarry Smith for (i=0; i<m; i++) { 153b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 154b3a44c85SBarry Smith if (!n) continue; 155b3a44c85SBarry Smith aa = a->a + ii[i]; 156b3a44c85SBarry Smith for (j=0; j<n; j++) { 157b3a44c85SBarry Smith if (aa[j] != 0.0) { 158b3a44c85SBarry Smith rows[cnt++] = i; 159b3a44c85SBarry Smith break; 160b3a44c85SBarry Smith } 161b3a44c85SBarry Smith } 162b3a44c85SBarry Smith } 163b3a44c85SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows);CHKERRQ(ierr); 164b3a44c85SBarry Smith PetscFunctionReturn(0); 165b3a44c85SBarry Smith } 166b3a44c85SBarry Smith 1677087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 
16879299369SBarry Smith { 16979299369SBarry Smith PetscErrorCode ierr; 17079299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 17199e65526SBarry Smith PetscInt i,m = Y->rmap->n; 17299e65526SBarry Smith const PetscInt *diag; 17354f21887SBarry Smith MatScalar *aa = aij->a; 17499e65526SBarry Smith const PetscScalar *v; 175ace3abfcSBarry Smith PetscBool missing; 176837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 177837a59e1SRichard Tran Mills PetscBool inserted = PETSC_FALSE; 178837a59e1SRichard Tran Mills #endif 17979299369SBarry Smith 18079299369SBarry Smith PetscFunctionBegin; 18109f38230SBarry Smith if (Y->assembled) { 1820298fd71SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(Y,&missing,NULL);CHKERRQ(ierr); 18309f38230SBarry Smith if (!missing) { 18479299369SBarry Smith diag = aij->diag; 18599e65526SBarry Smith ierr = VecGetArrayRead(D,&v);CHKERRQ(ierr); 18679299369SBarry Smith if (is == INSERT_VALUES) { 187837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 188837a59e1SRichard Tran Mills inserted = PETSC_TRUE; 189837a59e1SRichard Tran Mills #endif 19079299369SBarry Smith for (i=0; i<m; i++) { 19179299369SBarry Smith aa[diag[i]] = v[i]; 19279299369SBarry Smith } 19379299369SBarry Smith } else { 19479299369SBarry Smith for (i=0; i<m; i++) { 195837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 196837a59e1SRichard Tran Mills if (v[i] != 0.0) inserted = PETSC_TRUE; 197837a59e1SRichard Tran Mills #endif 19879299369SBarry Smith aa[diag[i]] += v[i]; 19979299369SBarry Smith } 20079299369SBarry Smith } 201837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 202837a59e1SRichard Tran Mills if (inserted) Y->offloadmask = PETSC_OFFLOAD_CPU; 203837a59e1SRichard Tran Mills #endif 20499e65526SBarry Smith ierr = VecRestoreArrayRead(D,&v);CHKERRQ(ierr); 20579299369SBarry Smith PetscFunctionReturn(0); 20679299369SBarry Smith 
} 207acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr); 20809f38230SBarry Smith } 20909f38230SBarry Smith ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr); 21009f38230SBarry Smith PetscFunctionReturn(0); 21109f38230SBarry Smith } 21279299369SBarry Smith 2131a83f524SJed Brown PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 21417ab2063SBarry Smith { 215416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 216dfbe8321SBarry Smith PetscErrorCode ierr; 21797f1f81fSBarry Smith PetscInt i,ishift; 21817ab2063SBarry Smith 2193a40ed3dSBarry Smith PetscFunctionBegin; 220d0f46423SBarry Smith *m = A->rmap->n; 2213a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 222bfeeae90SHong Zhang ishift = 0; 22353e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 2242462f5fdSStefano Zampini ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,ishift,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr); 225bfeeae90SHong Zhang } else if (oshift == 1) { 2261a83f524SJed Brown PetscInt *tia; 227d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2283b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 229854ce69bSBarry Smith ierr = PetscMalloc1(A->rmap->n+1,&tia);CHKERRQ(ierr); 2301a83f524SJed Brown for (i=0; i<A->rmap->n+1; i++) tia[i] = a->i[i] + 1; 2311a83f524SJed Brown *ia = tia; 232ecc77c7aSBarry Smith if (ja) { 2331a83f524SJed Brown PetscInt *tja; 234854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&tja);CHKERRQ(ierr); 2351a83f524SJed Brown for (i=0; i<nz; i++) tja[i] = a->j[i] + 1; 2361a83f524SJed Brown *ja = tja; 237ecc77c7aSBarry Smith } 2386945ee14SBarry Smith } else { 239ecc77c7aSBarry Smith *ia = a->i; 240ecc77c7aSBarry Smith if (ja) *ja = a->j; 241a2ce50c7SBarry Smith } 2423a40ed3dSBarry Smith PetscFunctionReturn(0); 243a2744918SBarry Smith } 244a2744918SBarry Smith 2451a83f524SJed Brown 
/*
   MatRestoreRowIJ_SeqAIJ - Releases what MatGetRowIJ_SeqAIJ() handed out.

   Arrays are freed only in the two cases where the getter allocates (symmetrized structure,
   or oshift == 1); otherwise the pointers refer to the matrix' own arrays and are left alone.
   Does nothing when ia is NULL.  n, inodecompressed and done are not used here.
*/
PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  if (!ia) PetscFunctionReturn(0);
  if ((symmetric && !A->structurally_symmetric) || oshift == 1) {
    ierr = PetscFree(*ia);CHKERRQ(ierr);
    if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);}
  }
  PetscFunctionReturn(0);
}

/*
   MatGetColumnIJ_SeqAIJ - Builds a column-oriented (compressed column) description of the
   nonzero structure of A.

   *nn always receives the local column count.  Nothing else happens when ia is NULL.
   With symmetric set, the arrays come from MatToSymmetricIJ_SeqAIJ().  Otherwise *ia gets
   n+1 column pointers starting at oshift and, if ja is not NULL, *ja gets for every column
   the rows (shifted by oshift) that have an entry in it.  ja may be NULL, matching
   MatGetRowIJ_SeqAIJ(); in that case only the column pointers are built.
   All returned arrays are allocated here; release them with MatRestoreColumnIJ_SeqAIJ().
*/
PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscErrorCode ierr;
  PetscInt       i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n;
  PetscInt       nz = a->i[m],row,*jj,mr,col;

  PetscFunctionBegin;
  *nn = n;
  if (!ia) PetscFunctionReturn(0);
  if (symmetric) {
    ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,0,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr);
  } else {
    ierr = PetscCalloc1(n,&collengths);CHKERRQ(ierr);
    ierr = PetscMalloc1(n+1,&cia);CHKERRQ(ierr);
    /* number of entries in every column */
    jj = a->j;
    for (i=0; i<nz; i++) {
      collengths[jj[i]]++;
    }
    /* running sum gives the start of every column */
    cia[0] = oshift;
    for (i=0; i<n; i++) {
      cia[i+1] = cia[i] + collengths[i];
    }
    if (ja) {
      ierr = PetscMalloc1(nz,&cja);CHKERRQ(ierr);
      /* collengths is reused as the per-column fill position */
      ierr = PetscArrayzero(collengths,n);CHKERRQ(ierr);
      jj   = a->j;
      for (row=0; row<m; row++) {
        mr = a->i[row+1] - a->i[row];
        for (i=0; i<mr; i++) {
          col = *jj++;

          cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
        }
      }
      *ja = cja;
    }
    ierr = PetscFree(collengths);CHKERRQ(ierr);
    *ia  = cia;
  }
  PetscFunctionReturn(0);
}

/*
   MatRestoreColumnIJ_SeqAIJ - Frees the arrays produced by MatGetColumnIJ_SeqAIJ().

   Does nothing when ia is NULL; *ja is freed only when ja was supplied.
   A, oshift, symmetric, inodecompressed, n and done are not used here.
*/
PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  if (!ia) PetscFunctionReturn(0);

  ierr = PetscFree(*ia);CHKERRQ(ierr);
  if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);}
  PetscFunctionReturn(0);
}

/*
 MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
 MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
 spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
*/
/*
   MatGetColumnIJ_SeqAIJ_Color - Column-oriented structure of A plus, for each entry, its
   position in the row-oriented storage.

   *nn always receives the local column count.  Nothing else happens when ia is NULL
   (in particular *spidx is then NOT assigned).  Otherwise three arrays are allocated:
   *ia (n+1 column pointers starting at oshift), *ja (row of every entry, shifted by oshift)
   and *spidx (offset of the same entry in a->j / a->a).  ja and spidx are written
   unconditionally and therefore must not be NULL.  symmetric, inodecompressed and done are
   not used here.
*/
PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscErrorCode ierr;
  PetscInt       i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n;
  PetscInt       nz = a->i[m],row,mr,col,tmp;
  PetscInt       *cspidx;
  const PetscInt *jj;

  PetscFunctionBegin;
  *nn = n;
  if (!ia) PetscFunctionReturn(0);

  ierr = PetscCalloc1(n,&collengths);CHKERRQ(ierr);
  ierr = PetscMalloc1(n+1,&cia);CHKERRQ(ierr);
  ierr = PetscMalloc1(nz,&cja);CHKERRQ(ierr);
  ierr = PetscMalloc1(nz,&cspidx);CHKERRQ(ierr);
  /* number of entries in every column */
  jj   = a->j;
  for (i=0; i<nz; i++) {
    collengths[jj[i]]++;
  }
  /* running sum gives the start of every column */
  cia[0] = oshift;
  for (i=0; i<n; i++) {
    cia[i+1] = cia[i] + collengths[i];
  }
  /* collengths is reused as the per-column fill position */
  ierr = PetscArrayzero(collengths,n);CHKERRQ(ierr);
  jj   = a->j;
  for (row=0; row<m; row++) {
    mr = a->i[row+1] - a->i[row];
    for (i=0; i<mr; i++) {
      col         = *jj++;
      tmp         = cia[col] + collengths[col]++ - oshift;
      cspidx[tmp] = a->i[row] + i; /* index of a->j */
      cja[tmp]    = row + oshift;
    }
  }
  ierr   = PetscFree(collengths);CHKERRQ(ierr);
  *ia    = cia;
  *ja    = cja;
  *spidx = cspidx;
  PetscFunctionReturn(0);
}
3577cee066cSHong Zhang 3587cee066cSHong Zhang PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3597cee066cSHong Zhang { 3607cee066cSHong Zhang PetscErrorCode ierr; 3617cee066cSHong Zhang 3627cee066cSHong Zhang PetscFunctionBegin; 3635243ef75SHong Zhang ierr = MatRestoreColumnIJ_SeqAIJ(A,oshift,symmetric,inodecompressed,n,ia,ja,done);CHKERRQ(ierr); 3647cee066cSHong Zhang ierr = PetscFree(*spidx);CHKERRQ(ierr); 3657cee066cSHong Zhang PetscFunctionReturn(0); 3667cee066cSHong Zhang } 3677cee066cSHong Zhang 36887d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 36987d4246cSBarry Smith { 37087d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 37187d4246cSBarry Smith PetscInt *ai = a->i; 37287d4246cSBarry Smith PetscErrorCode ierr; 37387d4246cSBarry Smith 37487d4246cSBarry Smith PetscFunctionBegin; 375580bdb30SBarry Smith ierr = PetscArraycpy(a->a+ai[row],v,ai[row+1]-ai[row]);CHKERRQ(ierr); 376e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 377c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && ai[row+1]-ai[row]) A->offloadmask = PETSC_OFFLOAD_CPU; 378e2cf4d64SStefano Zampini #endif 37987d4246cSBarry Smith PetscFunctionReturn(0); 38087d4246cSBarry Smith } 38187d4246cSBarry Smith 382bd04181cSBarry Smith /* 383bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 384bd04181cSBarry Smith 385bd04181cSBarry Smith - a single row of values is set with each call 386bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 387bd04181cSBarry Smith - the values are always added to the matrix, not set 388bd04181cSBarry Smith - no new locations are introduced in the nonzero 
structure of the matrix 389bd04181cSBarry Smith 3901f763a69SBarry Smith This does NOT assume the global column indices are sorted 391bd04181cSBarry Smith 3921f763a69SBarry Smith */ 393bd04181cSBarry Smith 394af0996ceSBarry Smith #include <petsc/private/isimpl.h> 395189e4007SBarry Smith PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 396189e4007SBarry Smith { 397189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3981f763a69SBarry Smith PetscInt low,high,t,row,nrow,i,col,l; 3991f763a69SBarry Smith const PetscInt *rp,*ai = a->i,*ailen = a->ilen,*aj = a->j; 4001f763a69SBarry Smith PetscInt lastcol = -1; 401189e4007SBarry Smith MatScalar *ap,value,*aa = a->a; 402189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices,*cidx = A->cmap->mapping->indices; 403189e4007SBarry Smith 404f38dd0b8SBarry Smith row = ridx[im[0]]; 4051f763a69SBarry Smith rp = aj + ai[row]; 4061f763a69SBarry Smith ap = aa + ai[row]; 4071f763a69SBarry Smith nrow = ailen[row]; 408189e4007SBarry Smith low = 0; 409189e4007SBarry Smith high = nrow; 410189e4007SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 411189e4007SBarry Smith col = cidx[in[l]]; 412f38dd0b8SBarry Smith value = v[l]; 413189e4007SBarry Smith 414189e4007SBarry Smith if (col <= lastcol) low = 0; 415189e4007SBarry Smith else high = nrow; 416189e4007SBarry Smith lastcol = col; 417189e4007SBarry Smith while (high-low > 5) { 418189e4007SBarry Smith t = (low+high)/2; 419189e4007SBarry Smith if (rp[t] > col) high = t; 420189e4007SBarry Smith else low = t; 421189e4007SBarry Smith } 422189e4007SBarry Smith for (i=low; i<high; i++) { 423189e4007SBarry Smith if (rp[i] == col) { 4241f763a69SBarry Smith ap[i] += value; 425189e4007SBarry Smith low = i + 1; 4261f763a69SBarry Smith break; 427189e4007SBarry Smith } 428189e4007SBarry Smith } 429189e4007SBarry Smith } 430e2cf4d64SStefano Zampini #if 
defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 431c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && m && n) A->offloadmask = PETSC_OFFLOAD_CPU; 432e2cf4d64SStefano Zampini #endif 433f38dd0b8SBarry Smith return 0; 434189e4007SBarry Smith } 435189e4007SBarry Smith 43697f1f81fSBarry Smith PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 43717ab2063SBarry Smith { 438416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 439e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 44097f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 4416849ba73SBarry Smith PetscErrorCode ierr; 442e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 443d8cdefa3SHong Zhang MatScalar *ap=NULL,value=0.0,*aa = a->a; 444ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 445ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 446e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 447e2cf4d64SStefano Zampini PetscBool inserted = PETSC_FALSE; 448e2cf4d64SStefano Zampini #endif 44917ab2063SBarry Smith 4503a40ed3dSBarry Smith PetscFunctionBegin; 45117ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 452416022c9SBarry Smith row = im[k]; 4535ef9f2a5SBarry Smith if (row < 0) continue; 454cf9c20a2SJed Brown if (PetscUnlikelyDebug(row >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 455720833daSHong Zhang rp = aj + ai[row]; 456876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 45717ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 458416022c9SBarry Smith low = 0; 459c71e6ed7SBarry Smith high = nrow; 46017ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 4615ef9f2a5SBarry Smith if (in[l] < 0) continue; 462cf9c20a2SJed Brown if 
(PetscUnlikelyDebug(in[l] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 463bfeeae90SHong Zhang col = in[l]; 464071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k*n] : v[k + l*m]; 465071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 46636db0b34SBarry Smith 4672205254eSKarl Rupp if (col <= lastcol) low = 0; 4682205254eSKarl Rupp else high = nrow; 469e2ee6c50SBarry Smith lastcol = col; 470416022c9SBarry Smith while (high-low > 5) { 471416022c9SBarry Smith t = (low+high)/2; 472416022c9SBarry Smith if (rp[t] > col) high = t; 473416022c9SBarry Smith else low = t; 47417ab2063SBarry Smith } 475416022c9SBarry Smith for (i=low; i<high; i++) { 47617ab2063SBarry Smith if (rp[i] > col) break; 47717ab2063SBarry Smith if (rp[i] == col) { 478876c6284SHong Zhang if (!A->structure_only) { 4790c0d7e18SFande Kong if (is == ADD_VALUES) { 4800c0d7e18SFande Kong ap[i] += value; 4810c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4820c0d7e18SFande Kong } 48317ab2063SBarry Smith else ap[i] = value; 484e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 485e2cf4d64SStefano Zampini inserted = PETSC_TRUE; 486e2cf4d64SStefano Zampini #endif 487720833daSHong Zhang } 488e44c0bd4SBarry Smith low = i + 1; 48917ab2063SBarry Smith goto noinsert; 49017ab2063SBarry Smith } 49117ab2063SBarry Smith } 492dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 493c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 494e32f2f54SBarry Smith if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix",row,col); 495720833daSHong Zhang if (A->structure_only) { 496876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A,A->rmap->n,1,nrow,row,col,rmax,ai,aj,rp,imax,nonew,MatScalar); 497720833daSHong Zhang 
} else { 498fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 499720833daSHong Zhang } 500c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 501416022c9SBarry Smith /* shift up all the later entries in this row */ 502580bdb30SBarry Smith ierr = PetscArraymove(rp+i+1,rp+i,N-i+1);CHKERRQ(ierr); 50317ab2063SBarry Smith rp[i] = col; 504580bdb30SBarry Smith if (!A->structure_only){ 505580bdb30SBarry Smith ierr = PetscArraymove(ap+i+1,ap+i,N-i+1);CHKERRQ(ierr); 506580bdb30SBarry Smith ap[i] = value; 507580bdb30SBarry Smith } 508416022c9SBarry Smith low = i + 1; 509e56f5c9eSBarry Smith A->nonzerostate++; 510e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 511e2cf4d64SStefano Zampini inserted = PETSC_TRUE; 512e2cf4d64SStefano Zampini #endif 513e44c0bd4SBarry Smith noinsert:; 51417ab2063SBarry Smith } 51517ab2063SBarry Smith ailen[row] = nrow; 51617ab2063SBarry Smith } 517e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 518c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && inserted) A->offloadmask = PETSC_OFFLOAD_CPU; 519e2cf4d64SStefano Zampini #endif 5203a40ed3dSBarry Smith PetscFunctionReturn(0); 52117ab2063SBarry Smith } 52217ab2063SBarry Smith 523071fcb05SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 524071fcb05SBarry Smith { 525071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 526071fcb05SBarry Smith PetscInt *rp,k,row; 527071fcb05SBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 528071fcb05SBarry Smith PetscErrorCode ierr; 529071fcb05SBarry Smith PetscInt *aj = a->j; 530071fcb05SBarry Smith MatScalar *aa = a->a,*ap; 531071fcb05SBarry Smith 532071fcb05SBarry Smith PetscFunctionBegin; 533071fcb05SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 534071fcb05SBarry Smith 
row = im[k]; 535071fcb05SBarry Smith rp = aj + ai[row]; 536071fcb05SBarry Smith ap = aa + ai[row]; 537071fcb05SBarry Smith if (!A->was_assembled) { 538071fcb05SBarry Smith ierr = PetscMemcpy(rp,in,n*sizeof(PetscInt));CHKERRQ(ierr); 539071fcb05SBarry Smith } 540071fcb05SBarry Smith if (!A->structure_only) { 541071fcb05SBarry Smith if (v) { 542071fcb05SBarry Smith ierr = PetscMemcpy(ap,v,n*sizeof(PetscScalar));CHKERRQ(ierr); 543071fcb05SBarry Smith v += n; 544071fcb05SBarry Smith } else { 545071fcb05SBarry Smith ierr = PetscMemzero(ap,n*sizeof(PetscScalar));CHKERRQ(ierr); 546071fcb05SBarry Smith } 547071fcb05SBarry Smith } 548071fcb05SBarry Smith ailen[row] = n; 549071fcb05SBarry Smith a->nz += n; 550071fcb05SBarry Smith } 551e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 552c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && m && n) A->offloadmask = PETSC_OFFLOAD_CPU; 553e2cf4d64SStefano Zampini #endif 554071fcb05SBarry Smith PetscFunctionReturn(0); 555071fcb05SBarry Smith } 556071fcb05SBarry Smith 55781824310SBarry Smith 558a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 5597eb43aa7SLois Curfman McInnes { 5607eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 56197f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 56297f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 56354f21887SBarry Smith MatScalar *ap,*aa = a->a; 5647eb43aa7SLois Curfman McInnes 5653a40ed3dSBarry Smith PetscFunctionBegin; 5667eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 5677eb43aa7SLois Curfman McInnes row = im[k]; 568e32f2f54SBarry Smith if (row < 0) {v += n; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); */ 569e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max 
%D",row,A->rmap->n-1); 570bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 5717eb43aa7SLois Curfman McInnes nrow = ailen[row]; 5727eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 573e32f2f54SBarry Smith if (in[l] < 0) {v++; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); */ 574e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 575bfeeae90SHong Zhang col = in[l]; 5767eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 5777eb43aa7SLois Curfman McInnes while (high-low > 5) { 5787eb43aa7SLois Curfman McInnes t = (low+high)/2; 5797eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 5807eb43aa7SLois Curfman McInnes else low = t; 5817eb43aa7SLois Curfman McInnes } 5827eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 5837eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 5847eb43aa7SLois Curfman McInnes if (rp[i] == col) { 585b49de8d1SLois Curfman McInnes *v++ = ap[i]; 5867eb43aa7SLois Curfman McInnes goto finished; 5877eb43aa7SLois Curfman McInnes } 5887eb43aa7SLois Curfman McInnes } 58997e567efSBarry Smith *v++ = 0.0; 5907eb43aa7SLois Curfman McInnes finished:; 5917eb43aa7SLois Curfman McInnes } 5927eb43aa7SLois Curfman McInnes } 5933a40ed3dSBarry Smith PetscFunctionReturn(0); 5947eb43aa7SLois Curfman McInnes } 5957eb43aa7SLois Curfman McInnes 5963ea6fe3dSLisandro Dalcin PetscErrorCode MatView_SeqAIJ_Binary(Mat mat,PetscViewer viewer) 59717ab2063SBarry Smith { 5983ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ*)mat->data; 5993ea6fe3dSLisandro Dalcin PetscInt header[4],M,N,m,nz,i; 6003ea6fe3dSLisandro Dalcin PetscInt *rowlens; 6016849ba73SBarry Smith PetscErrorCode ierr; 60217ab2063SBarry Smith 6033a40ed3dSBarry Smith PetscFunctionBegin; 6043ea6fe3dSLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 6052205254eSKarl Rupp 6063ea6fe3dSLisandro 
Dalcin M = mat->rmap->N; 6073ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6083ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6093ea6fe3dSLisandro Dalcin nz = A->nz; 610416022c9SBarry Smith 6113ea6fe3dSLisandro Dalcin /* write matrix header */ 6123ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6133ea6fe3dSLisandro Dalcin header[1] = M; header[2] = N; header[3] = nz; 6143ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryWrite(viewer,header,4,PETSC_INT);CHKERRQ(ierr); 615416022c9SBarry Smith 6163ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6173ea6fe3dSLisandro Dalcin ierr = PetscMalloc1(m,&rowlens);CHKERRQ(ierr); 6183ea6fe3dSLisandro Dalcin for (i=0; i<m; i++) rowlens[i] = A->i[i+1] - A->i[i]; 6193ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryWrite(viewer,rowlens,m,PETSC_INT);CHKERRQ(ierr); 6203ea6fe3dSLisandro Dalcin ierr = PetscFree(rowlens);CHKERRQ(ierr); 6213ea6fe3dSLisandro Dalcin /* store column indices */ 6223ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryWrite(viewer,A->j,nz,PETSC_INT);CHKERRQ(ierr); 623416022c9SBarry Smith /* store nonzero values */ 6243ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryWrite(viewer,A->a,nz,PETSC_SCALAR);CHKERRQ(ierr); 625b37d52dbSMark F. 
Adams 6263ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6273ea6fe3dSLisandro Dalcin ierr = MatView_Binary_BlockSizes(mat,viewer);CHKERRQ(ierr); 6283a40ed3dSBarry Smith PetscFunctionReturn(0); 62917ab2063SBarry Smith } 630416022c9SBarry Smith 6317dc0baabSHong Zhang static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer) 6327dc0baabSHong Zhang { 6337dc0baabSHong Zhang PetscErrorCode ierr; 6347dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 6357dc0baabSHong Zhang PetscInt i,k,m=A->rmap->N; 6367dc0baabSHong Zhang 6377dc0baabSHong Zhang PetscFunctionBegin; 6387dc0baabSHong Zhang ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 6397dc0baabSHong Zhang for (i=0; i<m; i++) { 6407dc0baabSHong Zhang ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 6417dc0baabSHong Zhang for (k=a->i[i]; k<a->i[i+1]; k++) { 6427dc0baabSHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D) ",a->j[k]);CHKERRQ(ierr); 6437dc0baabSHong Zhang } 6447dc0baabSHong Zhang ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 6457dc0baabSHong Zhang } 6467dc0baabSHong Zhang ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 6477dc0baabSHong Zhang PetscFunctionReturn(0); 6487dc0baabSHong Zhang } 6497dc0baabSHong Zhang 65009573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 651cd155464SBarry Smith 652dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 653416022c9SBarry Smith { 654416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 655dfbe8321SBarry Smith PetscErrorCode ierr; 65660e0710aSBarry Smith PetscInt i,j,m = A->rmap->n; 657e060cb09SBarry Smith const char *name; 658f3ef73ceSBarry Smith PetscViewerFormat format; 65917ab2063SBarry Smith 6603a40ed3dSBarry Smith PetscFunctionBegin; 6617dc0baabSHong Zhang if (A->structure_only) { 6627dc0baabSHong Zhang ierr = MatView_SeqAIJ_ASCII_structonly(A,viewer);CHKERRQ(ierr); 
6637dc0baabSHong Zhang PetscFunctionReturn(0); 6647dc0baabSHong Zhang } 66543e49210SHong Zhang 666b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 66771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 66897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 66960e0710aSBarry Smith if (m && ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-1))) { 670c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. */ 671d00d2cf4SBarry Smith nofinalvalue = 1; 672d00d2cf4SBarry Smith } 673d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 674d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",m,A->cmap->n);CHKERRQ(ierr); 67577431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %D \n",a->nz);CHKERRQ(ierr); 676fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 677fbfe6fa7SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,4);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 678fbfe6fa7SJed Brown #else 67977431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,3);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 680fbfe6fa7SJed Brown #endif 681b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = [\n");CHKERRQ(ierr); 68217ab2063SBarry Smith 68317ab2063SBarry Smith for (i=0; i<m; i++) { 68460e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 685aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 686a9bf72d8SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e %18.16e\n",i+1,a->j[j]+1,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 68717ab2063SBarry Smith #else 68860e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",i+1,a->j[j]+1,(double)a->a[j]);CHKERRQ(ierr); 68917ab2063SBarry Smith #endif 69017ab2063SBarry Smith } 69117ab2063SBarry Smith } 692d00d2cf4SBarry Smith if (nofinalvalue) { 693c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX) 
694c337ccceSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e %18.16e\n",m,A->cmap->n,0.,0.);CHKERRQ(ierr); 695c337ccceSJed Brown #else 696d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",m,A->cmap->n,0.0);CHKERRQ(ierr); 697c337ccceSJed Brown #endif 698d00d2cf4SBarry Smith } 699317d6ea6SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 700fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name);CHKERRQ(ierr); 701d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 7022950ac48SStefano Zampini } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 703cd155464SBarry Smith PetscFunctionReturn(0); 704fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 705d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 70644cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 70777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 70860e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 709aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 71036db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 71160e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 71236db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 71360e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 71436db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 71560e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 
7166831982aSBarry Smith } 71744cd7ae7SLois Curfman McInnes #else 71860e0710aSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr);} 71944cd7ae7SLois Curfman McInnes #endif 72044cd7ae7SLois Curfman McInnes } 721b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 72244cd7ae7SLois Curfman McInnes } 723d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 724fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 72597f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 726d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 727854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&sptr);CHKERRQ(ierr); 728496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 729496be53dSLois Curfman McInnes sptr[i] = nzd+1; 73060e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 731496be53dSLois Curfman McInnes if (a->j[j] >= i) { 732aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 73336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 734496be53dSLois Curfman McInnes #else 735496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 736496be53dSLois Curfman McInnes #endif 737496be53dSLois Curfman McInnes } 738496be53dSLois Curfman McInnes } 739496be53dSLois Curfman McInnes } 7402e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 74177431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %D %D\n\n",m,nzd);CHKERRQ(ierr); 7422e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 7432205254eSKarl Rupp if (i+4<m) { 7442205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5]);CHKERRQ(ierr); 7452205254eSKarl Rupp } else if (i+3<m) { 7462205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4]);CHKERRQ(ierr); 7472205254eSKarl Rupp } 
else if (i+2<m) { 7482205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3]);CHKERRQ(ierr); 7492205254eSKarl Rupp } else if (i+1<m) { 7502205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2]);CHKERRQ(ierr); 7512205254eSKarl Rupp } else if (i<m) { 7522205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D\n",sptr[i],sptr[i+1]);CHKERRQ(ierr); 7532205254eSKarl Rupp } else { 7542205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D\n",sptr[i]);CHKERRQ(ierr); 7552205254eSKarl Rupp } 756496be53dSLois Curfman McInnes } 757b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 758606d414cSSatish Balay ierr = PetscFree(sptr);CHKERRQ(ierr); 759496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 76060e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 76177431f27SBarry Smith if (a->j[j] >= i) {ierr = PetscViewerASCIIPrintf(viewer," %D ",a->j[j]+fshift);CHKERRQ(ierr);} 762496be53dSLois Curfman McInnes } 763b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 764496be53dSLois Curfman McInnes } 765b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 766496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 76760e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 768496be53dSLois Curfman McInnes if (a->j[j] >= i) { 769aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 77036db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 77160e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 7726831982aSBarry Smith } 773496be53dSLois Curfman McInnes #else 77460e0710aSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," %18.16e ",(double)a->a[j]);CHKERRQ(ierr);} 775496be53dSLois Curfman McInnes #endif 776496be53dSLois Curfman McInnes } 
777496be53dSLois Curfman McInnes } 778b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 779496be53dSLois Curfman McInnes } 780d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 781fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 78297f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 78387828ca2SBarry Smith PetscScalar value; 78468f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 78568f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 78668f1ed48SBarry Smith 78768f1ed48SBarry Smith for (i=0; i<a->i[m]; i++) { 78868f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 78968f1ed48SBarry Smith realonly = PETSC_FALSE; 79068f1ed48SBarry Smith break; 79168f1ed48SBarry Smith } 79268f1ed48SBarry Smith } 79368f1ed48SBarry Smith #endif 79402594712SBarry Smith 795d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 79602594712SBarry Smith for (i=0; i<m; i++) { 79702594712SBarry Smith jcnt = 0; 798d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 799e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 80002594712SBarry Smith value = a->a[cnt++]; 801e24b481bSBarry Smith jcnt++; 80202594712SBarry Smith } else { 80302594712SBarry Smith value = 0.0; 80402594712SBarry Smith } 805aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 80668f1ed48SBarry Smith if (realonly) { 80760e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)PetscRealPart(value));CHKERRQ(ierr); 80868f1ed48SBarry Smith } else { 80960e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",(double)PetscRealPart(value),(double)PetscImaginaryPart(value));CHKERRQ(ierr); 81068f1ed48SBarry Smith } 81102594712SBarry Smith #else 81260e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)value);CHKERRQ(ierr); 81302594712SBarry Smith #endif 81402594712SBarry Smith } 815b0a32e0cSBarry Smith ierr = 
PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 81602594712SBarry Smith } 817d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 8183c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 819150b93efSMatthew G. Knepley PetscInt fshift=1; 820d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 8213c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 82219303e72SJonathan Guyer ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate complex general\n");CHKERRQ(ierr); 8233c215bfdSMatthew Knepley #else 82419303e72SJonathan Guyer ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate real general\n");CHKERRQ(ierr); 8253c215bfdSMatthew Knepley #endif 826d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %D\n", m, A->cmap->n, a->nz);CHKERRQ(ierr); 8273c215bfdSMatthew Knepley for (i=0; i<m; i++) { 82860e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 8293c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 830a9a0e077SKarl Rupp ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g %g\n", i+fshift,a->j[j]+fshift,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 8313c215bfdSMatthew Knepley #else 832150b93efSMatthew G. 
Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g\n", i+fshift, a->j[j]+fshift, (double)a->a[j]);CHKERRQ(ierr); 8333c215bfdSMatthew Knepley #endif 8343c215bfdSMatthew Knepley } 8353c215bfdSMatthew Knepley } 836d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 8373a40ed3dSBarry Smith } else { 838d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 839d5f3da31SBarry Smith if (A->factortype) { 84016cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 84116cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 84216cd7e1dSShri Abhyankar /* L part */ 84360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 84416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 84516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 84660e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 84716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8486712e2f1SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr); 84916cd7e1dSShri Abhyankar } else { 85060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 85116cd7e1dSShri Abhyankar } 85216cd7e1dSShri Abhyankar #else 85360e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 85416cd7e1dSShri Abhyankar #endif 85516cd7e1dSShri Abhyankar } 85616cd7e1dSShri Abhyankar /* diagonal */ 85716cd7e1dSShri Abhyankar j = a->diag[i]; 85816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 85916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 86060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g 
i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 86116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8626712e2f1SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)(-PetscImaginaryPart(1.0/a->a[j])));CHKERRQ(ierr); 86316cd7e1dSShri Abhyankar } else { 86460e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(1.0/a->a[j]));CHKERRQ(ierr); 86516cd7e1dSShri Abhyankar } 86616cd7e1dSShri Abhyankar #else 86760e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)(1.0/a->a[j]));CHKERRQ(ierr); 86816cd7e1dSShri Abhyankar #endif 86916cd7e1dSShri Abhyankar 87016cd7e1dSShri Abhyankar /* U part */ 87160e0710aSBarry Smith for (j=a->diag[i+1]+1; j<a->diag[i]; j++) { 87216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 87316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 87460e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 87516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 87622ab088eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr); 87716cd7e1dSShri Abhyankar } else { 87860e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 87916cd7e1dSShri Abhyankar } 88016cd7e1dSShri Abhyankar #else 88160e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 88216cd7e1dSShri Abhyankar #endif 88316cd7e1dSShri Abhyankar } 88416cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 88516cd7e1dSShri Abhyankar } 88616cd7e1dSShri Abhyankar } else { 88717ab2063SBarry 
Smith for (i=0; i<m; i++) { 88877431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 88960e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 890aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 89136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 89260e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 89336db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 89460e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 8953a40ed3dSBarry Smith } else { 89660e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 89717ab2063SBarry Smith } 89817ab2063SBarry Smith #else 89960e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 90017ab2063SBarry Smith #endif 90117ab2063SBarry Smith } 902b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 90317ab2063SBarry Smith } 90416cd7e1dSShri Abhyankar } 905d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 90617ab2063SBarry Smith } 907b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 9083a40ed3dSBarry Smith PetscFunctionReturn(0); 909416022c9SBarry Smith } 910416022c9SBarry Smith 9119804daf3SBarry Smith #include <petscdraw.h> 912dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 913416022c9SBarry Smith { 914480ef9eaSBarry Smith Mat A = (Mat) Aa; 915416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 916dfbe8321SBarry Smith PetscErrorCode ierr; 917383922c3SLisandro Dalcin PetscInt i,j,m = A->rmap->n; 918383922c3SLisandro Dalcin int color; 919b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 
920b0a32e0cSBarry Smith PetscViewer viewer; 921f3ef73ceSBarry Smith PetscViewerFormat format; 922cddf8d76SBarry Smith 9233a40ed3dSBarry Smith PetscFunctionBegin; 924480ef9eaSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 925b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 926b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 927383922c3SLisandro Dalcin 928416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9290513a670SBarry Smith 930fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 931383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 9320513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 933b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 934416022c9SBarry Smith for (i=0; i<m; i++) { 935cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 936bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 937bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 93836db0b34SBarry Smith if (PetscRealPart(a->a[j]) >= 0.) continue; 939b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 940cddf8d76SBarry Smith } 941cddf8d76SBarry Smith } 942b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 943cddf8d76SBarry Smith for (i=0; i<m; i++) { 944cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 945bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 946bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 947cddf8d76SBarry Smith if (a->a[j] != 0.) 
continue; 948b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 949cddf8d76SBarry Smith } 950cddf8d76SBarry Smith } 951b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 952cddf8d76SBarry Smith for (i=0; i<m; i++) { 953cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 954bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 955bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 95636db0b34SBarry Smith if (PetscRealPart(a->a[j]) <= 0.) continue; 957b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 958416022c9SBarry Smith } 959416022c9SBarry Smith } 960383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 9610513a670SBarry Smith } else { 9620513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 9630513a670SBarry Smith /* first determine max of all nonzero values */ 964b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 965383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 966b0a32e0cSBarry Smith PetscDraw popup; 9670513a670SBarry Smith 9680513a670SBarry Smith for (i=0; i<nz; i++) { 9690513a670SBarry Smith if (PetscAbsScalar(a->a[i]) > maxv) maxv = PetscAbsScalar(a->a[i]); 9700513a670SBarry Smith } 971383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 972b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 97345f3bb6eSLisandro Dalcin ierr = PetscDrawScalePopup(popup,minv,maxv);CHKERRQ(ierr); 974383922c3SLisandro Dalcin 975383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 9760513a670SBarry Smith for (i=0; i<m; i++) { 977383922c3SLisandro Dalcin y_l = m - i - 1.0; 978383922c3SLisandro Dalcin y_r = y_l + 1.0; 979bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 980383922c3SLisandro Dalcin x_l = a->j[j]; 981383922c3SLisandro Dalcin x_r = x_l + 1.0; 982b05fc000SLisandro Dalcin color = 
PetscDrawRealToColor(PetscAbsScalar(a->a[count]),minv,maxv); 983b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 9840513a670SBarry Smith count++; 9850513a670SBarry Smith } 9860513a670SBarry Smith } 987383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 9880513a670SBarry Smith } 989480ef9eaSBarry Smith PetscFunctionReturn(0); 990480ef9eaSBarry Smith } 991cddf8d76SBarry Smith 9929804daf3SBarry Smith #include <petscdraw.h> 993dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 994480ef9eaSBarry Smith { 995dfbe8321SBarry Smith PetscErrorCode ierr; 996b0a32e0cSBarry Smith PetscDraw draw; 99736db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 998ace3abfcSBarry Smith PetscBool isnull; 999480ef9eaSBarry Smith 1000480ef9eaSBarry Smith PetscFunctionBegin; 1001b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 1002b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 1003480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1004480ef9eaSBarry Smith 1005d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1006480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 1007b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 1008832b7cebSLisandro Dalcin ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 1009b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A);CHKERRQ(ierr); 10100298fd71SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr); 1011832b7cebSLisandro Dalcin ierr = PetscDrawSave(draw);CHKERRQ(ierr); 10123a40ed3dSBarry Smith PetscFunctionReturn(0); 1013416022c9SBarry Smith } 1014416022c9SBarry Smith 1015dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 1016416022c9SBarry Smith { 1017dfbe8321SBarry Smith PetscErrorCode ierr; 
1018ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1019416022c9SBarry Smith 10203a40ed3dSBarry Smith PetscFunctionBegin; 1021251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 1022251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1023251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 1024c45a1595SBarry Smith if (iascii) { 10253a40ed3dSBarry Smith ierr = MatView_SeqAIJ_ASCII(A,viewer);CHKERRQ(ierr); 10260f5bd95cSBarry Smith } else if (isbinary) { 10273a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Binary(A,viewer);CHKERRQ(ierr); 10280f5bd95cSBarry Smith } else if (isdraw) { 10293a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Draw(A,viewer);CHKERRQ(ierr); 103011aeaf0aSBarry Smith } 10314108e4d5SBarry Smith ierr = MatView_SeqAIJ_Inode(A,viewer);CHKERRQ(ierr); 10323a40ed3dSBarry Smith PetscFunctionReturn(0); 103317ab2063SBarry Smith } 103419bcc07fSBarry Smith 1035dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode) 103617ab2063SBarry Smith { 1037416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 10386849ba73SBarry Smith PetscErrorCode ierr; 1039580bdb30SBarry Smith PetscInt fshift = 0,i,*ai = a->i,*aj = a->j,*imax = a->imax; 1040d0f46423SBarry Smith PetscInt m = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0; 104154f21887SBarry Smith MatScalar *aa = a->a,*ap; 10423447b6efSHong Zhang PetscReal ratio = 0.6; 104317ab2063SBarry Smith 10443a40ed3dSBarry Smith PetscFunctionBegin; 10453a40ed3dSBarry Smith if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 1046071fcb05SBarry Smith ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 1047071fcb05SBarry Smith if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) PetscFunctionReturn(0); 104817ab2063SBarry Smith 104943ee02c3SBarry Smith if (m) rmax = ailen[0]; /* determine row with most 
nonzeros */ 105017ab2063SBarry Smith for (i=1; i<m; i++) { 1051416022c9SBarry Smith /* move each row back by the amount of empty slots (fshift) before it*/ 105217ab2063SBarry Smith fshift += imax[i-1] - ailen[i-1]; 105394a9d846SBarry Smith rmax = PetscMax(rmax,ailen[i]); 105417ab2063SBarry Smith if (fshift) { 1055bfeeae90SHong Zhang ip = aj + ai[i]; 1056bfeeae90SHong Zhang ap = aa + ai[i]; 105717ab2063SBarry Smith N = ailen[i]; 1058580bdb30SBarry Smith ierr = PetscArraymove(ip-fshift,ip,N);CHKERRQ(ierr); 1059580bdb30SBarry Smith if (!A->structure_only) { 1060580bdb30SBarry Smith ierr = PetscArraymove(ap-fshift,ap,N);CHKERRQ(ierr); 106117ab2063SBarry Smith } 106217ab2063SBarry Smith } 106317ab2063SBarry Smith ai[i] = ai[i-1] + ailen[i-1]; 106417ab2063SBarry Smith } 106517ab2063SBarry Smith if (m) { 106617ab2063SBarry Smith fshift += imax[m-1] - ailen[m-1]; 106717ab2063SBarry Smith ai[m] = ai[m-1] + ailen[m-1]; 106817ab2063SBarry Smith } 10697b083b7cSBarry Smith 107017ab2063SBarry Smith /* reset ilen and imax for each row */ 10717b083b7cSBarry Smith a->nonzerorowcnt = 0; 1072396832f4SHong Zhang if (A->structure_only) { 1073071fcb05SBarry Smith ierr = PetscFree(a->imax);CHKERRQ(ierr); 1074071fcb05SBarry Smith ierr = PetscFree(a->ilen);CHKERRQ(ierr); 1075396832f4SHong Zhang } else { /* !A->structure_only */ 107617ab2063SBarry Smith for (i=0; i<m; i++) { 107717ab2063SBarry Smith ailen[i] = imax[i] = ai[i+1] - ai[i]; 10787b083b7cSBarry Smith a->nonzerorowcnt += ((ai[i+1] - ai[i]) > 0); 107917ab2063SBarry Smith } 1080396832f4SHong Zhang } 1081bfeeae90SHong Zhang a->nz = ai[m]; 108265e19b50SBarry Smith if (fshift && a->nounused == -1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %D X %D, %D unneeded", m, A->cmap->n, fshift); 108317ab2063SBarry Smith 108409f38230SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 1085d0f46423SBarry Smith ierr = PetscInfo4(A,"Matrix size: %D X %D; storage space: %D unneeded,%D 
used\n",m,A->cmap->n,fshift,a->nz);CHKERRQ(ierr); 1086ae15b995SBarry Smith ierr = PetscInfo1(A,"Number of mallocs during MatSetValues() is %D\n",a->reallocs);CHKERRQ(ierr); 1087ae15b995SBarry Smith ierr = PetscInfo1(A,"Maximum nonzeros in any row is %D\n",rmax);CHKERRQ(ierr); 10882205254eSKarl Rupp 10898e58a170SBarry Smith A->info.mallocs += a->reallocs; 1090dd5f02e7SSatish Balay a->reallocs = 0; 10916712e2f1SBarry Smith A->info.nz_unneeded = (PetscReal)fshift; 109236db0b34SBarry Smith a->rmax = rmax; 10934e220ebcSLois Curfman McInnes 1094396832f4SHong Zhang if (!A->structure_only) { 109511e456e1SBarry Smith ierr = MatCheckCompressedRow(A,a->nonzerorowcnt,&a->compressedrow,a->i,m,ratio);CHKERRQ(ierr); 1096396832f4SHong Zhang } 10974108e4d5SBarry Smith ierr = MatAssemblyEnd_SeqAIJ_Inode(A,mode);CHKERRQ(ierr); 10983a40ed3dSBarry Smith PetscFunctionReturn(0); 109917ab2063SBarry Smith } 110017ab2063SBarry Smith 110199cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A) 110299cafbc1SBarry Smith { 110399cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 110499cafbc1SBarry Smith PetscInt i,nz = a->nz; 110554f21887SBarry Smith MatScalar *aa = a->a; 1106acf2f550SJed Brown PetscErrorCode ierr; 110799cafbc1SBarry Smith 110899cafbc1SBarry Smith PetscFunctionBegin; 110999cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 1110acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 1111e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 1112c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU; 1113e2cf4d64SStefano Zampini #endif 111499cafbc1SBarry Smith PetscFunctionReturn(0); 111599cafbc1SBarry Smith } 111699cafbc1SBarry Smith 111799cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A) 111899cafbc1SBarry Smith { 111999cafbc1SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 112099cafbc1SBarry Smith PetscInt i,nz = a->nz; 
112154f21887SBarry Smith MatScalar *aa = a->a; 1122acf2f550SJed Brown PetscErrorCode ierr; 112399cafbc1SBarry Smith 112499cafbc1SBarry Smith PetscFunctionBegin; 112599cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 1126acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 1127e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 1128c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU; 1129e2cf4d64SStefano Zampini #endif 113099cafbc1SBarry Smith PetscFunctionReturn(0); 113199cafbc1SBarry Smith } 113299cafbc1SBarry Smith 1133dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A) 113417ab2063SBarry Smith { 1135416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1136dfbe8321SBarry Smith PetscErrorCode ierr; 11373a40ed3dSBarry Smith 11383a40ed3dSBarry Smith PetscFunctionBegin; 1139580bdb30SBarry Smith ierr = PetscArrayzero(a->a,a->i[A->rmap->n]);CHKERRQ(ierr); 1140acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 1141e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 1142c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU; 1143e2cf4d64SStefano Zampini #endif 11443a40ed3dSBarry Smith PetscFunctionReturn(0); 114517ab2063SBarry Smith } 1146416022c9SBarry Smith 1147dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 114817ab2063SBarry Smith { 1149416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1150dfbe8321SBarry Smith PetscErrorCode ierr; 1151d5d45c9bSBarry Smith 11523a40ed3dSBarry Smith PetscFunctionBegin; 1153aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1154d0f46423SBarry Smith PetscLogObjectState((PetscObject)A,"Rows=%D, Cols=%D, NZ=%D",A->rmap->n,A->cmap->n,a->nz); 115517ab2063SBarry Smith #endif 1156e6b907acSBarry Smith ierr = MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i);CHKERRQ(ierr); 
11576bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 11586bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 115905b42c5fSBarry Smith ierr = PetscFree(a->diag);CHKERRQ(ierr); 1160d48dcb14SBarry Smith ierr = PetscFree(a->ibdiag);CHKERRQ(ierr); 1161071fcb05SBarry Smith ierr = PetscFree(a->imax);CHKERRQ(ierr); 1162071fcb05SBarry Smith ierr = PetscFree(a->ilen);CHKERRQ(ierr); 1163846b4da1SFande Kong ierr = PetscFree(a->ipre);CHKERRQ(ierr); 116471f1c65dSBarry Smith ierr = PetscFree3(a->idiag,a->mdiag,a->ssor_work);CHKERRQ(ierr); 116505b42c5fSBarry Smith ierr = PetscFree(a->solve_work);CHKERRQ(ierr); 11666bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 116705b42c5fSBarry Smith ierr = PetscFree(a->saved_values);CHKERRQ(ierr); 11686bf464f9SBarry Smith ierr = ISColoringDestroy(&a->coloring);CHKERRQ(ierr); 1169cd6b891eSBarry Smith ierr = PetscFree2(a->compressedrow.i,a->compressedrow.rindex);CHKERRQ(ierr); 11700b7e3e3dSHong Zhang ierr = PetscFree(a->matmult_abdense);CHKERRQ(ierr); 1171a30b2313SHong Zhang 11724108e4d5SBarry Smith ierr = MatDestroy_SeqAIJ_Inode(A);CHKERRQ(ierr); 1173bf0cc555SLisandro Dalcin ierr = PetscFree(A->data);CHKERRQ(ierr); 1174901853e0SKris Buschelman 1175dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)A,0);CHKERRQ(ierr); 1176bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetColumnIndices_C",NULL);CHKERRQ(ierr); 1177bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL);CHKERRQ(ierr); 1178bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL);CHKERRQ(ierr); 1179bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsbaij_C",NULL);CHKERRQ(ierr); 1180bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqbaij_C",NULL);CHKERRQ(ierr); 1181bdf89e91SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijperm_C",NULL);CHKERRQ(ierr); 11824222ddf1SHong Zhang 11834222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 11844222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcusparse_C",NULL);CHKERRQ(ierr); 11854222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatSetFromOptions_seqaijcusparse_seqaij_C",NULL);CHKERRQ(ierr); 11864222ddf1SHong Zhang #endif 11874222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcrl_C",NULL);CHKERRQ(ierr); 1188af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 1189af8000cdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_elemental_C",NULL);CHKERRQ(ierr); 1190af8000cdSHong Zhang #endif 119163c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 119263c07aadSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_hypre_C",NULL);CHKERRQ(ierr); 11934222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",NULL);CHKERRQ(ierr); 119463c07aadSStefano Zampini #endif 1195b49cda9fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 1196c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsell_C",NULL);CHKERRQ(ierr); 1197c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_is_C",NULL);CHKERRQ(ierr); 1198bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatIsTranspose_C",NULL);CHKERRQ(ierr); 1199bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",NULL);CHKERRQ(ierr); 1200846b4da1SFande Kong ierr = PetscObjectComposeFunction((PetscObject)A,"MatResetPreallocation_C",NULL);CHKERRQ(ierr); 1201bdf89e91SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C",NULL);CHKERRQ(ierr); 1202bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatReorderForNonzeroDiagonal_C",NULL);CHKERRQ(ierr); 12034222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_is_seqaij_C",NULL);CHKERRQ(ierr); 12044222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqdense_seqaij_C",NULL);CHKERRQ(ierr); 12054222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaij_C",NULL);CHKERRQ(ierr); 12063a40ed3dSBarry Smith PetscFunctionReturn(0); 120717ab2063SBarry Smith } 120817ab2063SBarry Smith 1209ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 121017ab2063SBarry Smith { 1211416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12124846f1f5SKris Buschelman PetscErrorCode ierr; 12133a40ed3dSBarry Smith 12143a40ed3dSBarry Smith PetscFunctionBegin; 1215a65d3064SKris Buschelman switch (op) { 1216a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 12174e0d8c25SBarry Smith a->roworiented = flg; 1218a65d3064SKris Buschelman break; 1219a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 1220a9817697SBarry Smith a->keepnonzeropattern = flg; 1221a65d3064SKris Buschelman break; 1222512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1223512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 1224a65d3064SKris Buschelman break; 1225a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 12264e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 1227a65d3064SKris Buschelman break; 1228a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 12294e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 1230a65d3064SKris Buschelman break; 123128b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 123228b2fa4aSMatthew Knepley a->nounused = (flg ? 
-1 : 0); 123328b2fa4aSMatthew Knepley break; 1234a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 12354e0d8c25SBarry Smith a->ignorezeroentries = flg; 12360df259c2SBarry Smith break; 12373d472b54SHong Zhang case MAT_SPD: 1238b1646e73SJed Brown case MAT_SYMMETRIC: 1239b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1240b1646e73SJed Brown case MAT_HERMITIAN: 1241b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1242957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 12435021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 12445021d80fSJed Brown break; 12454e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 1246a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1247a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 1248290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 1249a65d3064SKris Buschelman break; 1250b87ac2d8SJed Brown case MAT_USE_INODES: 1251b87ac2d8SJed Brown /* Not an error because MatSetOption_SeqAIJ_Inode handles this one */ 1252b87ac2d8SJed Brown break; 1253c10200c1SHong Zhang case MAT_SUBMAT_SINGLEIS: 1254c10200c1SHong Zhang A->submat_singleis = flg; 1255c10200c1SHong Zhang break; 1256071fcb05SBarry Smith case MAT_SORTED_FULL: 1257071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1258071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1259071fcb05SBarry Smith break; 1260a65d3064SKris Buschelman default: 1261e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 1262a65d3064SKris Buschelman } 12634108e4d5SBarry Smith ierr = MatSetOption_SeqAIJ_Inode(A,op,flg);CHKERRQ(ierr); 12643a40ed3dSBarry Smith PetscFunctionReturn(0); 126517ab2063SBarry Smith } 126617ab2063SBarry Smith 1267dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 126817ab2063SBarry Smith { 1269416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12706849ba73SBarry Smith PetscErrorCode ierr; 1271fdc842d1SBarry Smith 
PetscInt i,j,n,*ai=a->i,*aj=a->j; 1272fdc842d1SBarry Smith PetscScalar *aa=a->a,*x; 127317ab2063SBarry Smith 12743a40ed3dSBarry Smith PetscFunctionBegin; 1275d3e70bfaSHong Zhang ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 1276e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 127735e7444dSHong Zhang 1278d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1279d3e70bfaSHong Zhang PetscInt *diag=a->diag; 1280fdc842d1SBarry Smith ierr = VecGetArrayWrite(v,&x);CHKERRQ(ierr); 12812c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 1282fdc842d1SBarry Smith ierr = VecRestoreArrayWrite(v,&x);CHKERRQ(ierr); 128335e7444dSHong Zhang PetscFunctionReturn(0); 128435e7444dSHong Zhang } 128535e7444dSHong Zhang 1286fdc842d1SBarry Smith ierr = VecGetArrayWrite(v,&x);CHKERRQ(ierr); 128735e7444dSHong Zhang for (i=0; i<n; i++) { 1288fdc842d1SBarry Smith x[i] = 0.0; 128935e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++) { 129035e7444dSHong Zhang if (aj[j] == i) { 129135e7444dSHong Zhang x[i] = aa[j]; 129217ab2063SBarry Smith break; 129317ab2063SBarry Smith } 129417ab2063SBarry Smith } 129517ab2063SBarry Smith } 1296fdc842d1SBarry Smith ierr = VecRestoreArrayWrite(v,&x);CHKERRQ(ierr); 12973a40ed3dSBarry Smith PetscFunctionReturn(0); 129817ab2063SBarry Smith } 129917ab2063SBarry Smith 1300c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1301dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 130217ab2063SBarry Smith { 1303416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1304d9ca1df4SBarry Smith PetscScalar *y; 1305d9ca1df4SBarry Smith const PetscScalar *x; 1306dfbe8321SBarry Smith PetscErrorCode ierr; 1307d0f46423SBarry Smith PetscInt m = A->rmap->n; 13085c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1309d9ca1df4SBarry Smith const MatScalar *v; 1310a77337e4SBarry 
Smith PetscScalar alpha; 1311d9ca1df4SBarry Smith PetscInt n,i,j; 1312d9ca1df4SBarry Smith const PetscInt *idx,*ii,*ridx=NULL; 13133447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1314ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 13155c897100SBarry Smith #endif 131617ab2063SBarry Smith 13173a40ed3dSBarry Smith PetscFunctionBegin; 13182e8a6d31SBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 1319d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13201ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 13215c897100SBarry Smith 13225c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1323bfeeae90SHong Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,a->a,y); 13245c897100SBarry Smith #else 13253447b6efSHong Zhang if (usecprow) { 13263447b6efSHong Zhang m = cprow.nrows; 13273447b6efSHong Zhang ii = cprow.i; 13287b2bb3b9SHong Zhang ridx = cprow.rindex; 13293447b6efSHong Zhang } else { 13303447b6efSHong Zhang ii = a->i; 13313447b6efSHong Zhang } 133217ab2063SBarry Smith for (i=0; i<m; i++) { 13333447b6efSHong Zhang idx = a->j + ii[i]; 13343447b6efSHong Zhang v = a->a + ii[i]; 13353447b6efSHong Zhang n = ii[i+1] - ii[i]; 13363447b6efSHong Zhang if (usecprow) { 13377b2bb3b9SHong Zhang alpha = x[ridx[i]]; 13383447b6efSHong Zhang } else { 133917ab2063SBarry Smith alpha = x[i]; 13403447b6efSHong Zhang } 134104fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 134217ab2063SBarry Smith } 13435c897100SBarry Smith #endif 1344dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1345d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 13461ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 13473a40ed3dSBarry Smith PetscFunctionReturn(0); 134817ab2063SBarry Smith } 134917ab2063SBarry Smith 1350dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 13515c897100SBarry Smith { 1352dfbe8321SBarry Smith PetscErrorCode 
ierr; 13535c897100SBarry Smith 13545c897100SBarry Smith PetscFunctionBegin; 1355170fe5c8SBarry Smith ierr = VecSet(yy,0.0);CHKERRQ(ierr); 13565c897100SBarry Smith ierr = MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy);CHKERRQ(ierr); 13575c897100SBarry Smith PetscFunctionReturn(0); 13585c897100SBarry Smith } 13595c897100SBarry Smith 1360c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 136178b84d54SShri Abhyankar 1362dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 136317ab2063SBarry Smith { 1364416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1365d9fead3dSBarry Smith PetscScalar *y; 136654f21887SBarry Smith const PetscScalar *x; 136754f21887SBarry Smith const MatScalar *aa; 1368dfbe8321SBarry Smith PetscErrorCode ierr; 1369003131ecSBarry Smith PetscInt m=A->rmap->n; 13700298fd71SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 13717b083b7cSBarry Smith PetscInt n,i; 1372362ced78SSatish Balay PetscScalar sum; 1373ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 137417ab2063SBarry Smith 1375b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 137697952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1377fee21e36SBarry Smith #endif 1378fee21e36SBarry Smith 13793a40ed3dSBarry Smith PetscFunctionBegin; 13803649974fSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13811ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 1382416022c9SBarry Smith ii = a->i; 13834eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 1384580bdb30SBarry Smith ierr = PetscArrayzero(y,m);CHKERRQ(ierr); 138597952fefSHong Zhang m = a->compressedrow.nrows; 138697952fefSHong Zhang ii = a->compressedrow.i; 138797952fefSHong Zhang ridx = a->compressedrow.rindex; 138897952fefSHong Zhang for (i=0; i<m; i++) { 138997952fefSHong Zhang n = ii[i+1] - ii[i]; 139097952fefSHong Zhang aj = a->j + ii[i]; 139197952fefSHong Zhang aa = a->a + ii[i]; 139297952fefSHong Zhang sum = 0.0; 1393003131ecSBarry Smith 
PetscSparseDensePlusDot(sum,x,aa,aj,n); 1394003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 139597952fefSHong Zhang y[*ridx++] = sum; 139697952fefSHong Zhang } 139797952fefSHong Zhang } else { /* do not use compressed row format */ 1398b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 13993d3eaba7SBarry Smith aj = a->j; 14003d3eaba7SBarry Smith aa = a->a; 1401b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1402b05257ddSBarry Smith #else 140317ab2063SBarry Smith for (i=0; i<m; i++) { 1404003131ecSBarry Smith n = ii[i+1] - ii[i]; 1405003131ecSBarry Smith aj = a->j + ii[i]; 1406003131ecSBarry Smith aa = a->a + ii[i]; 140717ab2063SBarry Smith sum = 0.0; 1408003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 140917ab2063SBarry Smith y[i] = sum; 141017ab2063SBarry Smith } 14118d195f9aSBarry Smith #endif 1412b05257ddSBarry Smith } 14137b083b7cSBarry Smith ierr = PetscLogFlops(2.0*a->nz - a->nonzerorowcnt);CHKERRQ(ierr); 14143649974fSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 14151ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 14163a40ed3dSBarry Smith PetscFunctionReturn(0); 141717ab2063SBarry Smith } 141817ab2063SBarry Smith 1419b434eb95SMatthew G. Knepley PetscErrorCode MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy) 1420b434eb95SMatthew G. Knepley { 1421b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1422b434eb95SMatthew G. Knepley PetscScalar *y; 1423b434eb95SMatthew G. Knepley const PetscScalar *x; 1424b434eb95SMatthew G. Knepley const MatScalar *aa; 1425b434eb95SMatthew G. Knepley PetscErrorCode ierr; 1426b434eb95SMatthew G. Knepley PetscInt m=A->rmap->n; 1427b434eb95SMatthew G. Knepley const PetscInt *aj,*ii,*ridx=NULL; 1428b434eb95SMatthew G. Knepley PetscInt n,i,nonzerorow=0; 1429b434eb95SMatthew G. Knepley PetscScalar sum; 1430b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1431b434eb95SMatthew G. Knepley 1432b434eb95SMatthew G. 
Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1433b434eb95SMatthew G. Knepley #pragma disjoint(*x,*y,*aa) 1434b434eb95SMatthew G. Knepley #endif 1435b434eb95SMatthew G. Knepley 1436b434eb95SMatthew G. Knepley PetscFunctionBegin; 1437b434eb95SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1438b434eb95SMatthew G. Knepley ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 1439b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1440b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1441b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1442b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1443b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1444b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1445b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1446b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1447b434eb95SMatthew G. Knepley sum = 0.0; 1448b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1449b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1450b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1451b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1452b434eb95SMatthew G. Knepley } 1453b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 14543d3eaba7SBarry Smith ii = a->i; 1455b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1456b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1457b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1458b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1459b434eb95SMatthew G. Knepley sum = 0.0; 1460b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1461b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1462b434eb95SMatthew G. Knepley y[i] = sum; 1463b434eb95SMatthew G. Knepley } 1464b434eb95SMatthew G. Knepley } 1465b434eb95SMatthew G. Knepley ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 1466b434eb95SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1467b434eb95SMatthew G. 
Knepley ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 1468b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1469b434eb95SMatthew G. Knepley } 1470b434eb95SMatthew G. Knepley 1471b434eb95SMatthew G. Knepley PetscErrorCode MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 1472b434eb95SMatthew G. Knepley { 1473b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1474b434eb95SMatthew G. Knepley PetscScalar *y,*z; 1475b434eb95SMatthew G. Knepley const PetscScalar *x; 1476b434eb95SMatthew G. Knepley const MatScalar *aa; 1477b434eb95SMatthew G. Knepley PetscErrorCode ierr; 1478b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n,*aj,*ii; 1479b434eb95SMatthew G. Knepley PetscInt n,i,*ridx=NULL; 1480b434eb95SMatthew G. Knepley PetscScalar sum; 1481b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1482b434eb95SMatthew G. Knepley 1483b434eb95SMatthew G. Knepley PetscFunctionBegin; 1484b434eb95SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1485d9ca1df4SBarry Smith ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 1486b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1487b434eb95SMatthew G. Knepley if (zz != yy) { 1488580bdb30SBarry Smith ierr = PetscArraycpy(z,y,m);CHKERRQ(ierr); 1489b434eb95SMatthew G. Knepley } 1490b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1491b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1492b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1493b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1494b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1495b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1496b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1497b434eb95SMatthew G. Knepley sum = y[*ridx]; 1498b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1499b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1500b434eb95SMatthew G. Knepley } 1501b434eb95SMatthew G. 
Knepley } else { /* do not use compressed row format */ 15023d3eaba7SBarry Smith ii = a->i; 1503b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1504b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1505b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1506b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1507b434eb95SMatthew G. Knepley sum = y[i]; 1508b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1509b434eb95SMatthew G. Knepley z[i] = sum; 1510b434eb95SMatthew G. Knepley } 1511b434eb95SMatthew G. Knepley } 1512b434eb95SMatthew G. Knepley ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1513b434eb95SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1514d9ca1df4SBarry Smith ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 1515b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1516b434eb95SMatthew G. Knepley } 1517b434eb95SMatthew G. Knepley 1518c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1519dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 152017ab2063SBarry Smith { 1521416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1522f15663dcSBarry Smith PetscScalar *y,*z; 1523f15663dcSBarry Smith const PetscScalar *x; 152454f21887SBarry Smith const MatScalar *aa; 1525dfbe8321SBarry Smith PetscErrorCode ierr; 1526d9ca1df4SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 1527d9ca1df4SBarry Smith PetscInt m = A->rmap->n,n,i; 1528362ced78SSatish Balay PetscScalar sum; 1529ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 15309ea0dfa2SSatish Balay 15313a40ed3dSBarry Smith PetscFunctionBegin; 1532f15663dcSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1533d9ca1df4SBarry Smith ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 15344eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 15354eb6d288SHong Zhang if (zz != yy) { 1536580bdb30SBarry Smith ierr = PetscArraycpy(z,y,m);CHKERRQ(ierr); 15374eb6d288SHong Zhang } 153897952fefSHong 
Zhang m = a->compressedrow.nrows; 153997952fefSHong Zhang ii = a->compressedrow.i; 154097952fefSHong Zhang ridx = a->compressedrow.rindex; 154197952fefSHong Zhang for (i=0; i<m; i++) { 154297952fefSHong Zhang n = ii[i+1] - ii[i]; 154397952fefSHong Zhang aj = a->j + ii[i]; 154497952fefSHong Zhang aa = a->a + ii[i]; 154597952fefSHong Zhang sum = y[*ridx]; 1546f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 154797952fefSHong Zhang z[*ridx++] = sum; 154897952fefSHong Zhang } 154997952fefSHong Zhang } else { /* do not use compressed row format */ 15503d3eaba7SBarry Smith ii = a->i; 1551f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 15523d3eaba7SBarry Smith aj = a->j; 15533d3eaba7SBarry Smith aa = a->a; 1554f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1555f15663dcSBarry Smith #else 155617ab2063SBarry Smith for (i=0; i<m; i++) { 1557f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1558f15663dcSBarry Smith aj = a->j + ii[i]; 1559f15663dcSBarry Smith aa = a->a + ii[i]; 156017ab2063SBarry Smith sum = y[i]; 1561f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 156217ab2063SBarry Smith z[i] = sum; 156317ab2063SBarry Smith } 156402ab625aSSatish Balay #endif 1565f15663dcSBarry Smith } 1566dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1567f15663dcSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1568d9ca1df4SBarry Smith ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 15693a40ed3dSBarry Smith PetscFunctionReturn(0); 157017ab2063SBarry Smith } 157117ab2063SBarry Smith 157217ab2063SBarry Smith /* 157317ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
157417ab2063SBarry Smith */ 1575dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 157617ab2063SBarry Smith { 1577416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 15786849ba73SBarry Smith PetscErrorCode ierr; 1579d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 158017ab2063SBarry Smith 15813a40ed3dSBarry Smith PetscFunctionBegin; 158209f38230SBarry Smith if (!a->diag) { 1583785e854fSJed Brown ierr = PetscMalloc1(m,&a->diag);CHKERRQ(ierr); 15843bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A, m*sizeof(PetscInt));CHKERRQ(ierr); 158509f38230SBarry Smith } 1586d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 158709f38230SBarry Smith a->diag[i] = a->i[i+1]; 1588bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1589bfeeae90SHong Zhang if (a->j[j] == i) { 159009f38230SBarry Smith a->diag[i] = j; 159117ab2063SBarry Smith break; 159217ab2063SBarry Smith } 159317ab2063SBarry Smith } 159417ab2063SBarry Smith } 15953a40ed3dSBarry Smith PetscFunctionReturn(0); 159617ab2063SBarry Smith } 159717ab2063SBarry Smith 159861ecd0c6SBarry Smith PetscErrorCode MatShift_SeqAIJ(Mat A,PetscScalar v) 159961ecd0c6SBarry Smith { 160061ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 160161ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt*)a->diag; 160261ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt*) a->i; 160361ecd0c6SBarry Smith PetscInt i,*mdiag = NULL; 160461ecd0c6SBarry Smith PetscErrorCode ierr; 160561ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 160661ecd0c6SBarry Smith 160761ecd0c6SBarry Smith PetscFunctionBegin; 160861ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 160961ecd0c6SBarry Smith ierr = MatSeqAIJSetPreallocation(A,1,NULL);CHKERRQ(ierr); 161061ecd0c6SBarry Smith ierr = MatShift_Basic(A,v);CHKERRQ(ierr); 161161ecd0c6SBarry Smith PetscFunctionReturn(0); 161261ecd0c6SBarry Smith } 161361ecd0c6SBarry Smith 161461ecd0c6SBarry Smith if (a->diagonaldense) { 161561ecd0c6SBarry 
Smith cnt = 0; 161661ecd0c6SBarry Smith } else { 161761ecd0c6SBarry Smith ierr = PetscCalloc1(A->rmap->n,&mdiag);CHKERRQ(ierr); 161861ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 161961ecd0c6SBarry Smith if (diag[i] >= ii[i+1]) { 162061ecd0c6SBarry Smith cnt++; 162161ecd0c6SBarry Smith mdiag[i] = 1; 162261ecd0c6SBarry Smith } 162361ecd0c6SBarry Smith } 162461ecd0c6SBarry Smith } 162561ecd0c6SBarry Smith if (!cnt) { 162661ecd0c6SBarry Smith ierr = MatShift_Basic(A,v);CHKERRQ(ierr); 162761ecd0c6SBarry Smith } else { 1628b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1629b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 163061ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc,free_a = a->free_a,free_ij = a->free_ij; 163161ecd0c6SBarry Smith 163261ecd0c6SBarry Smith a->a = NULL; 163361ecd0c6SBarry Smith a->j = NULL; 163461ecd0c6SBarry Smith a->i = NULL; 163561ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 163661ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 163761ecd0c6SBarry Smith a->imax[i] += mdiag[i]; 1638447d62f5SStefano Zampini a->imax[i] = PetscMin(a->imax[i],A->cmap->n); 163961ecd0c6SBarry Smith } 164061ecd0c6SBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,0,a->imax);CHKERRQ(ierr); 164161ecd0c6SBarry Smith 164261ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 164361ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 164461ecd0c6SBarry Smith ierr = MatSetValues(A,1,&i,a->imax[i] - mdiag[i],&oldj[oldi[i]],&olda[oldi[i]],ADD_VALUES);CHKERRQ(ierr); 1645447d62f5SStefano Zampini if (i < A->cmap->n) { 164661ecd0c6SBarry Smith ierr = MatSetValue(A,i,i,v,ADD_VALUES);CHKERRQ(ierr); 164761ecd0c6SBarry Smith } 1648447d62f5SStefano Zampini } 164961ecd0c6SBarry Smith ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 165061ecd0c6SBarry Smith ierr 
= MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 165161ecd0c6SBarry Smith if (singlemalloc) { 165261ecd0c6SBarry Smith ierr = PetscFree3(olda,oldj,oldi);CHKERRQ(ierr); 165361ecd0c6SBarry Smith } else { 165461ecd0c6SBarry Smith if (free_a) {ierr = PetscFree(olda);CHKERRQ(ierr);} 165561ecd0c6SBarry Smith if (free_ij) {ierr = PetscFree(oldj);CHKERRQ(ierr);} 165661ecd0c6SBarry Smith if (free_ij) {ierr = PetscFree(oldi);CHKERRQ(ierr);} 165761ecd0c6SBarry Smith } 165861ecd0c6SBarry Smith } 165961ecd0c6SBarry Smith ierr = PetscFree(mdiag);CHKERRQ(ierr); 166061ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 166161ecd0c6SBarry Smith PetscFunctionReturn(0); 166261ecd0c6SBarry Smith } 166361ecd0c6SBarry Smith 1664be5855fcSBarry Smith /* 1665be5855fcSBarry Smith Checks for missing diagonals 1666be5855fcSBarry Smith */ 1667ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1668be5855fcSBarry Smith { 1669be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 16707734d3b5SMatthew G. Knepley PetscInt *diag,*ii = a->i,i; 1671994fe344SLisandro Dalcin PetscErrorCode ierr; 1672be5855fcSBarry Smith 1673be5855fcSBarry Smith PetscFunctionBegin; 167409f38230SBarry Smith *missing = PETSC_FALSE; 16757734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 167609f38230SBarry Smith *missing = PETSC_TRUE; 167709f38230SBarry Smith if (d) *d = 0; 1678994fe344SLisandro Dalcin ierr = PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n");CHKERRQ(ierr); 167909f38230SBarry Smith } else { 168001445905SHong Zhang PetscInt n; 168101445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1682f1e2ffcdSBarry Smith diag = a->diag; 168301445905SHong Zhang for (i=0; i<n; i++) { 16847734d3b5SMatthew G. 
Knepley if (diag[i] >= ii[i+1]) { 168509f38230SBarry Smith *missing = PETSC_TRUE; 168609f38230SBarry Smith if (d) *d = i; 1687994fe344SLisandro Dalcin ierr = PetscInfo1(A,"Matrix is missing diagonal number %D\n",i);CHKERRQ(ierr); 1688358d2f5dSShri Abhyankar break; 168909f38230SBarry Smith } 1690be5855fcSBarry Smith } 1691be5855fcSBarry Smith } 1692be5855fcSBarry Smith PetscFunctionReturn(0); 1693be5855fcSBarry Smith } 1694be5855fcSBarry Smith 16950da83c2eSBarry Smith #include <petscblaslapack.h> 16960da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 16970da83c2eSBarry Smith 16980da83c2eSBarry Smith /* 16990da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 17000da83c2eSBarry Smith */ 17010da83c2eSBarry Smith PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt *bsizes,PetscScalar *diag) 17020da83c2eSBarry Smith { 17030da83c2eSBarry Smith PetscErrorCode ierr; 17040da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx,j,bsizemax = 0,*v_pivots; 17050da83c2eSBarry Smith PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 17060da83c2eSBarry Smith const PetscReal shift = 0.0; 17070da83c2eSBarry Smith PetscInt ipvt[5]; 17080da83c2eSBarry Smith PetscScalar work[25],*v_work; 17090da83c2eSBarry Smith 17100da83c2eSBarry Smith PetscFunctionBegin; 17110da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 17120da83c2eSBarry Smith for (i=0; i<nblocks; i++) ncnt += bsizes[i]; 17130da83c2eSBarry Smith if (ncnt != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Total blocksizes %D doesn't match number matrix rows %D",ncnt,n); 17140da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 17150da83c2eSBarry Smith bsizemax = PetscMax(bsizemax,bsizes[i]); 17160da83c2eSBarry Smith } 17170da83c2eSBarry Smith ierr = PetscMalloc1(bsizemax,&indx);CHKERRQ(ierr); 17180da83c2eSBarry Smith if (bsizemax > 7) { 17190da83c2eSBarry Smith ierr = 
PetscMalloc2(bsizemax,&v_work,bsizemax,&v_pivots);CHKERRQ(ierr); 17200da83c2eSBarry Smith } 17210da83c2eSBarry Smith ncnt = 0; 17220da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 17230da83c2eSBarry Smith for (j=0; j<bsizes[i]; j++) indx[j] = ncnt+j; 17240da83c2eSBarry Smith ierr = MatGetValues(A,bsizes[i],indx,bsizes[i],indx,diag);CHKERRQ(ierr); 17250da83c2eSBarry Smith switch (bsizes[i]) { 17260da83c2eSBarry Smith case 1: 17270da83c2eSBarry Smith *diag = 1.0/(*diag); 17280da83c2eSBarry Smith break; 17290da83c2eSBarry Smith case 2: 17300da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17310da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17320da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr); 17330da83c2eSBarry Smith break; 17340da83c2eSBarry Smith case 3: 17350da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17360da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17370da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr); 17380da83c2eSBarry Smith break; 17390da83c2eSBarry Smith case 4: 17400da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17410da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17420da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr); 17430da83c2eSBarry Smith break; 17440da83c2eSBarry Smith case 5: 17450da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17460da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17470da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr); 17480da83c2eSBarry 
Smith break; 17490da83c2eSBarry Smith case 6: 17500da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17510da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17520da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr); 17530da83c2eSBarry Smith break; 17540da83c2eSBarry Smith case 7: 17550da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17560da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17570da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr); 17580da83c2eSBarry Smith break; 17590da83c2eSBarry Smith default: 17600da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A(bsizes[i],diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17610da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17620da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_N(diag,bsizes[i]);CHKERRQ(ierr); 17630da83c2eSBarry Smith } 17640da83c2eSBarry Smith ncnt += bsizes[i]; 17650da83c2eSBarry Smith diag += bsizes[i]*bsizes[i]; 17660da83c2eSBarry Smith } 17670da83c2eSBarry Smith if (bsizemax > 7) { 17680da83c2eSBarry Smith ierr = PetscFree2(v_work,v_pivots);CHKERRQ(ierr); 17690da83c2eSBarry Smith } 17700da83c2eSBarry Smith ierr = PetscFree(indx);CHKERRQ(ierr); 17710da83c2eSBarry Smith PetscFunctionReturn(0); 17720da83c2eSBarry Smith } 17730da83c2eSBarry Smith 1774422a814eSBarry Smith /* 1775422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1776422a814eSBarry Smith */ 17777087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 177871f1c65dSBarry Smith { 177971f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 178071f1c65dSBarry 
Smith PetscErrorCode ierr; 1781d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 178254f21887SBarry Smith MatScalar *v = a->a; 178354f21887SBarry Smith PetscScalar *idiag,*mdiag; 178471f1c65dSBarry Smith 178571f1c65dSBarry Smith PetscFunctionBegin; 178671f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 178771f1c65dSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 178871f1c65dSBarry Smith diag = a->diag; 178971f1c65dSBarry Smith if (!a->idiag) { 1790dcca6d9dSJed Brown ierr = PetscMalloc3(m,&a->idiag,m,&a->mdiag,m,&a->ssor_work);CHKERRQ(ierr); 17913bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A, 3*m*sizeof(PetscScalar));CHKERRQ(ierr); 179271f1c65dSBarry Smith v = a->a; 179371f1c65dSBarry Smith } 179471f1c65dSBarry Smith mdiag = a->mdiag; 179571f1c65dSBarry Smith idiag = a->idiag; 179671f1c65dSBarry Smith 1797422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 179871f1c65dSBarry Smith for (i=0; i<m; i++) { 179971f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1800899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1801899639b0SHong Zhang if (PetscRealPart(fshift)) { 1802899639b0SHong Zhang ierr = PetscInfo1(A,"Zero diagonal on row %D\n",i);CHKERRQ(ierr); 18037b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18047b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18057b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 1806a6fa060aSHong Zhang } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %D",i); 1807899639b0SHong Zhang } 180871f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 180971f1c65dSBarry Smith } 181071f1c65dSBarry Smith ierr = PetscLogFlops(m);CHKERRQ(ierr); 181171f1c65dSBarry Smith } else { 181271f1c65dSBarry Smith for (i=0; i<m; i++) { 181371f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 181471f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 181571f1c65dSBarry Smith } 1816dc0b31edSSatish Balay ierr = 
PetscLogFlops(2.0*m);CHKERRQ(ierr); 181771f1c65dSBarry Smith } 181871f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 181971f1c65dSBarry Smith PetscFunctionReturn(0); 182071f1c65dSBarry Smith } 182171f1c65dSBarry Smith 1822c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 182341f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 182417ab2063SBarry Smith { 1825416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1826e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 18273d3eaba7SBarry Smith const MatScalar *v,*idiag=0,*mdiag; 182854f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 1829dfbe8321SBarry Smith PetscErrorCode ierr; 18303d3eaba7SBarry Smith PetscInt n,m = A->rmap->n,i; 183197f1f81fSBarry Smith const PetscInt *idx,*diag; 183217ab2063SBarry Smith 18333a40ed3dSBarry Smith PetscFunctionBegin; 1834b965ef7fSBarry Smith its = its*lits; 183591723122SBarry Smith 183671f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 183771f1c65dSBarry Smith if (!a->idiagvalid) {ierr = MatInvertDiagonal_SeqAIJ(A,omega,fshift);CHKERRQ(ierr);} 183871f1c65dSBarry Smith a->fshift = fshift; 183971f1c65dSBarry Smith a->omega = omega; 1840ed480e8bSBarry Smith 184171f1c65dSBarry Smith diag = a->diag; 184271f1c65dSBarry Smith t = a->ssor_work; 1843ed480e8bSBarry Smith idiag = a->idiag; 184471f1c65dSBarry Smith mdiag = a->mdiag; 1845ed480e8bSBarry Smith 18461ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 18473649974fSBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 1848ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 184917ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 185017ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1851ed480e8bSBarry Smith bs = b; 185217ab2063SBarry 
Smith for (i=0; i<m; i++) { 185371f1c65dSBarry Smith d = fshift + mdiag[i]; 1854416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1855ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1856ed480e8bSBarry Smith v = a->a + diag[i] + 1; 185717ab2063SBarry Smith sum = b[i]*d/omega; 1858003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 185917ab2063SBarry Smith x[i] = sum; 186017ab2063SBarry Smith } 18611ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 18623649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1863efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 18643a40ed3dSBarry Smith PetscFunctionReturn(0); 186517ab2063SBarry Smith } 1866c783ea89SBarry Smith 18672205254eSKarl Rupp if (flag == SOR_APPLY_LOWER) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 18682205254eSKarl Rupp else if (flag & SOR_EISENSTAT) { 18694c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1870887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 187117ab2063SBarry Smith 187217ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 187317ab2063SBarry Smith 1874887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 
187517ab2063SBarry Smith */ 187617ab2063SBarry Smith scale = (2.0/omega) - 1.0; 187717ab2063SBarry Smith 187817ab2063SBarry Smith /* x = (E + U)^{-1} b */ 187917ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1880416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1881ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1882ed480e8bSBarry Smith v = a->a + diag[i] + 1; 188317ab2063SBarry Smith sum = b[i]; 1884e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1885ed480e8bSBarry Smith x[i] = sum*idiag[i]; 188617ab2063SBarry Smith } 188717ab2063SBarry Smith 188817ab2063SBarry Smith /* t = b - (2*E - D)x */ 1889416022c9SBarry Smith v = a->a; 18902205254eSKarl Rupp for (i=0; i<m; i++) t[i] = b[i] - scale*(v[*diag++])*x[i]; 189117ab2063SBarry Smith 189217ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1893ed480e8bSBarry Smith ts = t; 1894416022c9SBarry Smith diag = a->diag; 189517ab2063SBarry Smith for (i=0; i<m; i++) { 1896416022c9SBarry Smith n = diag[i] - a->i[i]; 1897ed480e8bSBarry Smith idx = a->j + a->i[i]; 1898ed480e8bSBarry Smith v = a->a + a->i[i]; 189917ab2063SBarry Smith sum = t[i]; 1900003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 1901ed480e8bSBarry Smith t[i] = sum*idiag[i]; 1902733d66baSBarry Smith /* x = x + t */ 1903733d66baSBarry Smith x[i] += t[i]; 190417ab2063SBarry Smith } 190517ab2063SBarry Smith 1906dc0b31edSSatish Balay ierr = PetscLogFlops(6.0*m-1 + 2.0*a->nz);CHKERRQ(ierr); 19071ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 19083649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 19093a40ed3dSBarry Smith PetscFunctionReturn(0); 191017ab2063SBarry Smith } 191117ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 191217ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 191317ab2063SBarry Smith for (i=0; i<m; i++) { 1914416022c9SBarry Smith n = diag[i] - a->i[i]; 1915ed480e8bSBarry Smith idx = a->j + a->i[i]; 1916ed480e8bSBarry Smith v = a->a + a->i[i]; 
191717ab2063SBarry Smith sum = b[i]; 1918e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 19195c99c7daSBarry Smith t[i] = sum; 1920ed480e8bSBarry Smith x[i] = sum*idiag[i]; 192117ab2063SBarry Smith } 19225c99c7daSBarry Smith xb = t; 1923efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 19243a40ed3dSBarry Smith } else xb = b; 192517ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 192617ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1927416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1928ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1929ed480e8bSBarry Smith v = a->a + diag[i] + 1; 193017ab2063SBarry Smith sum = xb[i]; 1931e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 19325c99c7daSBarry Smith if (xb == b) { 1933ed480e8bSBarry Smith x[i] = sum*idiag[i]; 19345c99c7daSBarry Smith } else { 1935b19a5dc2SMark Adams x[i] = (1-omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 193617ab2063SBarry Smith } 19375c99c7daSBarry Smith } 1938b19a5dc2SMark Adams ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */ 193917ab2063SBarry Smith } 194017ab2063SBarry Smith its--; 194117ab2063SBarry Smith } 194217ab2063SBarry Smith while (its--) { 194317ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 194417ab2063SBarry Smith for (i=0; i<m; i++) { 1945b19a5dc2SMark Adams /* lower */ 1946b19a5dc2SMark Adams n = diag[i] - a->i[i]; 1947ed480e8bSBarry Smith idx = a->j + a->i[i]; 1948ed480e8bSBarry Smith v = a->a + a->i[i]; 194917ab2063SBarry Smith sum = b[i]; 1950e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1951b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 1952b19a5dc2SMark Adams /* upper */ 1953b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 1954b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 1955b19a5dc2SMark Adams v = a->a + diag[i] + 1; 1956b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 
1957b19a5dc2SMark Adams x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 195817ab2063SBarry Smith } 1959b19a5dc2SMark Adams xb = t; 19609f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1961b19a5dc2SMark Adams } else xb = b; 196217ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 196317ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1964b19a5dc2SMark Adams sum = xb[i]; 1965b19a5dc2SMark Adams if (xb == b) { 1966b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 1967416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1968ed480e8bSBarry Smith idx = a->j + a->i[i]; 1969ed480e8bSBarry Smith v = a->a + a->i[i]; 1970e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1971ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 1972b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 1973b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 1974b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 1975b19a5dc2SMark Adams v = a->a + diag[i] + 1; 1976b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 1977b19a5dc2SMark Adams x[i] = (1. 
- omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 197817ab2063SBarry Smith } 1979b19a5dc2SMark Adams } 1980b19a5dc2SMark Adams if (xb == b) { 19819f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1982b19a5dc2SMark Adams } else { 1983b19a5dc2SMark Adams ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */ 1984b19a5dc2SMark Adams } 198517ab2063SBarry Smith } 198617ab2063SBarry Smith } 19871ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 19883649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1989365a8a9eSBarry Smith PetscFunctionReturn(0); 199017ab2063SBarry Smith } 199117ab2063SBarry Smith 19922af78befSBarry Smith 1993dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 199417ab2063SBarry Smith { 1995416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 19964e220ebcSLois Curfman McInnes 19973a40ed3dSBarry Smith PetscFunctionBegin; 19984e220ebcSLois Curfman McInnes info->block_size = 1.0; 19993966268fSBarry Smith info->nz_allocated = a->maxnz; 20003966268fSBarry Smith info->nz_used = a->nz; 20013966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 20023966268fSBarry Smith info->assemblies = A->num_ass; 20033966268fSBarry Smith info->mallocs = A->info.mallocs; 20047adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 2005d5f3da31SBarry Smith if (A->factortype) { 20064e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 20074e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 20084e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 20094e220ebcSLois Curfman McInnes } else { 20104e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 20114e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 20124e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 20134e220ebcSLois Curfman McInnes } 20143a40ed3dSBarry Smith PetscFunctionReturn(0); 201517ab2063SBarry 
Smith } 201617ab2063SBarry Smith 20172b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 201817ab2063SBarry Smith { 2019416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2020c7da8527SEric Chamberland PetscInt i,m = A->rmap->n - 1; 20216849ba73SBarry Smith PetscErrorCode ierr; 202297b48c8fSBarry Smith const PetscScalar *xx; 202397b48c8fSBarry Smith PetscScalar *bb; 2024c7da8527SEric Chamberland PetscInt d = 0; 202517ab2063SBarry Smith 20263a40ed3dSBarry Smith PetscFunctionBegin; 202797b48c8fSBarry Smith if (x && b) { 202897b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 202997b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 203097b48c8fSBarry Smith for (i=0; i<N; i++) { 203197b48c8fSBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2032447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 203397b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 203497b48c8fSBarry Smith } 203597b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 203697b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 203797b48c8fSBarry Smith } 203897b48c8fSBarry Smith 2039a9817697SBarry Smith if (a->keepnonzeropattern) { 2040f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2041e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2042580bdb30SBarry Smith ierr = PetscArrayzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]);CHKERRQ(ierr); 2043f1e2ffcdSBarry Smith } 2044f4df32b1SMatthew Knepley if (diag != 0.0) { 2045c7da8527SEric Chamberland for (i=0; i<N; i++) { 2046c7da8527SEric Chamberland d = rows[i]; 2047447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 2048c7da8527SEric Chamberland if (a->diag[d] >= a->i[d+1]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in the 
zeroed row %D",d); 2049c7da8527SEric Chamberland } 2050f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2051447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 2052f4df32b1SMatthew Knepley a->a[a->diag[rows[i]]] = diag; 2053f1e2ffcdSBarry Smith } 2054f1e2ffcdSBarry Smith } 2055f1e2ffcdSBarry Smith } else { 2056f4df32b1SMatthew Knepley if (diag != 0.0) { 205717ab2063SBarry Smith for (i=0; i<N; i++) { 2058e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 20597ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2060447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2061447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2062447d62f5SStefano Zampini } else { 2063416022c9SBarry Smith a->ilen[rows[i]] = 1; 2064f4df32b1SMatthew Knepley a->a[a->i[rows[i]]] = diag; 2065bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2066447d62f5SStefano Zampini } 2067447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 2068f4df32b1SMatthew Knepley ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 206917ab2063SBarry Smith } 207017ab2063SBarry Smith } 20713a40ed3dSBarry Smith } else { 207217ab2063SBarry Smith for (i=0; i<N; i++) { 2073e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2074416022c9SBarry Smith a->ilen[rows[i]] = 0; 207517ab2063SBarry Smith } 207617ab2063SBarry Smith } 2077e56f5c9eSBarry Smith A->nonzerostate++; 2078f1e2ffcdSBarry Smith } 2079e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2080c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU; 2081e2cf4d64SStefano Zampini #endif 20824099cc6bSBarry Smith ierr = (*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20833a40ed3dSBarry Smith PetscFunctionReturn(0); 
208417ab2063SBarry Smith } 208517ab2063SBarry Smith 20866e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 20876e169961SBarry Smith { 20886e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 20896e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 20906e169961SBarry Smith PetscErrorCode ierr; 20912b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 20926e169961SBarry Smith const PetscScalar *xx; 20936e169961SBarry Smith PetscScalar *bb; 20946e169961SBarry Smith 20956e169961SBarry Smith PetscFunctionBegin; 20966e169961SBarry Smith if (x && b) { 20976e169961SBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 20986e169961SBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 20992b40b63fSBarry Smith vecs = PETSC_TRUE; 21006e169961SBarry Smith } 21011795a4d1SJed Brown ierr = PetscCalloc1(A->rmap->n,&zeroed);CHKERRQ(ierr); 21026e169961SBarry Smith for (i=0; i<N; i++) { 21036e169961SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2104580bdb30SBarry Smith ierr = PetscArrayzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]);CHKERRQ(ierr); 21052205254eSKarl Rupp 21066e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 21076e169961SBarry Smith } 21086e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 21096e169961SBarry Smith if (!zeroed[i]) { 21106e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 21114cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 21122b40b63fSBarry Smith if (vecs) bb[i] -= a->a[j]*xx[a->j[j]]; 21136e169961SBarry Smith a->a[j] = 0.0; 21146e169961SBarry Smith } 21156e169961SBarry Smith } 21164cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag*xx[i]; 21176e169961SBarry Smith } 21186e169961SBarry Smith if (x && b) { 21196e169961SBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 21206e169961SBarry Smith ierr = 
VecRestoreArray(b,&bb);CHKERRQ(ierr); 21216e169961SBarry Smith } 21226e169961SBarry Smith ierr = PetscFree(zeroed);CHKERRQ(ierr); 21236e169961SBarry Smith if (diag != 0.0) { 21246e169961SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 21251d5a398dSstefano_zampini if (missing) { 21261d5a398dSstefano_zampini for (i=0; i<N; i++) { 21274cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 21284cf107fdSStefano Zampini if (a->nonew && rows[i] >= d) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D (%D)",d,rows[i]); 21291d5a398dSstefano_zampini ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 21301d5a398dSstefano_zampini } 21311d5a398dSstefano_zampini } else { 21326e169961SBarry Smith for (i=0; i<N; i++) { 21336e169961SBarry Smith a->a[a->diag[rows[i]]] = diag; 21346e169961SBarry Smith } 21356e169961SBarry Smith } 21361d5a398dSstefano_zampini } 2137e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2138c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU; 2139e2cf4d64SStefano Zampini #endif 21404099cc6bSBarry Smith ierr = (*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 21416e169961SBarry Smith PetscFunctionReturn(0); 21426e169961SBarry Smith } 21436e169961SBarry Smith 2144a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 214517ab2063SBarry Smith { 2146416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 214797f1f81fSBarry Smith PetscInt *itmp; 214817ab2063SBarry Smith 21493a40ed3dSBarry Smith PetscFunctionBegin; 2150e32f2f54SBarry Smith if (row < 0 || row >= A->rmap->n) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D out of range",row); 215117ab2063SBarry Smith 2152416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 2153bfeeae90SHong Zhang if (v) *v = a->a + a->i[row]; 
215417ab2063SBarry Smith if (idx) { 2155bfeeae90SHong Zhang itmp = a->j + a->i[row]; 215626fbe8dcSKarl Rupp if (*nz) *idx = itmp; 215717ab2063SBarry Smith else *idx = 0; 215817ab2063SBarry Smith } 21593a40ed3dSBarry Smith PetscFunctionReturn(0); 216017ab2063SBarry Smith } 216117ab2063SBarry Smith 2162bfeeae90SHong Zhang /* remove this function? */ 2163a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 216417ab2063SBarry Smith { 21653a40ed3dSBarry Smith PetscFunctionBegin; 21663a40ed3dSBarry Smith PetscFunctionReturn(0); 216717ab2063SBarry Smith } 216817ab2063SBarry Smith 2169dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 217017ab2063SBarry Smith { 2171416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 217254f21887SBarry Smith MatScalar *v = a->a; 217336db0b34SBarry Smith PetscReal sum = 0.0; 21746849ba73SBarry Smith PetscErrorCode ierr; 217597f1f81fSBarry Smith PetscInt i,j; 217617ab2063SBarry Smith 21773a40ed3dSBarry Smith PetscFunctionBegin; 217817ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2179570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2180570b7f6dSBarry Smith PetscBLASInt one = 1,nz = a->nz; 2181570b7f6dSBarry Smith *nrm = BLASnrm2_(&nz,v,&one); 2182570b7f6dSBarry Smith #else 2183416022c9SBarry Smith for (i=0; i<a->nz; i++) { 218436db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 218517ab2063SBarry Smith } 21868f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2187570b7f6dSBarry Smith #endif 218851f70360SJed Brown ierr = PetscLogFlops(2*a->nz);CHKERRQ(ierr); 21893a40ed3dSBarry Smith } else if (type == NORM_1) { 219036db0b34SBarry Smith PetscReal *tmp; 219197f1f81fSBarry Smith PetscInt *jj = a->j; 21921795a4d1SJed Brown ierr = PetscCalloc1(A->cmap->n+1,&tmp);CHKERRQ(ierr); 2193064f8208SBarry Smith *nrm = 0.0; 2194416022c9SBarry Smith for (j=0; j<a->nz; j++) { 2195bfeeae90SHong Zhang tmp[*jj++] += 
PetscAbsScalar(*v); v++; 219617ab2063SBarry Smith } 2197d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 2198064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 219917ab2063SBarry Smith } 2200606d414cSSatish Balay ierr = PetscFree(tmp);CHKERRQ(ierr); 220151f70360SJed Brown ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr); 22023a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2203064f8208SBarry Smith *nrm = 0.0; 2204d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 2205bfeeae90SHong Zhang v = a->a + a->i[j]; 220617ab2063SBarry Smith sum = 0.0; 2207416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 2208cddf8d76SBarry Smith sum += PetscAbsScalar(*v); v++; 220917ab2063SBarry Smith } 2210064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 221117ab2063SBarry Smith } 221251f70360SJed Brown ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr); 2213f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 22143a40ed3dSBarry Smith PetscFunctionReturn(0); 221517ab2063SBarry Smith } 221617ab2063SBarry Smith 22174e938277SHong Zhang /* Merged from MatGetSymbolicTranspose_SeqAIJ() - replace MatGetSymbolicTranspose_SeqAIJ()? 
*/ 22184e938277SHong Zhang PetscErrorCode MatTransposeSymbolic_SeqAIJ(Mat A,Mat *B) 22194e938277SHong Zhang { 22204e938277SHong Zhang PetscErrorCode ierr; 22214e938277SHong Zhang PetscInt i,j,anzj; 22224e938277SHong Zhang Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data,*b; 22234e938277SHong Zhang PetscInt an=A->cmap->N,am=A->rmap->N; 22244e938277SHong Zhang PetscInt *ati,*atj,*atfill,*ai=a->i,*aj=a->j; 22254e938277SHong Zhang 22264e938277SHong Zhang PetscFunctionBegin; 22274e938277SHong Zhang /* Allocate space for symbolic transpose info and work array */ 2228854ce69bSBarry Smith ierr = PetscCalloc1(an+1,&ati);CHKERRQ(ierr); 2229785e854fSJed Brown ierr = PetscMalloc1(ai[am],&atj);CHKERRQ(ierr); 2230785e854fSJed Brown ierr = PetscMalloc1(an,&atfill);CHKERRQ(ierr); 22314e938277SHong Zhang 22324e938277SHong Zhang /* Walk through aj and count ## of non-zeros in each row of A^T. */ 22334e938277SHong Zhang /* Note: offset by 1 for fast conversion into csr format. */ 223426fbe8dcSKarl Rupp for (i=0;i<ai[am];i++) ati[aj[i]+1] += 1; 22354e938277SHong Zhang /* Form ati for csr format of A^T. */ 223626fbe8dcSKarl Rupp for (i=0;i<an;i++) ati[i+1] += ati[i]; 22374e938277SHong Zhang 22384e938277SHong Zhang /* Copy ati into atfill so we have locations of the next free space in atj */ 2239580bdb30SBarry Smith ierr = PetscArraycpy(atfill,ati,an);CHKERRQ(ierr); 22404e938277SHong Zhang 22414e938277SHong Zhang /* Walk through A row-wise and mark nonzero entries of A^T. */ 22424e938277SHong Zhang for (i=0;i<am;i++) { 22434e938277SHong Zhang anzj = ai[i+1] - ai[i]; 22444e938277SHong Zhang for (j=0;j<anzj;j++) { 22454e938277SHong Zhang atj[atfill[*aj]] = i; 22464e938277SHong Zhang atfill[*aj++] += 1; 22474e938277SHong Zhang } 22484e938277SHong Zhang } 22494e938277SHong Zhang 22504e938277SHong Zhang /* Clean up temporary space and complete requests. 
*/ 22514e938277SHong Zhang ierr = PetscFree(atfill);CHKERRQ(ierr); 2252ce94432eSBarry Smith ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),an,am,ati,atj,NULL,B);CHKERRQ(ierr); 225333d57670SJed Brown ierr = MatSetBlockSizes(*B,PetscAbs(A->cmap->bs),PetscAbs(A->rmap->bs));CHKERRQ(ierr); 2254b5bb3eecSMark Adams ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2255a2f3521dSMark F. Adams 22564e938277SHong Zhang b = (Mat_SeqAIJ*)((*B)->data); 22574e938277SHong Zhang b->free_a = PETSC_FALSE; 22584e938277SHong Zhang b->free_ij = PETSC_TRUE; 22594e938277SHong Zhang b->nonew = 0; 22604e938277SHong Zhang PetscFunctionReturn(0); 22614e938277SHong Zhang } 22624e938277SHong Zhang 22637087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 2264cd0d46ebSvictorle { 22653d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 226654f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 226754f21887SBarry Smith MatScalar *va,*vb; 22686849ba73SBarry Smith PetscErrorCode ierr; 226997f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 2270cd0d46ebSvictorle 2271cd0d46ebSvictorle PetscFunctionBegin; 2272cd0d46ebSvictorle ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 2273cd0d46ebSvictorle ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 22745485867bSBarry Smith if (ma!=nb || na!=mb) { 22755485867bSBarry Smith *f = PETSC_FALSE; 22765485867bSBarry Smith PetscFunctionReturn(0); 22775485867bSBarry Smith } 2278cd0d46ebSvictorle aii = aij->i; bii = bij->i; 2279cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 2280cd0d46ebSvictorle va = aij->a; vb = bij->a; 2281785e854fSJed Brown ierr = PetscMalloc1(ma,&aptr);CHKERRQ(ierr); 2282785e854fSJed Brown ierr = PetscMalloc1(mb,&bptr);CHKERRQ(ierr); 2283cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 2284cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 2285cd0d46ebSvictorle 2286cd0d46ebSvictorle *f = PETSC_TRUE; 2287cd0d46ebSvictorle for (i=0; 
i<ma; i++) { 2288cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 228997f1f81fSBarry Smith PetscInt idc,idr; 22905485867bSBarry Smith PetscScalar vc,vr; 2291cd0d46ebSvictorle /* column/row index/value */ 22925485867bSBarry Smith idc = adx[aptr[i]]; 22935485867bSBarry Smith idr = bdx[bptr[idc]]; 22945485867bSBarry Smith vc = va[aptr[i]]; 22955485867bSBarry Smith vr = vb[bptr[idc]]; 22965485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 22975485867bSBarry Smith *f = PETSC_FALSE; 22985485867bSBarry Smith goto done; 2299cd0d46ebSvictorle } else { 23005485867bSBarry Smith aptr[i]++; 23015485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 2302cd0d46ebSvictorle } 2303cd0d46ebSvictorle } 2304cd0d46ebSvictorle } 2305cd0d46ebSvictorle done: 2306cd0d46ebSvictorle ierr = PetscFree(aptr);CHKERRQ(ierr); 23073aeef889SHong Zhang ierr = PetscFree(bptr);CHKERRQ(ierr); 2308cd0d46ebSvictorle PetscFunctionReturn(0); 2309cd0d46ebSvictorle } 2310cd0d46ebSvictorle 23117087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 23121cbb95d3SBarry Smith { 23133d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 231454f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 231554f21887SBarry Smith MatScalar *va,*vb; 23161cbb95d3SBarry Smith PetscErrorCode ierr; 23171cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 23181cbb95d3SBarry Smith 23191cbb95d3SBarry Smith PetscFunctionBegin; 23201cbb95d3SBarry Smith ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 23211cbb95d3SBarry Smith ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 23221cbb95d3SBarry Smith if (ma!=nb || na!=mb) { 23231cbb95d3SBarry Smith *f = PETSC_FALSE; 23241cbb95d3SBarry Smith PetscFunctionReturn(0); 23251cbb95d3SBarry Smith } 23261cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 23271cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 23281cbb95d3SBarry Smith va = aij->a; vb = bij->a; 2329785e854fSJed Brown ierr = 
PetscMalloc1(ma,&aptr);CHKERRQ(ierr); 2330785e854fSJed Brown ierr = PetscMalloc1(mb,&bptr);CHKERRQ(ierr); 23311cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 23321cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 23331cbb95d3SBarry Smith 23341cbb95d3SBarry Smith *f = PETSC_TRUE; 23351cbb95d3SBarry Smith for (i=0; i<ma; i++) { 23361cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 23371cbb95d3SBarry Smith PetscInt idc,idr; 23381cbb95d3SBarry Smith PetscScalar vc,vr; 23391cbb95d3SBarry Smith /* column/row index/value */ 23401cbb95d3SBarry Smith idc = adx[aptr[i]]; 23411cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 23421cbb95d3SBarry Smith vc = va[aptr[i]]; 23431cbb95d3SBarry Smith vr = vb[bptr[idc]]; 23441cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) > tol) { 23451cbb95d3SBarry Smith *f = PETSC_FALSE; 23461cbb95d3SBarry Smith goto done; 23471cbb95d3SBarry Smith } else { 23481cbb95d3SBarry Smith aptr[i]++; 23491cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 23501cbb95d3SBarry Smith } 23511cbb95d3SBarry Smith } 23521cbb95d3SBarry Smith } 23531cbb95d3SBarry Smith done: 23541cbb95d3SBarry Smith ierr = PetscFree(aptr);CHKERRQ(ierr); 23551cbb95d3SBarry Smith ierr = PetscFree(bptr);CHKERRQ(ierr); 23561cbb95d3SBarry Smith PetscFunctionReturn(0); 23571cbb95d3SBarry Smith } 23581cbb95d3SBarry Smith 2359ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 23609e29f15eSvictorle { 2361dfbe8321SBarry Smith PetscErrorCode ierr; 23626e111a19SKarl Rupp 23639e29f15eSvictorle PetscFunctionBegin; 23645485867bSBarry Smith ierr = MatIsTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 23659e29f15eSvictorle PetscFunctionReturn(0); 23669e29f15eSvictorle } 23679e29f15eSvictorle 2368ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 23691cbb95d3SBarry Smith { 23701cbb95d3SBarry Smith PetscErrorCode ierr; 23716e111a19SKarl Rupp 23721cbb95d3SBarry Smith PetscFunctionBegin; 
23731cbb95d3SBarry Smith ierr = MatIsHermitianTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 23741cbb95d3SBarry Smith PetscFunctionReturn(0); 23751cbb95d3SBarry Smith } 23761cbb95d3SBarry Smith 2377dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 237817ab2063SBarry Smith { 2379416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2380fff8e43fSBarry Smith const PetscScalar *l,*r; 2381fff8e43fSBarry Smith PetscScalar x; 238254f21887SBarry Smith MatScalar *v; 2383dfbe8321SBarry Smith PetscErrorCode ierr; 2384fff8e43fSBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz; 2385fff8e43fSBarry Smith const PetscInt *jj; 238617ab2063SBarry Smith 23873a40ed3dSBarry Smith PetscFunctionBegin; 238817ab2063SBarry Smith if (ll) { 23893ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 23903ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 2391e1311b90SBarry Smith ierr = VecGetLocalSize(ll,&m);CHKERRQ(ierr); 2392e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 2393fff8e43fSBarry Smith ierr = VecGetArrayRead(ll,&l);CHKERRQ(ierr); 2394416022c9SBarry Smith v = a->a; 239517ab2063SBarry Smith for (i=0; i<m; i++) { 239617ab2063SBarry Smith x = l[i]; 2397416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 23982205254eSKarl Rupp for (j=0; j<M; j++) (*v++) *= x; 239917ab2063SBarry Smith } 2400fff8e43fSBarry Smith ierr = VecRestoreArrayRead(ll,&l);CHKERRQ(ierr); 2401efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 240217ab2063SBarry Smith } 240317ab2063SBarry Smith if (rr) { 2404e1311b90SBarry Smith ierr = VecGetLocalSize(rr,&n);CHKERRQ(ierr); 2405e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 2406fff8e43fSBarry Smith ierr = VecGetArrayRead(rr,&r);CHKERRQ(ierr); 2407416022c9SBarry Smith v = a->a; jj = a->j; 24082205254eSKarl Rupp for (i=0; i<nz; i++) 
(*v++) *= r[*jj++]; 2409fff8e43fSBarry Smith ierr = VecRestoreArrayRead(rr,&r);CHKERRQ(ierr); 2410efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 241117ab2063SBarry Smith } 2412acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 2413e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2414c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU; 2415e2cf4d64SStefano Zampini #endif 24163a40ed3dSBarry Smith PetscFunctionReturn(0); 241717ab2063SBarry Smith } 241817ab2063SBarry Smith 24197dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 242017ab2063SBarry Smith { 2421db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 24226849ba73SBarry Smith PetscErrorCode ierr; 2423d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 242497f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 24255d0c19d7SBarry Smith const PetscInt *irow,*icol; 24265d0c19d7SBarry Smith PetscInt nrows,ncols; 242797f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 242854f21887SBarry Smith MatScalar *a_new,*mat_a; 2429416022c9SBarry Smith Mat C; 2430cdc6f3adSToby Isaac PetscBool stride; 243117ab2063SBarry Smith 24323a40ed3dSBarry Smith PetscFunctionBegin; 243399141d43SSatish Balay 243417ab2063SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 2435b9b97703SBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2436b9b97703SBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 243717ab2063SBarry Smith 2438251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&stride);CHKERRQ(ierr); 2439ff718158SBarry Smith if (stride) { 2440ff718158SBarry Smith ierr = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr); 2441ff718158SBarry Smith } else { 
2442ff718158SBarry Smith first = 0; 2443ff718158SBarry Smith step = 0; 2444ff718158SBarry Smith } 2445fee21e36SBarry Smith if (stride && step == 1) { 244602834360SBarry Smith /* special case of contiguous rows */ 2447dcca6d9dSJed Brown ierr = PetscMalloc2(nrows,&lens,nrows,&starts);CHKERRQ(ierr); 244802834360SBarry Smith /* loop over new rows determining lens and starting points */ 244902834360SBarry Smith for (i=0; i<nrows; i++) { 2450bfeeae90SHong Zhang kstart = ai[irow[i]]; 2451a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2452a91a9bebSLisandro Dalcin starts[i] = kstart; 245302834360SBarry Smith for (k=kstart; k<kend; k++) { 2454bfeeae90SHong Zhang if (aj[k] >= first) { 245502834360SBarry Smith starts[i] = k; 245602834360SBarry Smith break; 245702834360SBarry Smith } 245802834360SBarry Smith } 2459a2744918SBarry Smith sum = 0; 246002834360SBarry Smith while (k < kend) { 2461bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2462a2744918SBarry Smith sum++; 246302834360SBarry Smith } 2464a2744918SBarry Smith lens[i] = sum; 246502834360SBarry Smith } 246602834360SBarry Smith /* create submatrix */ 2467cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 246897f1f81fSBarry Smith PetscInt n_cols,n_rows; 246908480c60SBarry Smith ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 2470e32f2f54SBarry Smith if (n_rows != nrows || n_cols != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 2471d8ced48eSBarry Smith ierr = MatZeroEntries(*B);CHKERRQ(ierr); 247208480c60SBarry Smith C = *B; 24733a40ed3dSBarry Smith } else { 24743bef6203SJed Brown PetscInt rbs,cbs; 2475ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2476f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 24773bef6203SJed Brown ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr); 24783bef6203SJed Brown ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr); 24793bef6203SJed Brown ierr 
= MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr); 24807adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2481ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 248208480c60SBarry Smith } 2483db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2484db02288aSLois Curfman McInnes 248502834360SBarry Smith /* loop over rows inserting into submatrix */ 2486db02288aSLois Curfman McInnes a_new = c->a; 2487db02288aSLois Curfman McInnes j_new = c->j; 2488db02288aSLois Curfman McInnes i_new = c->i; 2489bfeeae90SHong Zhang 249002834360SBarry Smith for (i=0; i<nrows; i++) { 2491a2744918SBarry Smith ii = starts[i]; 2492a2744918SBarry Smith lensi = lens[i]; 2493a2744918SBarry Smith for (k=0; k<lensi; k++) { 2494a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 249502834360SBarry Smith } 2496580bdb30SBarry Smith ierr = PetscArraycpy(a_new,a->a + starts[i],lensi);CHKERRQ(ierr); 2497a2744918SBarry Smith a_new += lensi; 2498a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2499a2744918SBarry Smith c->ilen[i] = lensi; 250002834360SBarry Smith } 25010e83c824SBarry Smith ierr = PetscFree2(lens,starts);CHKERRQ(ierr); 25023a40ed3dSBarry Smith } else { 250302834360SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 25041795a4d1SJed Brown ierr = PetscCalloc1(oldcols,&smap);CHKERRQ(ierr); 2505854ce69bSBarry Smith ierr = PetscMalloc1(1+nrows,&lens);CHKERRQ(ierr); 25064dcab191SBarry Smith for (i=0; i<ncols; i++) { 2507d9ef940eSSatish Balay if (PetscUnlikelyDebug(icol[i] >= oldcols)) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%D] %D >= A->cmap->n %D",i,icol[i],oldcols); 25084dcab191SBarry Smith smap[icol[i]] = i+1; 25094dcab191SBarry Smith } 25104dcab191SBarry Smith 251102834360SBarry Smith /* determine lens of each row */ 251202834360SBarry Smith for (i=0; i<nrows; i++) { 2513bfeeae90SHong Zhang kstart = ai[irow[i]]; 251402834360SBarry Smith kend = kstart + 
a->ilen[irow[i]]; 251502834360SBarry Smith lens[i] = 0; 251602834360SBarry Smith for (k=kstart; k<kend; k++) { 2517bfeeae90SHong Zhang if (smap[aj[k]]) { 251802834360SBarry Smith lens[i]++; 251902834360SBarry Smith } 252002834360SBarry Smith } 252102834360SBarry Smith } 252217ab2063SBarry Smith /* Create and fill new matrix */ 2523a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2524ace3abfcSBarry Smith PetscBool equal; 25250f5bd95cSBarry Smith 252699141d43SSatish Balay c = (Mat_SeqAIJ*)((*B)->data); 2527e32f2f54SBarry Smith if ((*B)->rmap->n != nrows || (*B)->cmap->n != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 2528580bdb30SBarry Smith ierr = PetscArraycmp(c->ilen,lens,(*B)->rmap->n,&equal);CHKERRQ(ierr); 2529f23aa3ddSBarry Smith if (!equal) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 2530580bdb30SBarry Smith ierr = PetscArrayzero(c->ilen,(*B)->rmap->n);CHKERRQ(ierr); 253108480c60SBarry Smith C = *B; 25323a40ed3dSBarry Smith } else { 25333bef6203SJed Brown PetscInt rbs,cbs; 2534ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2535f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 25363bef6203SJed Brown ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr); 25373bef6203SJed Brown ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr); 25383bef6203SJed Brown ierr = MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr); 25397adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2540ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 254108480c60SBarry Smith } 254299141d43SSatish Balay c = (Mat_SeqAIJ*)(C->data); 254317ab2063SBarry Smith for (i=0; i<nrows; i++) { 254499141d43SSatish Balay row = irow[i]; 2545bfeeae90SHong Zhang kstart = ai[row]; 254699141d43SSatish Balay kend = kstart + a->ilen[row]; 2547bfeeae90SHong Zhang mat_i = c->i[i]; 
254899141d43SSatish Balay mat_j = c->j + mat_i; 254999141d43SSatish Balay mat_a = c->a + mat_i; 255099141d43SSatish Balay mat_ilen = c->ilen + i; 255117ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2552bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2553ed480e8bSBarry Smith *mat_j++ = tcol - 1; 255499141d43SSatish Balay *mat_a++ = a->a[k]; 255599141d43SSatish Balay (*mat_ilen)++; 255699141d43SSatish Balay 255717ab2063SBarry Smith } 255817ab2063SBarry Smith } 255917ab2063SBarry Smith } 256002834360SBarry Smith /* Free work space */ 256102834360SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2562606d414cSSatish Balay ierr = PetscFree(smap);CHKERRQ(ierr); 2563606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 2564cdc6f3adSToby Isaac /* sort */ 2565cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2566cdc6f3adSToby Isaac PetscInt ilen; 2567cdc6f3adSToby Isaac 2568cdc6f3adSToby Isaac mat_i = c->i[i]; 2569cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2570cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2571cdc6f3adSToby Isaac ilen = c->ilen[i]; 2572390e1bf2SBarry Smith ierr = PetscSortIntWithScalarArray(ilen,mat_j,mat_a);CHKERRQ(ierr); 2573cdc6f3adSToby Isaac } 257402834360SBarry Smith } 2575305c6ccfSStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2576b470e4b4SRichard Tran Mills ierr = MatBindToCPU(C,A->boundtocpu);CHKERRQ(ierr); 2577305c6ccfSStefano Zampini #endif 25786d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 25796d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 258017ab2063SBarry Smith 258117ab2063SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 2582416022c9SBarry Smith *B = C; 25833a40ed3dSBarry Smith PetscFunctionReturn(0); 258417ab2063SBarry Smith } 258517ab2063SBarry Smith 2586fc08c53fSHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat *subMat) 258782d44351SHong Zhang { 258882d44351SHong 
Zhang PetscErrorCode ierr; 258982d44351SHong Zhang Mat B; 259082d44351SHong Zhang 259182d44351SHong Zhang PetscFunctionBegin; 2592c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 259382d44351SHong Zhang ierr = MatCreate(subComm,&B);CHKERRQ(ierr); 259482d44351SHong Zhang ierr = MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n);CHKERRQ(ierr); 259533d57670SJed Brown ierr = MatSetBlockSizesFromMats(B,mat,mat);CHKERRQ(ierr); 259682d44351SHong Zhang ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 259782d44351SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE);CHKERRQ(ierr); 259882d44351SHong Zhang *subMat = B; 2599c2d650bdSHong Zhang } else { 2600c2d650bdSHong Zhang ierr = MatCopy_SeqAIJ(mat,*subMat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 2601c2d650bdSHong Zhang } 260282d44351SHong Zhang PetscFunctionReturn(0); 260382d44351SHong Zhang } 260482d44351SHong Zhang 26059a625307SHong Zhang PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2606a871dcd8SBarry Smith { 260763b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2608dfbe8321SBarry Smith PetscErrorCode ierr; 260963b91edcSBarry Smith Mat outA; 2610ace3abfcSBarry Smith PetscBool row_identity,col_identity; 261163b91edcSBarry Smith 26123a40ed3dSBarry Smith PetscFunctionBegin; 2613e32f2f54SBarry Smith if (info->levels != 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 26141df811f5SHong Zhang 2615b8a78c4aSBarry Smith ierr = ISIdentity(row,&row_identity);CHKERRQ(ierr); 2616b8a78c4aSBarry Smith ierr = ISIdentity(col,&col_identity);CHKERRQ(ierr); 2617a871dcd8SBarry Smith 261863b91edcSBarry Smith outA = inA; 2619d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 2620f6224b95SHong Zhang ierr = PetscFree(inA->solvertype);CHKERRQ(ierr); 2621f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype);CHKERRQ(ierr); 26222205254eSKarl Rupp 2623c38d4ed2SBarry Smith ierr = 
PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 26246bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 26252205254eSKarl Rupp 2626c3122656SLisandro Dalcin a->row = row; 26272205254eSKarl Rupp 2628c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)col);CHKERRQ(ierr); 26296bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 26302205254eSKarl Rupp 2631c3122656SLisandro Dalcin a->col = col; 263263b91edcSBarry Smith 263336db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26346bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 26354c49b128SBarry Smith ierr = ISInvertPermutation(col,PETSC_DECIDE,&a->icol);CHKERRQ(ierr); 26363bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol);CHKERRQ(ierr); 2637f0ec6fceSSatish Balay 263894a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 2639854ce69bSBarry Smith ierr = PetscMalloc1(inA->rmap->n+1,&a->solve_work);CHKERRQ(ierr); 26403bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)inA, (inA->rmap->n+1)*sizeof(PetscScalar));CHKERRQ(ierr); 264194a9d846SBarry Smith } 264263b91edcSBarry Smith 2643f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(inA);CHKERRQ(ierr); 2644137fb511SHong Zhang if (row_identity && col_identity) { 2645ad04f41aSHong Zhang ierr = MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info);CHKERRQ(ierr); 2646137fb511SHong Zhang } else { 2647719d5645SBarry Smith ierr = MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info);CHKERRQ(ierr); 2648137fb511SHong Zhang } 26493a40ed3dSBarry Smith PetscFunctionReturn(0); 2650a871dcd8SBarry Smith } 2651a871dcd8SBarry Smith 2652f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2653f0b747eeSBarry Smith { 2654f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2655f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 2656efee365bSSatish Balay PetscErrorCode ierr; 
2657c5df96a5SBarry Smith PetscBLASInt one = 1,bnz; 26583a40ed3dSBarry Smith 26593a40ed3dSBarry Smith PetscFunctionBegin; 2660c5df96a5SBarry Smith ierr = PetscBLASIntCast(a->nz,&bnz);CHKERRQ(ierr); 26618b83055fSJed Brown PetscStackCallBLAS("BLASscal",BLASscal_(&bnz,&oalpha,a->a,&one)); 2662efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 2663acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(inA);CHKERRQ(ierr); 2664e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2665c70f7ee4SJunchao Zhang if (inA->offloadmask != PETSC_OFFLOAD_UNALLOCATED) inA->offloadmask = PETSC_OFFLOAD_CPU; 2666e2cf4d64SStefano Zampini #endif 26673a40ed3dSBarry Smith PetscFunctionReturn(0); 2668f0b747eeSBarry Smith } 2669f0b747eeSBarry Smith 2670f68bb481SHong Zhang PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 267116b64355SHong Zhang { 267216b64355SHong Zhang PetscErrorCode ierr; 267316b64355SHong Zhang PetscInt i; 267416b64355SHong Zhang 267516b64355SHong Zhang PetscFunctionBegin; 267616b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 267716b64355SHong Zhang ierr = PetscFree4(submatj->sbuf1,submatj->ptr,submatj->tmp,submatj->ctr);CHKERRQ(ierr); 267816b64355SHong Zhang 267916b64355SHong Zhang for (i=0; i<submatj->nrqr; ++i) { 268016b64355SHong Zhang ierr = PetscFree(submatj->sbuf2[i]);CHKERRQ(ierr); 268116b64355SHong Zhang } 268216b64355SHong Zhang ierr = PetscFree3(submatj->sbuf2,submatj->req_size,submatj->req_source1);CHKERRQ(ierr); 268316b64355SHong Zhang 268416b64355SHong Zhang if (submatj->rbuf1) { 268516b64355SHong Zhang ierr = PetscFree(submatj->rbuf1[0]);CHKERRQ(ierr); 268616b64355SHong Zhang ierr = PetscFree(submatj->rbuf1);CHKERRQ(ierr); 268716b64355SHong Zhang } 268816b64355SHong Zhang 268916b64355SHong Zhang for (i=0; i<submatj->nrqs; ++i) { 269016b64355SHong Zhang ierr = PetscFree(submatj->rbuf3[i]);CHKERRQ(ierr); 269116b64355SHong Zhang } 269216b64355SHong Zhang 
ierr = PetscFree3(submatj->req_source2,submatj->rbuf2,submatj->rbuf3);CHKERRQ(ierr); 269316b64355SHong Zhang ierr = PetscFree(submatj->pa);CHKERRQ(ierr); 269416b64355SHong Zhang } 269516b64355SHong Zhang 269616b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 269716b64355SHong Zhang ierr = PetscTableDestroy((PetscTable*)&submatj->rmap);CHKERRQ(ierr); 269816b64355SHong Zhang if (submatj->cmap_loc) {ierr = PetscFree(submatj->cmap_loc);CHKERRQ(ierr);} 269916b64355SHong Zhang ierr = PetscFree(submatj->rmap_loc);CHKERRQ(ierr); 270016b64355SHong Zhang #else 270116b64355SHong Zhang ierr = PetscFree(submatj->rmap);CHKERRQ(ierr); 270216b64355SHong Zhang #endif 270316b64355SHong Zhang 270416b64355SHong Zhang if (!submatj->allcolumns) { 270516b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 270616b64355SHong Zhang ierr = PetscTableDestroy((PetscTable*)&submatj->cmap);CHKERRQ(ierr); 270716b64355SHong Zhang #else 270816b64355SHong Zhang ierr = PetscFree(submatj->cmap);CHKERRQ(ierr); 270916b64355SHong Zhang #endif 271016b64355SHong Zhang } 271116b64355SHong Zhang ierr = PetscFree(submatj->row2proc);CHKERRQ(ierr); 271216b64355SHong Zhang 271316b64355SHong Zhang ierr = PetscFree(submatj);CHKERRQ(ierr); 271416b64355SHong Zhang PetscFunctionReturn(0); 271516b64355SHong Zhang } 271616b64355SHong Zhang 27170fb991dcSHong Zhang PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 271816b64355SHong Zhang { 271916b64355SHong Zhang PetscErrorCode ierr; 272016b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data; 27215c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 272216b64355SHong Zhang 272316b64355SHong Zhang PetscFunctionBegin; 272434136279SStefano Zampini ierr = (*submatj->destroy)(C);CHKERRQ(ierr); 2725f68bb481SHong Zhang ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr); 272616b64355SHong Zhang PetscFunctionReturn(0); 272716b64355SHong Zhang } 272816b64355SHong Zhang 27292d033e1fSHong Zhang PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat *mat[]) 27302d033e1fSHong 
Zhang { 27312d033e1fSHong Zhang PetscErrorCode ierr; 27322d033e1fSHong Zhang PetscInt i; 27330fb991dcSHong Zhang Mat C; 27340fb991dcSHong Zhang Mat_SeqAIJ *c; 27350fb991dcSHong Zhang Mat_SubSppt *submatj; 27362d033e1fSHong Zhang 27372d033e1fSHong Zhang PetscFunctionBegin; 27382d033e1fSHong Zhang for (i=0; i<n; i++) { 27390fb991dcSHong Zhang C = (*mat)[i]; 27400fb991dcSHong Zhang c = (Mat_SeqAIJ*)C->data; 27410fb991dcSHong Zhang submatj = c->submatis1; 27422d033e1fSHong Zhang if (submatj) { 2743682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 274434136279SStefano Zampini ierr = (*submatj->destroy)(C);CHKERRQ(ierr); 2745f68bb481SHong Zhang ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr); 274634136279SStefano Zampini ierr = PetscFree(C->defaultvectype);CHKERRQ(ierr); 27472d033e1fSHong Zhang ierr = PetscLayoutDestroy(&C->rmap);CHKERRQ(ierr); 27482d033e1fSHong Zhang ierr = PetscLayoutDestroy(&C->cmap);CHKERRQ(ierr); 27492d033e1fSHong Zhang ierr = PetscHeaderDestroy(&C);CHKERRQ(ierr); 2750682e4c99SStefano Zampini } 27512d033e1fSHong Zhang } else { 27522d033e1fSHong Zhang ierr = MatDestroy(&C);CHKERRQ(ierr); 27532d033e1fSHong Zhang } 27542d033e1fSHong Zhang } 275586e85357SHong Zhang 275663a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 275763a75b2aSHong Zhang ierr = MatDestroySubMatrices_Dummy(n,mat);CHKERRQ(ierr); 275863a75b2aSHong Zhang 27592d033e1fSHong Zhang ierr = PetscFree(*mat);CHKERRQ(ierr); 27602d033e1fSHong Zhang PetscFunctionReturn(0); 27612d033e1fSHong Zhang } 27622d033e1fSHong Zhang 27637dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2764cddf8d76SBarry Smith { 2765dfbe8321SBarry Smith PetscErrorCode ierr; 276697f1f81fSBarry Smith PetscInt i; 2767cddf8d76SBarry Smith 27683a40ed3dSBarry Smith PetscFunctionBegin; 2769cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2770df750dc8SHong Zhang ierr = 
PetscCalloc1(n+1,B);CHKERRQ(ierr); 2771cddf8d76SBarry Smith } 2772cddf8d76SBarry Smith 2773cddf8d76SBarry Smith for (i=0; i<n; i++) { 27747dae84e0SHong Zhang ierr = MatCreateSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2775cddf8d76SBarry Smith } 27763a40ed3dSBarry Smith PetscFunctionReturn(0); 2777cddf8d76SBarry Smith } 2778cddf8d76SBarry Smith 277997f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 27804dcbc457SBarry Smith { 2781e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 27826849ba73SBarry Smith PetscErrorCode ierr; 27835d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 27845d0c19d7SBarry Smith const PetscInt *idx; 278597f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2786f1af5d2fSBarry Smith PetscBT table; 2787bbd702dbSSatish Balay 27883a40ed3dSBarry Smith PetscFunctionBegin; 2789d0f46423SBarry Smith m = A->rmap->n; 2790e4d965acSSatish Balay ai = a->i; 2791bfeeae90SHong Zhang aj = a->j; 27928a047759SSatish Balay 2793e32f2f54SBarry Smith if (ov < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 279406763907SSatish Balay 2795854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&nidx);CHKERRQ(ierr); 279653b8de81SBarry Smith ierr = PetscBTCreate(m,&table);CHKERRQ(ierr); 279706763907SSatish Balay 2798e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2799b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2800e4d965acSSatish Balay isz = 0; 28016831982aSBarry Smith ierr = PetscBTMemzero(m,table);CHKERRQ(ierr); 2802e4d965acSSatish Balay 2803e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28044dcbc457SBarry Smith ierr = ISGetIndices(is[i],&idx);CHKERRQ(ierr); 2805b9b97703SBarry Smith ierr = ISGetLocalSize(is[i],&n);CHKERRQ(ierr); 2806e4d965acSSatish Balay 2807dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2808e4d965acSSatish Balay for (j=0; j<n; ++j) { 28092205254eSKarl Rupp if (!PetscBTLookupSet(table,idx[j])) nidx[isz++] = idx[j]; 28104dcbc457SBarry Smith } 281106763907SSatish Balay ierr = ISRestoreIndices(is[i],&idx);CHKERRQ(ierr); 28126bf464f9SBarry Smith ierr = ISDestroy(&is[i]);CHKERRQ(ierr); 2813e4d965acSSatish Balay 281404a348a9SBarry Smith k = 0; 281504a348a9SBarry Smith for (j=0; j<ov; j++) { /* for each overlap */ 281604a348a9SBarry Smith n = isz; 281706763907SSatish Balay for (; k<n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2818e4d965acSSatish Balay row = nidx[k]; 2819e4d965acSSatish Balay start = ai[row]; 2820e4d965acSSatish Balay end = ai[row+1]; 282104a348a9SBarry Smith for (l = start; l<end; l++) { 2822efb16452SHong Zhang val = aj[l]; 28232205254eSKarl Rupp if (!PetscBTLookupSet(table,val)) nidx[isz++] = val; 2824e4d965acSSatish Balay } 2825e4d965acSSatish Balay } 2826e4d965acSSatish Balay } 282770b3c8c7SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i));CHKERRQ(ierr); 2828e4d965acSSatish Balay } 282994bacf5dSBarry Smith ierr = PetscBTDestroy(&table);CHKERRQ(ierr); 2830606d414cSSatish Balay ierr = PetscFree(nidx);CHKERRQ(ierr); 28313a40ed3dSBarry Smith PetscFunctionReturn(0); 28324dcbc457SBarry Smith } 283317ab2063SBarry Smith 28340513a670SBarry Smith /* -------------------------------------------------------------- */ 2835dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 28360513a670SBarry Smith { 28370513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 28386849ba73SBarry Smith PetscErrorCode ierr; 28393b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 28405d0c19d7SBarry Smith const PetscInt *row,*col; 28415d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 284256cd22aeSBarry Smith IS icolp,irowp; 28430298fd71SBarry Smith PetscInt *cwork = NULL; 28440298fd71SBarry Smith PetscScalar *vwork 
= NULL; 28450513a670SBarry Smith 28463a40ed3dSBarry Smith PetscFunctionBegin; 28474c49b128SBarry Smith ierr = ISInvertPermutation(rowp,PETSC_DECIDE,&irowp);CHKERRQ(ierr); 284856cd22aeSBarry Smith ierr = ISGetIndices(irowp,&row);CHKERRQ(ierr); 28494c49b128SBarry Smith ierr = ISInvertPermutation(colp,PETSC_DECIDE,&icolp);CHKERRQ(ierr); 285056cd22aeSBarry Smith ierr = ISGetIndices(icolp,&col);CHKERRQ(ierr); 28510513a670SBarry Smith 28520513a670SBarry Smith /* determine lengths of permuted rows */ 2853854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&lens);CHKERRQ(ierr); 28542205254eSKarl Rupp for (i=0; i<m; i++) lens[row[i]] = a->i[i+1] - a->i[i]; 2855ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 2856f69a0ea3SMatthew Knepley ierr = MatSetSizes(*B,m,n,m,n);CHKERRQ(ierr); 285733d57670SJed Brown ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr); 28587adad957SLisandro Dalcin ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2859ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens);CHKERRQ(ierr); 2860606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 28610513a670SBarry Smith 2862785e854fSJed Brown ierr = PetscMalloc1(n,&cnew);CHKERRQ(ierr); 28630513a670SBarry Smith for (i=0; i<m; i++) { 286432ec9ce4SBarry Smith ierr = MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 28652205254eSKarl Rupp for (j=0; j<nz; j++) cnew[j] = col[cwork[j]]; 2866cdc0ba36SBarry Smith ierr = MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES);CHKERRQ(ierr); 286732ec9ce4SBarry Smith ierr = MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 28680513a670SBarry Smith } 2869606d414cSSatish Balay ierr = PetscFree(cnew);CHKERRQ(ierr); 28702205254eSKarl Rupp 28713c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 28722205254eSKarl Rupp 28739fe5e383SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2874b470e4b4SRichard Tran Mills ierr = 
MatBindToCPU(*B,A->boundtocpu);CHKERRQ(ierr); 28759fe5e383SStefano Zampini #endif 28760513a670SBarry Smith ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 28770513a670SBarry Smith ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 287856cd22aeSBarry Smith ierr = ISRestoreIndices(irowp,&row);CHKERRQ(ierr); 287956cd22aeSBarry Smith ierr = ISRestoreIndices(icolp,&col);CHKERRQ(ierr); 28806bf464f9SBarry Smith ierr = ISDestroy(&irowp);CHKERRQ(ierr); 28816bf464f9SBarry Smith ierr = ISDestroy(&icolp);CHKERRQ(ierr); 28826768869dSprj- if (rowp == colp) { 28836768869dSprj- if (A->symmetric) { 28846768869dSprj- ierr = MatSetOption(*B,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr); 28856768869dSprj- } 28866768869dSprj- if (A->hermitian) { 28876768869dSprj- ierr = MatSetOption(*B,MAT_HERMITIAN,PETSC_TRUE);CHKERRQ(ierr); 28886768869dSprj- } 28896768869dSprj- } 28903a40ed3dSBarry Smith PetscFunctionReturn(0); 28910513a670SBarry Smith } 28920513a670SBarry Smith 2893dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 2894cb5b572fSBarry Smith { 2895dfbe8321SBarry Smith PetscErrorCode ierr; 2896cb5b572fSBarry Smith 2897cb5b572fSBarry Smith PetscFunctionBegin; 289833f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 289933f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2900be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2901be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 2902be6bf707SBarry Smith 29034d805d7cSStefano Zampini if (a->i[A->rmap->n] != b->i[B->rmap->n]) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different %D != %D",a->i[A->rmap->n],b->i[B->rmap->n]); 2904580bdb30SBarry Smith ierr = PetscArraycpy(b->a,a->a,a->i[A->rmap->n]);CHKERRQ(ierr); 2905cdc753b6SBarry Smith ierr = PetscObjectStateIncrease((PetscObject)B);CHKERRQ(ierr); 2906cb5b572fSBarry Smith } else { 2907cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 2908cb5b572fSBarry Smith } 2909cb5b572fSBarry Smith PetscFunctionReturn(0); 2910cb5b572fSBarry Smith } 2911cb5b572fSBarry Smith 29124994cf47SJed Brown PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2913273d9f13SBarry Smith { 2914dfbe8321SBarry Smith PetscErrorCode ierr; 2915273d9f13SBarry Smith 2916273d9f13SBarry Smith PetscFunctionBegin; 2917ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,0);CHKERRQ(ierr); 2918273d9f13SBarry Smith PetscFunctionReturn(0); 2919273d9f13SBarry Smith } 2920273d9f13SBarry Smith 2921f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 29226c0721eeSBarry Smith { 29236c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29246e111a19SKarl Rupp 29256c0721eeSBarry Smith PetscFunctionBegin; 29266c0721eeSBarry Smith *array = a->a; 29276c0721eeSBarry Smith PetscFunctionReturn(0); 29286c0721eeSBarry Smith } 29296c0721eeSBarry Smith 2930f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 29316c0721eeSBarry Smith { 29326c0721eeSBarry Smith PetscFunctionBegin; 2933f38c1e66SStefano Zampini *array = NULL; 29346c0721eeSBarry Smith PetscFunctionReturn(0); 29356c0721eeSBarry Smith } 
2936273d9f13SBarry Smith 29378229c054SShri Abhyankar /* 29388229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29398229c054SShri Abhyankar have different nonzero structure. 29408229c054SShri Abhyankar */ 2941b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt *xi,const PetscInt *xj,const PetscInt *yi,const PetscInt *yj,PetscInt *nnz) 2942ec7775f6SShri Abhyankar { 2943b264fe52SHong Zhang PetscInt i,j,k,nzx,nzy; 2944ec7775f6SShri Abhyankar 2945ec7775f6SShri Abhyankar PetscFunctionBegin; 2946ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2947ec7775f6SShri Abhyankar for (i=0; i<m; i++) { 2948b264fe52SHong Zhang const PetscInt *xjj = xj+xi[i],*yjj = yj+yi[i]; 2949b264fe52SHong Zhang nzx = xi[i+1] - xi[i]; 2950b264fe52SHong Zhang nzy = yi[i+1] - yi[i]; 29518af7cee1SJed Brown nnz[i] = 0; 29528af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 2953b264fe52SHong Zhang for (; k<nzy && yjj[k]<xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2954b264fe52SHong Zhang if (k<nzy && yjj[k]==xjj[j]) k++; /* Skip duplicate */ 29558af7cee1SJed Brown nnz[i]++; 29568af7cee1SJed Brown } 29578af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 2958ec7775f6SShri Abhyankar } 2959ec7775f6SShri Abhyankar PetscFunctionReturn(0); 2960ec7775f6SShri Abhyankar } 2961ec7775f6SShri Abhyankar 2962b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt *nnz) 2963b264fe52SHong Zhang { 2964b264fe52SHong Zhang PetscInt m = Y->rmap->N; 2965b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 2966b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 2967b264fe52SHong Zhang PetscErrorCode ierr; 2968b264fe52SHong Zhang 2969b264fe52SHong Zhang PetscFunctionBegin; 2970b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 2971b264fe52SHong Zhang ierr = MatAXPYGetPreallocation_SeqX_private(m,x->i,x->j,y->i,y->j,nnz);CHKERRQ(ierr); 
2972b264fe52SHong Zhang PetscFunctionReturn(0); 2973b264fe52SHong Zhang } 2974b264fe52SHong Zhang 2975f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 2976ac90fabeSBarry Smith { 2977dfbe8321SBarry Smith PetscErrorCode ierr; 2978ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data,*y = (Mat_SeqAIJ*)Y->data; 2979c5df96a5SBarry Smith PetscBLASInt one=1,bnz; 2980ac90fabeSBarry Smith 2981ac90fabeSBarry Smith PetscFunctionBegin; 2982c5df96a5SBarry Smith ierr = PetscBLASIntCast(x->nz,&bnz);CHKERRQ(ierr); 2983ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 2984f4df32b1SMatthew Knepley PetscScalar alpha = a; 29858b83055fSJed Brown PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,x->a,&one,y->a,&one)); 2986acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr); 2987a3fa217bSJose E. Roman ierr = PetscObjectStateIncrease((PetscObject)Y);CHKERRQ(ierr); 2988e2cf4d64SStefano Zampini /* the MatAXPY_Basic* subroutines calls MatAssembly, so the matrix on the GPU 2989e2cf4d64SStefano Zampini will be updated */ 2990e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2991c70f7ee4SJunchao Zhang if (Y->offloadmask != PETSC_OFFLOAD_UNALLOCATED) { 2992c70f7ee4SJunchao Zhang Y->offloadmask = PETSC_OFFLOAD_CPU; 2993e2cf4d64SStefano Zampini } 2994e2cf4d64SStefano Zampini #endif 2995ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 2996ab784542SHong Zhang ierr = MatAXPY_Basic(Y,a,X,str);CHKERRQ(ierr); 2997ac90fabeSBarry Smith } else { 29988229c054SShri Abhyankar Mat B; 29998229c054SShri Abhyankar PetscInt *nnz; 3000785e854fSJed Brown ierr = PetscMalloc1(Y->rmap->N,&nnz);CHKERRQ(ierr); 3001ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)Y),&B);CHKERRQ(ierr); 3002bc5a2726SShri Abhyankar ierr = PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name);CHKERRQ(ierr); 30034aa94f47SShri Abhyankar ierr = 
MatSetSizes(B,Y->rmap->n,Y->cmap->n,Y->rmap->N,Y->cmap->N);CHKERRQ(ierr); 300433d57670SJed Brown ierr = MatSetBlockSizesFromMats(B,Y,Y);CHKERRQ(ierr); 3005176df525SBarry Smith ierr = MatSetType(B,(MatType) ((PetscObject)Y)->type_name);CHKERRQ(ierr); 30068229c054SShri Abhyankar ierr = MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz);CHKERRQ(ierr); 3007ecd8bba6SJed Brown ierr = MatSeqAIJSetPreallocation(B,0,nnz);CHKERRQ(ierr); 3008ec7775f6SShri Abhyankar ierr = MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr); 300928be2f97SBarry Smith ierr = MatHeaderReplace(Y,&B);CHKERRQ(ierr); 30108229c054SShri Abhyankar ierr = PetscFree(nnz);CHKERRQ(ierr); 3011ac90fabeSBarry Smith } 3012ac90fabeSBarry Smith PetscFunctionReturn(0); 3013ac90fabeSBarry Smith } 3014ac90fabeSBarry Smith 30157087cfbeSBarry Smith PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3016354c94deSBarry Smith { 3017354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3018354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3019354c94deSBarry Smith PetscInt i,nz; 3020354c94deSBarry Smith PetscScalar *a; 3021354c94deSBarry Smith 3022354c94deSBarry Smith PetscFunctionBegin; 3023354c94deSBarry Smith nz = aij->nz; 3024354c94deSBarry Smith a = aij->a; 30252205254eSKarl Rupp for (i=0; i<nz; i++) a[i] = PetscConj(a[i]); 3026e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 3027c70f7ee4SJunchao Zhang if (mat->offloadmask != PETSC_OFFLOAD_UNALLOCATED) mat->offloadmask = PETSC_OFFLOAD_CPU; 3028e2cf4d64SStefano Zampini #endif 3029354c94deSBarry Smith #else 3030354c94deSBarry Smith PetscFunctionBegin; 3031354c94deSBarry Smith #endif 3032354c94deSBarry Smith PetscFunctionReturn(0); 3033354c94deSBarry Smith } 3034354c94deSBarry Smith 3035985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3036e34fafa9SBarry Smith { 3037e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3038e34fafa9SBarry Smith PetscErrorCode ierr; 3039d0f46423SBarry Smith 
PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3040e34fafa9SBarry Smith PetscReal atmp; 3041985db425SBarry Smith PetscScalar *x; 3042e34fafa9SBarry Smith MatScalar *aa; 3043e34fafa9SBarry Smith 3044e34fafa9SBarry Smith PetscFunctionBegin; 3045e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3046e34fafa9SBarry Smith aa = a->a; 3047e34fafa9SBarry Smith ai = a->i; 3048e34fafa9SBarry Smith aj = a->j; 3049e34fafa9SBarry Smith 3050985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3051e34fafa9SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3052e34fafa9SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3053e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3054e34fafa9SBarry Smith for (i=0; i<m; i++) { 3055e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 30569189402eSHong Zhang x[i] = 0.0; 3057e34fafa9SBarry Smith for (j=0; j<ncols; j++) { 3058985db425SBarry Smith atmp = PetscAbsScalar(*aa); 3059985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3060985db425SBarry Smith aa++; aj++; 3061985db425SBarry Smith } 3062985db425SBarry Smith } 3063985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3064985db425SBarry Smith PetscFunctionReturn(0); 3065985db425SBarry Smith } 3066985db425SBarry Smith 3067985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3068985db425SBarry Smith { 3069985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3070985db425SBarry Smith PetscErrorCode ierr; 3071d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3072985db425SBarry Smith PetscScalar *x; 3073985db425SBarry Smith MatScalar *aa; 3074985db425SBarry Smith 3075985db425SBarry Smith PetscFunctionBegin; 3076e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3077985db425SBarry Smith 
aa = a->a; 3078985db425SBarry Smith ai = a->i; 3079985db425SBarry Smith aj = a->j; 3080985db425SBarry Smith 3081985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3082985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3083985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3084e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3085985db425SBarry Smith for (i=0; i<m; i++) { 3086985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3087d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3088985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3089985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3090985db425SBarry Smith x[i] = 0.0; 3091985db425SBarry Smith if (idx) { 3092985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 3093985db425SBarry Smith for (j=0;j<ncols;j++) { /* find first implicit 0.0 in the row */ 3094985db425SBarry Smith if (aj[j] > j) { 3095985db425SBarry Smith idx[i] = j; 3096985db425SBarry Smith break; 3097985db425SBarry Smith } 3098985db425SBarry Smith } 3099985db425SBarry Smith } 3100985db425SBarry Smith } 3101985db425SBarry Smith for (j=0; j<ncols; j++) { 3102985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3103985db425SBarry Smith aa++; aj++; 3104985db425SBarry Smith } 3105985db425SBarry Smith } 3106985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3107985db425SBarry Smith PetscFunctionReturn(0); 3108985db425SBarry Smith } 3109985db425SBarry Smith 3110c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3111c87e5d42SMatthew Knepley { 3112c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3113c87e5d42SMatthew Knepley PetscErrorCode ierr; 3114c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3115c87e5d42SMatthew Knepley PetscReal atmp; 
3116c87e5d42SMatthew Knepley PetscScalar *x; 3117c87e5d42SMatthew Knepley MatScalar *aa; 3118c87e5d42SMatthew Knepley 3119c87e5d42SMatthew Knepley PetscFunctionBegin; 3120e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3121c87e5d42SMatthew Knepley aa = a->a; 3122c87e5d42SMatthew Knepley ai = a->i; 3123c87e5d42SMatthew Knepley aj = a->j; 3124c87e5d42SMatthew Knepley 3125c87e5d42SMatthew Knepley ierr = VecSet(v,0.0);CHKERRQ(ierr); 3126c87e5d42SMatthew Knepley ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3127c87e5d42SMatthew Knepley ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 312860e0710aSBarry Smith if (n != A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector, %D vs. %D rows", A->rmap->n, n); 3129c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 3130c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 3131289a08f5SMatthew Knepley if (ncols) { 3132289a08f5SMatthew Knepley /* Get first nonzero */ 3133289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3134289a08f5SMatthew Knepley atmp = PetscAbsScalar(aa[j]); 31352205254eSKarl Rupp if (atmp > 1.0e-12) { 31362205254eSKarl Rupp x[i] = atmp; 31372205254eSKarl Rupp if (idx) idx[i] = aj[j]; 31382205254eSKarl Rupp break; 31392205254eSKarl Rupp } 3140289a08f5SMatthew Knepley } 314112431cb0SMatthew G Knepley if (j == ncols) {x[i] = PetscAbsScalar(*aa); if (idx) idx[i] = *aj;} 3142289a08f5SMatthew Knepley } else { 3143289a08f5SMatthew Knepley x[i] = 0.0; if (idx) idx[i] = 0; 3144289a08f5SMatthew Knepley } 3145c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 3146c87e5d42SMatthew Knepley atmp = PetscAbsScalar(*aa); 3147289a08f5SMatthew Knepley if (atmp > 1.0e-12 && PetscAbsScalar(x[i]) > atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3148c87e5d42SMatthew Knepley aa++; aj++; 3149c87e5d42SMatthew Knepley } 3150c87e5d42SMatthew Knepley } 3151c87e5d42SMatthew Knepley ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3152c87e5d42SMatthew 
Knepley PetscFunctionReturn(0); 3153c87e5d42SMatthew Knepley } 3154c87e5d42SMatthew Knepley 3155985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3156985db425SBarry Smith { 3157985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3158985db425SBarry Smith PetscErrorCode ierr; 3159d9ca1df4SBarry Smith PetscInt i,j,m = A->rmap->n,ncols,n; 3160d9ca1df4SBarry Smith const PetscInt *ai,*aj; 3161985db425SBarry Smith PetscScalar *x; 3162d9ca1df4SBarry Smith const MatScalar *aa; 3163985db425SBarry Smith 3164985db425SBarry Smith PetscFunctionBegin; 3165e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3166985db425SBarry Smith aa = a->a; 3167985db425SBarry Smith ai = a->i; 3168985db425SBarry Smith aj = a->j; 3169985db425SBarry Smith 3170985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3171985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3172985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3173e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3174985db425SBarry Smith for (i=0; i<m; i++) { 3175985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3176d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3177985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3178985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3179985db425SBarry Smith x[i] = 0.0; 3180985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3181985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 3182985db425SBarry Smith for (j=0; j<ncols; j++) { 3183985db425SBarry Smith if (aj[j] > j) { 3184985db425SBarry Smith idx[i] = j; 3185985db425SBarry Smith break; 3186985db425SBarry Smith } 3187985db425SBarry Smith } 3188985db425SBarry Smith } 3189985db425SBarry Smith } 3190985db425SBarry Smith for (j=0; j<ncols; j++) { 3191985db425SBarry 
Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3192985db425SBarry Smith aa++; aj++; 3193e34fafa9SBarry Smith } 3194e34fafa9SBarry Smith } 3195e34fafa9SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3196e34fafa9SBarry Smith PetscFunctionReturn(0); 3197e34fafa9SBarry Smith } 3198bbead8a2SBarry Smith 3199713ccfa9SJed Brown PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar **values) 3200bbead8a2SBarry Smith { 3201bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 3202bbead8a2SBarry Smith PetscErrorCode ierr; 320333d57670SJed Brown PetscInt i,bs = PetscAbs(A->rmap->bs),mbs = A->rmap->n/bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 3204bbead8a2SBarry Smith MatScalar *diag,work[25],*v_work; 32050da83c2eSBarry Smith const PetscReal shift = 0.0; 32061a9391e3SHong Zhang PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 3207bbead8a2SBarry Smith 3208bbead8a2SBarry Smith PetscFunctionBegin; 3209a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32104a0d0026SBarry Smith if (a->ibdiagvalid) { 32114a0d0026SBarry Smith if (values) *values = a->ibdiag; 32124a0d0026SBarry Smith PetscFunctionReturn(0); 32134a0d0026SBarry Smith } 3214bbead8a2SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 3215bbead8a2SBarry Smith if (!a->ibdiag) { 3216785e854fSJed Brown ierr = PetscMalloc1(bs2*mbs,&a->ibdiag);CHKERRQ(ierr); 32173bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,bs2*mbs*sizeof(PetscScalar));CHKERRQ(ierr); 3218bbead8a2SBarry Smith } 3219bbead8a2SBarry Smith diag = a->ibdiag; 3220bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3221bbead8a2SBarry Smith /* factor and invert each block */ 3222bbead8a2SBarry Smith switch (bs) { 3223bbead8a2SBarry Smith case 1: 3224bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3225bbead8a2SBarry Smith ierr = MatGetValues(A,1,&i,1,&i,diag+i);CHKERRQ(ierr); 3226ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < 
PETSC_MACHINE_EPSILON) { 3227ec1892c8SHong Zhang if (allowzeropivot) { 32287b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32297b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 32307b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 32317b6c816cSBarry Smith ierr = PetscInfo3(A,"Zero pivot, row %D pivot %g tolerance %g\n",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON);CHKERRQ(ierr); 32327b6c816cSBarry Smith } else SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D pivot %g tolerance %g",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON); 3233ec1892c8SHong Zhang } 3234bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3235bbead8a2SBarry Smith } 3236bbead8a2SBarry Smith break; 3237bbead8a2SBarry Smith case 2: 3238bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3239bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 3240bbead8a2SBarry Smith ierr = MatGetValues(A,2,ij,2,ij,diag);CHKERRQ(ierr); 3241a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32427b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 324396b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr); 3244bbead8a2SBarry Smith diag += 4; 3245bbead8a2SBarry Smith } 3246bbead8a2SBarry Smith break; 3247bbead8a2SBarry Smith case 3: 3248bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3249bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 3250bbead8a2SBarry Smith ierr = MatGetValues(A,3,ij,3,ij,diag);CHKERRQ(ierr); 3251a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32527b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 325396b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr); 3254bbead8a2SBarry Smith diag += 9; 
3255bbead8a2SBarry Smith } 3256bbead8a2SBarry Smith break; 3257bbead8a2SBarry Smith case 4: 3258bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3259bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 3260bbead8a2SBarry Smith ierr = MatGetValues(A,4,ij,4,ij,diag);CHKERRQ(ierr); 3261a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32627b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 326396b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr); 3264bbead8a2SBarry Smith diag += 16; 3265bbead8a2SBarry Smith } 3266bbead8a2SBarry Smith break; 3267bbead8a2SBarry Smith case 5: 3268bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3269bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 3270bbead8a2SBarry Smith ierr = MatGetValues(A,5,ij,5,ij,diag);CHKERRQ(ierr); 3271a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32727b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 327396b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr); 3274bbead8a2SBarry Smith diag += 25; 3275bbead8a2SBarry Smith } 3276bbead8a2SBarry Smith break; 3277bbead8a2SBarry Smith case 6: 3278bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3279bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 3280bbead8a2SBarry Smith ierr = MatGetValues(A,6,ij,6,ij,diag);CHKERRQ(ierr); 3281a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32827b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 328396b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr); 
3284bbead8a2SBarry Smith diag += 36; 3285bbead8a2SBarry Smith } 3286bbead8a2SBarry Smith break; 3287bbead8a2SBarry Smith case 7: 3288bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3289bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 3290bbead8a2SBarry Smith ierr = MatGetValues(A,7,ij,7,ij,diag);CHKERRQ(ierr); 3291a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32927b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 329396b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr); 3294bbead8a2SBarry Smith diag += 49; 3295bbead8a2SBarry Smith } 3296bbead8a2SBarry Smith break; 3297bbead8a2SBarry Smith default: 3298dcca6d9dSJed Brown ierr = PetscMalloc3(bs,&v_work,bs,&v_pivots,bs,&IJ);CHKERRQ(ierr); 3299bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3300bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3301bbead8a2SBarry Smith IJ[j] = bs*i + j; 3302bbead8a2SBarry Smith } 3303bbead8a2SBarry Smith ierr = MatGetValues(A,bs,IJ,bs,IJ,diag);CHKERRQ(ierr); 33045f8bbccaSHong Zhang ierr = PetscKernel_A_gets_inverse_A(bs,diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 33057b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 330696b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_N(diag,bs);CHKERRQ(ierr); 3307bbead8a2SBarry Smith diag += bs2; 3308bbead8a2SBarry Smith } 3309bbead8a2SBarry Smith ierr = PetscFree3(v_work,v_pivots,IJ);CHKERRQ(ierr); 3310bbead8a2SBarry Smith } 3311bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3312bbead8a2SBarry Smith PetscFunctionReturn(0); 3313bbead8a2SBarry Smith } 3314bbead8a2SBarry Smith 331573a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx) 331673a71a0fSBarry Smith { 331773a71a0fSBarry Smith PetscErrorCode ierr; 
331873a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 331973a71a0fSBarry Smith PetscScalar a; 332073a71a0fSBarry Smith PetscInt m,n,i,j,col; 332173a71a0fSBarry Smith 332273a71a0fSBarry Smith PetscFunctionBegin; 332373a71a0fSBarry Smith if (!x->assembled) { 332473a71a0fSBarry Smith ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 332573a71a0fSBarry Smith for (i=0; i<m; i++) { 332673a71a0fSBarry Smith for (j=0; j<aij->imax[i]; j++) { 332773a71a0fSBarry Smith ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr); 332873a71a0fSBarry Smith col = (PetscInt)(n*PetscRealPart(a)); 332973a71a0fSBarry Smith ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr); 333073a71a0fSBarry Smith } 333173a71a0fSBarry Smith } 3332e2ce353bSJunchao Zhang } else { 3333e2ce353bSJunchao Zhang for (i=0; i<aij->nz; i++) {ierr = PetscRandomGetValue(rctx,aij->a+i);CHKERRQ(ierr);} 3334e2ce353bSJunchao Zhang } 333573a71a0fSBarry Smith ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 333673a71a0fSBarry Smith ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 333773a71a0fSBarry Smith PetscFunctionReturn(0); 333873a71a0fSBarry Smith } 333973a71a0fSBarry Smith 3340679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3341679944adSJunchao Zhang PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx) 3342679944adSJunchao Zhang { 3343679944adSJunchao Zhang PetscErrorCode ierr; 3344679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3345679944adSJunchao Zhang PetscScalar a; 3346679944adSJunchao Zhang PetscInt m,n,i,j,col,nskip; 3347679944adSJunchao Zhang 3348679944adSJunchao Zhang PetscFunctionBegin; 3349679944adSJunchao Zhang nskip = high - low; 3350679944adSJunchao Zhang ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 3351679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3352679944adSJunchao Zhang for (i=0; i<m; i++) { 
3353679944adSJunchao Zhang for (j=0; j<aij->imax[i]; j++) { 3354679944adSJunchao Zhang ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr); 3355679944adSJunchao Zhang col = (PetscInt)(n*PetscRealPart(a)); 3356679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 3357679944adSJunchao Zhang ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr); 3358679944adSJunchao Zhang } 3359e2ce353bSJunchao Zhang } 3360679944adSJunchao Zhang ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3361679944adSJunchao Zhang ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3362679944adSJunchao Zhang PetscFunctionReturn(0); 3363679944adSJunchao Zhang } 3364679944adSJunchao Zhang 3365679944adSJunchao Zhang 3366682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 33670a6ffc59SBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqAIJ, 3368cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3369cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3370cb5b572fSBarry Smith MatMult_SeqAIJ, 337197304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 33727c922b88SBarry Smith MatMultTranspose_SeqAIJ, 33737c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3374db4efbfdSBarry Smith 0, 3375db4efbfdSBarry Smith 0, 3376db4efbfdSBarry Smith 0, 3377db4efbfdSBarry Smith /* 10*/ 0, 3378cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3379cb5b572fSBarry Smith 0, 338041f059aeSBarry Smith MatSOR_SeqAIJ, 338191e9d3e2SHong Zhang MatTranspose_SeqAIJ, 338297304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3383cb5b572fSBarry Smith MatEqual_SeqAIJ, 3384cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3385cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3386cb5b572fSBarry Smith MatNorm_SeqAIJ, 338797304618SKris Buschelman /* 20*/ 0, 3388cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3389cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3390cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3391d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 
3392db4efbfdSBarry Smith 0, 3393db4efbfdSBarry Smith 0, 3394db4efbfdSBarry Smith 0, 3395db4efbfdSBarry Smith 0, 33964994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3397db4efbfdSBarry Smith 0, 3398db4efbfdSBarry Smith 0, 33998c778c55SBarry Smith 0, 34008c778c55SBarry Smith 0, 3401d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3402cb5b572fSBarry Smith 0, 3403cb5b572fSBarry Smith 0, 3404cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3405cb5b572fSBarry Smith 0, 3406d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 34077dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3408cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3409cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3410cb5b572fSBarry Smith MatCopy_SeqAIJ, 3411d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3412cb5b572fSBarry Smith MatScale_SeqAIJ, 34137d68702bSBarry Smith MatShift_SeqAIJ, 341479299369SBarry Smith MatDiagonalSet_SeqAIJ, 34156e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 341673a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 34173b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 34183b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 34193b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3420a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 342193dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3422b9617806SBarry Smith 0, 34230513a670SBarry Smith 0, 3424cda55fadSBarry Smith MatPermute_SeqAIJ, 3425cda55fadSBarry Smith 0, 3426d519adbfSMatthew Knepley /* 59*/ 0, 3427b9b97703SBarry Smith MatDestroy_SeqAIJ, 3428b9b97703SBarry Smith MatView_SeqAIJ, 3429357abbc8SBarry Smith 0, 34304222ddf1SHong Zhang 0, 34314222ddf1SHong Zhang /* 64*/ 0, 3432321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3433ee4f033dSBarry Smith 0, 3434ee4f033dSBarry Smith 0, 3435ee4f033dSBarry Smith 0, 3436d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3437c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3438ee4f033dSBarry Smith 0, 3439dcf5cc72SBarry Smith 0, 34402c93a97aSBarry Smith 0, 34412c93a97aSBarry Smith /* 74*/ 0, 
34423acb8795SBarry Smith MatFDColoringApply_AIJ, 344397304618SKris Buschelman 0, 344497304618SKris Buschelman 0, 344597304618SKris Buschelman 0, 34466ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 344797304618SKris Buschelman 0, 344897304618SKris Buschelman 0, 344997304618SKris Buschelman 0, 3450bc011b1eSHong Zhang MatLoad_SeqAIJ, 3451d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 34521cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 34536284ec50SHong Zhang 0, 34546284ec50SHong Zhang 0, 3455bc011b1eSHong Zhang 0, 34564222ddf1SHong Zhang /* 89*/ 0, 34574222ddf1SHong Zhang 0, 345826be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 34594222ddf1SHong Zhang 0, 34604222ddf1SHong Zhang 0, 34618fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 34624222ddf1SHong Zhang 0, 34634222ddf1SHong Zhang 0, 34646fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 34652121bac1SHong Zhang 0, 34664222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3467609c6c4dSKris Buschelman 0, 3468609c6c4dSKris Buschelman 0, 346987d4246cSBarry Smith MatConjugate_SeqAIJ, 347087d4246cSBarry Smith 0, 3471d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 347299cafbc1SBarry Smith MatRealPart_SeqAIJ, 3473f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3474f5edf698SHong Zhang 0, 34752bebee5dSHong Zhang 0, 3476cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3477985db425SBarry Smith 0, 34782af78befSBarry Smith MatGetRowMin_SeqAIJ, 34792af78befSBarry Smith 0, 3480599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3481d519adbfSMatthew Knepley /*114*/ 0, 3482599ef60dSHong Zhang 0, 34833c2a7987SHong Zhang 0, 3484fe97e370SBarry Smith 0, 3485fbdbba38SShri Abhyankar 0, 3486fbdbba38SShri Abhyankar /*119*/ 0, 3487fbdbba38SShri Abhyankar 0, 3488fbdbba38SShri Abhyankar 0, 348982d44351SHong Zhang 0, 3490b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 34910716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3492bbead8a2SBarry Smith MatGetColumnNorms_SeqAIJ, 
349337868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 34940da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 349537868618SMatthew G Knepley 0, 34965df89d91SHong Zhang /*129*/ 0, 34974222ddf1SHong Zhang 0, 34984222ddf1SHong Zhang 0, 349975648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3500b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3501b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 35022b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 35034222ddf1SHong Zhang 0, 35044222ddf1SHong Zhang 0, 35053964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 35063964eb88SJed Brown /*139*/0, 3507f9426fe0SMark Adams 0, 35081919a2e2SJed Brown 0, 35093a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 35109c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 35114222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 35124222ddf1SHong Zhang /*145*/MatDestroySubMatrices_SeqAIJ, 35134222ddf1SHong Zhang 0, 35144222ddf1SHong Zhang 0 35159e29f15eSvictorle }; 351617ab2063SBarry Smith 35177087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3518bef8e0ddSBarry Smith { 3519bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 352097f1f81fSBarry Smith PetscInt i,nz,n; 3521bef8e0ddSBarry Smith 3522bef8e0ddSBarry Smith PetscFunctionBegin; 3523bef8e0ddSBarry Smith nz = aij->maxnz; 3524d0f46423SBarry Smith n = mat->rmap->n; 3525bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3526bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3527bef8e0ddSBarry Smith } 3528bef8e0ddSBarry Smith aij->nz = nz; 3529bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3530bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3531bef8e0ddSBarry Smith } 3532bef8e0ddSBarry Smith PetscFunctionReturn(0); 3533bef8e0ddSBarry Smith } 3534bef8e0ddSBarry Smith 3535a3bb6f32SFande Kong /* 3536e8b528d9SFande Kong * When a sparse matrix has many zero columns, we should compact them out to save the space 3537a3bb6f32SFande Kong * This 
happens in MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3538a3bb6f32SFande Kong * */ 3539a3bb6f32SFande Kong PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3540a3bb6f32SFande Kong { 3541a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3542a3bb6f32SFande Kong PetscTable gid1_lid1; 3543a3bb6f32SFande Kong PetscTablePosition tpos; 3544a3bb6f32SFande Kong PetscInt gid,lid,i,j,ncols,ec; 3545a3bb6f32SFande Kong PetscInt *garray; 3546a3bb6f32SFande Kong PetscErrorCode ierr; 3547a3bb6f32SFande Kong 3548a3bb6f32SFande Kong PetscFunctionBegin; 3549a3bb6f32SFande Kong PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3550a3bb6f32SFande Kong PetscValidPointer(mapping,2); 3551a3bb6f32SFande Kong /* use a table */ 3552a3bb6f32SFande Kong ierr = PetscTableCreate(mat->rmap->n,mat->cmap->N+1,&gid1_lid1);CHKERRQ(ierr); 3553a3bb6f32SFande Kong ec = 0; 3554a3bb6f32SFande Kong for (i=0; i<mat->rmap->n; i++) { 3555a3bb6f32SFande Kong ncols = aij->i[i+1] - aij->i[i]; 3556a3bb6f32SFande Kong for (j=0; j<ncols; j++) { 3557a3bb6f32SFande Kong PetscInt data,gid1 = aij->j[aij->i[i] + j] + 1; 3558a3bb6f32SFande Kong ierr = PetscTableFind(gid1_lid1,gid1,&data);CHKERRQ(ierr); 3559a3bb6f32SFande Kong if (!data) { 3560a3bb6f32SFande Kong /* one based table */ 3561a3bb6f32SFande Kong ierr = PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES);CHKERRQ(ierr); 3562a3bb6f32SFande Kong } 3563a3bb6f32SFande Kong } 3564a3bb6f32SFande Kong } 3565a3bb6f32SFande Kong /* form array of columns we need */ 3566a3bb6f32SFande Kong ierr = PetscMalloc1(ec+1,&garray);CHKERRQ(ierr); 3567a3bb6f32SFande Kong ierr = PetscTableGetHeadPosition(gid1_lid1,&tpos);CHKERRQ(ierr); 3568a3bb6f32SFande Kong while (tpos) { 3569a3bb6f32SFande Kong ierr = PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid);CHKERRQ(ierr); 3570a3bb6f32SFande Kong gid--; 3571a3bb6f32SFande Kong lid--; 3572a3bb6f32SFande Kong garray[lid] = gid; 3573a3bb6f32SFande Kong } 3574a3bb6f32SFande Kong ierr = 
PetscSortInt(ec,garray);CHKERRQ(ierr); /* sort, and rebuild */ 3575a3bb6f32SFande Kong ierr = PetscTableRemoveAll(gid1_lid1);CHKERRQ(ierr); 3576a3bb6f32SFande Kong for (i=0; i<ec; i++) { 3577a3bb6f32SFande Kong ierr = PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES);CHKERRQ(ierr); 3578a3bb6f32SFande Kong } 3579a3bb6f32SFande Kong /* compact out the extra columns in B */ 3580a3bb6f32SFande Kong for (i=0; i<mat->rmap->n; i++) { 3581a3bb6f32SFande Kong ncols = aij->i[i+1] - aij->i[i]; 3582a3bb6f32SFande Kong for (j=0; j<ncols; j++) { 3583a3bb6f32SFande Kong PetscInt gid1 = aij->j[aij->i[i] + j] + 1; 3584a3bb6f32SFande Kong ierr = PetscTableFind(gid1_lid1,gid1,&lid);CHKERRQ(ierr); 3585a3bb6f32SFande Kong lid--; 3586a3bb6f32SFande Kong aij->j[aij->i[i] + j] = lid; 3587a3bb6f32SFande Kong } 3588a3bb6f32SFande Kong } 3589ca5434daSLawrence Mitchell ierr = PetscLayoutDestroy(&mat->cmap);CHKERRQ(ierr); 3590ca5434daSLawrence Mitchell ierr = PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat),ec,ec,1,&mat->cmap);CHKERRQ(ierr); 3591a3bb6f32SFande Kong ierr = PetscTableDestroy(&gid1_lid1);CHKERRQ(ierr); 3592a3bb6f32SFande Kong ierr = ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,mat->cmap->bs,mat->cmap->n,garray,PETSC_OWN_POINTER,mapping);CHKERRQ(ierr); 3593a3bb6f32SFande Kong ierr = ISLocalToGlobalMappingSetType(*mapping,ISLOCALTOGLOBALMAPPINGHASH);CHKERRQ(ierr); 3594a3bb6f32SFande Kong PetscFunctionReturn(0); 3595a3bb6f32SFande Kong } 3596a3bb6f32SFande Kong 3597bef8e0ddSBarry Smith /*@ 3598bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3599bef8e0ddSBarry Smith in the matrix. 
3600bef8e0ddSBarry Smith 3601bef8e0ddSBarry Smith Input Parameters: 3602bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3603bef8e0ddSBarry Smith - indices - the column indices 3604bef8e0ddSBarry Smith 360515091d37SBarry Smith Level: advanced 360615091d37SBarry Smith 3607bef8e0ddSBarry Smith Notes: 3608bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3609bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3610bef8e0ddSBarry Smith of the MatSetValues() operation. 3611bef8e0ddSBarry Smith 3612bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3613d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 3614bef8e0ddSBarry Smith 3615bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3616bef8e0ddSBarry Smith 3617b9617806SBarry Smith The indices should start with zero, not one. 3618b9617806SBarry Smith 3619bef8e0ddSBarry Smith @*/ 36207087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3621bef8e0ddSBarry Smith { 36224ac538c5SBarry Smith PetscErrorCode ierr; 3623bef8e0ddSBarry Smith 3624bef8e0ddSBarry Smith PetscFunctionBegin; 36250700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 36264482741eSBarry Smith PetscValidPointer(indices,2); 36274ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices));CHKERRQ(ierr); 3628bef8e0ddSBarry Smith PetscFunctionReturn(0); 3629bef8e0ddSBarry Smith } 3630bef8e0ddSBarry Smith 3631be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3632be6bf707SBarry Smith 36337087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3634be6bf707SBarry Smith { 3635be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 36366849ba73SBarry Smith PetscErrorCode ierr; 3637d0f46423SBarry Smith size_t nz = 
aij->i[mat->rmap->n]; 3638be6bf707SBarry Smith 3639be6bf707SBarry Smith PetscFunctionBegin; 3640169f6850SBarry Smith if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3641be6bf707SBarry Smith 3642be6bf707SBarry Smith /* allocate space for values if not already there */ 3643be6bf707SBarry Smith if (!aij->saved_values) { 3644854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&aij->saved_values);CHKERRQ(ierr); 36453bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)mat,(nz+1)*sizeof(PetscScalar));CHKERRQ(ierr); 3646be6bf707SBarry Smith } 3647be6bf707SBarry Smith 3648be6bf707SBarry Smith /* copy values over */ 3649580bdb30SBarry Smith ierr = PetscArraycpy(aij->saved_values,aij->a,nz);CHKERRQ(ierr); 3650be6bf707SBarry Smith PetscFunctionReturn(0); 3651be6bf707SBarry Smith } 3652be6bf707SBarry Smith 3653be6bf707SBarry Smith /*@ 3654be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3655be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3656be6bf707SBarry Smith nonlinear portion. 3657be6bf707SBarry Smith 3658be6bf707SBarry Smith Collect on Mat 3659be6bf707SBarry Smith 3660be6bf707SBarry Smith Input Parameters: 36610e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3662be6bf707SBarry Smith 366315091d37SBarry Smith Level: advanced 366415091d37SBarry Smith 3665be6bf707SBarry Smith Common Usage, with SNESSolve(): 3666be6bf707SBarry Smith $ Create Jacobian matrix 3667be6bf707SBarry Smith $ Set linear terms into matrix 3668be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3669be6bf707SBarry Smith $ final nonzero structure (i.e. 
$      setting the nonlinear terms and applying
$      boundary conditions again will not change the nonzero structure)
$    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
$    ierr = MatStoreValues(mat);
$    Call SNESSetJacobian() with matrix
$    In your Jacobian routine
$      ierr = MatRetrieveValues(mat);
$      Set nonlinear terms in matrix

  Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself:
$    // build linear portion of Jacobian
$    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
$    ierr = MatStoreValues(mat);
$    loop over nonlinear iterations
$       ierr = MatRetrieveValues(mat);
$       // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
$       // call MatAssemblyBegin/End() on matrix
$       Solve linear system with Jacobian
$    endloop

  Notes:
    Matrix must already be assembled before calling this routine
    Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before
    calling this routine.

    When this is called multiple times it overwrites the previous set of stored values
    and does not allocate additional space.
36960c468ba9SBarry Smith 3697be6bf707SBarry Smith .seealso: MatRetrieveValues() 3698be6bf707SBarry Smith 3699be6bf707SBarry Smith @*/ 37007087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3701be6bf707SBarry Smith { 37024ac538c5SBarry Smith PetscErrorCode ierr; 3703be6bf707SBarry Smith 3704be6bf707SBarry Smith PetscFunctionBegin; 37050700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3706e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3707e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 37084ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat));CHKERRQ(ierr); 3709be6bf707SBarry Smith PetscFunctionReturn(0); 3710be6bf707SBarry Smith } 3711be6bf707SBarry Smith 37127087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3713be6bf707SBarry Smith { 3714be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 37156849ba73SBarry Smith PetscErrorCode ierr; 3716d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3717be6bf707SBarry Smith 3718be6bf707SBarry Smith PetscFunctionBegin; 3719169f6850SBarry Smith if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3720f23aa3ddSBarry Smith if (!aij->saved_values) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3721be6bf707SBarry Smith /* copy values over */ 3722580bdb30SBarry Smith ierr = PetscArraycpy(aij->a,aij->saved_values,nz);CHKERRQ(ierr); 3723be6bf707SBarry Smith PetscFunctionReturn(0); 3724be6bf707SBarry Smith } 3725be6bf707SBarry Smith 3726be6bf707SBarry Smith /*@ 3727be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3728be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3729be6bf707SBarry Smith nonlinear portion. 
3730be6bf707SBarry Smith 3731be6bf707SBarry Smith Collect on Mat 3732be6bf707SBarry Smith 3733be6bf707SBarry Smith Input Parameters: 3734386f7cf9SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3735be6bf707SBarry Smith 373615091d37SBarry Smith Level: advanced 373715091d37SBarry Smith 3738be6bf707SBarry Smith .seealso: MatStoreValues() 3739be6bf707SBarry Smith 3740be6bf707SBarry Smith @*/ 37417087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3742be6bf707SBarry Smith { 37434ac538c5SBarry Smith PetscErrorCode ierr; 3744be6bf707SBarry Smith 3745be6bf707SBarry Smith PetscFunctionBegin; 37460700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3747e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3748e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 37494ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat));CHKERRQ(ierr); 3750be6bf707SBarry Smith PetscFunctionReturn(0); 3751be6bf707SBarry Smith } 3752be6bf707SBarry Smith 3753f83d6046SBarry Smith 3754be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 375517ab2063SBarry Smith /*@C 3756682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 37570d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 37586e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 375951c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 37602bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 
376117ab2063SBarry Smith 3762d083f849SBarry Smith Collective 3763db81eaa0SLois Curfman McInnes 376417ab2063SBarry Smith Input Parameters: 3765db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 376617ab2063SBarry Smith . m - number of rows 376717ab2063SBarry Smith . n - number of columns 376817ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 376951c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 37700298fd71SBarry Smith (possibly different for each row) or NULL 377117ab2063SBarry Smith 377217ab2063SBarry Smith Output Parameter: 3773416022c9SBarry Smith . A - the matrix 377417ab2063SBarry Smith 3775175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3776f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 3777175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3778175b88e8SBarry Smith 3779b259b22eSLois Curfman McInnes Notes: 378049a6f317SBarry Smith If nnz is given then nz is ignored 378149a6f317SBarry Smith 378217ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 378317ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 37840002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 378544cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 378617ab2063SBarry Smith 378717ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 37880298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 37893d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 37906da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 
379117ab2063SBarry Smith 3792682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 37934fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3794682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 37956c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 37966c7ebb05SLois Curfman McInnes 37976c7ebb05SLois Curfman McInnes Options Database Keys: 3798698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 37999db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 380017ab2063SBarry Smith 3801027ccd11SLois Curfman McInnes Level: intermediate 3802027ccd11SLois Curfman McInnes 380369b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 380436db0b34SBarry Smith 380517ab2063SBarry Smith @*/ 38067087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 380717ab2063SBarry Smith { 3808dfbe8321SBarry Smith PetscErrorCode ierr; 38096945ee14SBarry Smith 38103a40ed3dSBarry Smith PetscFunctionBegin; 3811f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 3812117016b1SBarry Smith ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 3813c4752a88SBarry Smith ierr = MatSetType(*A,MATSEQAIJ);CHKERRQ(ierr); 3814d28bb7d2SJed Brown ierr = MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz);CHKERRQ(ierr); 3815273d9f13SBarry Smith PetscFunctionReturn(0); 3816273d9f13SBarry Smith } 3817273d9f13SBarry Smith 3818273d9f13SBarry Smith /*@C 3819273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3820273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3821273d9f13SBarry Smith (or the array nnz). 
By setting these parameters accurately, performance 3822273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3823273d9f13SBarry Smith 3824d083f849SBarry Smith Collective 3825273d9f13SBarry Smith 3826273d9f13SBarry Smith Input Parameters: 38271c4f3114SJed Brown + B - The matrix 3828273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3829273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38300298fd71SBarry Smith (possibly different for each row) or NULL 3831273d9f13SBarry Smith 3832273d9f13SBarry Smith Notes: 383349a6f317SBarry Smith If nnz is given then nz is ignored 383449a6f317SBarry Smith 3835273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3836273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3837273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3838273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3839273d9f13SBarry Smith 3840273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 38410298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 3842273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3843273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3844273d9f13SBarry Smith 3845aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3846aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3847aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3848aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3849aa95bbe8SBarry Smith 3850a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3851a96a251dSBarry Smith entries or columns indices 3852a96a251dSBarry Smith 3853273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3854273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3855273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3856273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3857273d9f13SBarry Smith 3858273d9f13SBarry Smith Options Database Keys: 3859698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 386047b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3861273d9f13SBarry Smith 3862273d9f13SBarry Smith Level: intermediate 3863273d9f13SBarry Smith 386469b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays(), MatGetInfo() 3865273d9f13SBarry Smith 3866273d9f13SBarry Smith @*/ 38677087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3868273d9f13SBarry Smith { 38694ac538c5SBarry Smith PetscErrorCode ierr; 3870a23d5eceSKris Buschelman 3871a23d5eceSKris Buschelman PetscFunctionBegin; 38726ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 38736ba663aaSJed Brown PetscValidType(B,1); 38744ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz));CHKERRQ(ierr); 3875a23d5eceSKris Buschelman PetscFunctionReturn(0); 3876a23d5eceSKris Buschelman } 3877a23d5eceSKris Buschelman 38787087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3879a23d5eceSKris Buschelman { 3880273d9f13SBarry Smith Mat_SeqAIJ *b; 38812576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE,realalloc = PETSC_FALSE; 
38826849ba73SBarry Smith PetscErrorCode ierr; 388397f1f81fSBarry Smith PetscInt i; 3884273d9f13SBarry Smith 3885273d9f13SBarry Smith PetscFunctionBegin; 38862576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3887a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3888c461c341SBarry Smith skipallocation = PETSC_TRUE; 3889c461c341SBarry Smith nz = 0; 3890c461c341SBarry Smith } 389126283091SBarry Smith ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 389226283091SBarry Smith ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 3893899cda47SBarry Smith 3894435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 389560e0710aSBarry Smith if (nz < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %D",nz); 3896cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3897d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 389860e0710aSBarry Smith if (nnz[i] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %D value %D",i,nnz[i]); 389960e0710aSBarry Smith if (nnz[i] > B->cmap->n) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %D value %d rowlength %D",i,nnz[i],B->cmap->n); 3900b73539f3SBarry Smith } 3901b73539f3SBarry Smith } 3902b73539f3SBarry Smith 3903273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39042205254eSKarl Rupp 3905273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 3906273d9f13SBarry Smith 3907ab93d7beSBarry Smith if (!skipallocation) { 39082ee49352SLisandro Dalcin if (!b->imax) { 3909071fcb05SBarry Smith ierr = PetscMalloc1(B->rmap->n,&b->imax);CHKERRQ(ierr); 3910071fcb05SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3911071fcb05SBarry Smith } 3912071fcb05SBarry Smith if (!b->ilen) { 3913071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 3914071fcb05SBarry Smith ierr = PetscCalloc1(B->rmap->n,&b->ilen);CHKERRQ(ierr); 3915071fcb05SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3916071fcb05SBarry Smith } else { 3917071fcb05SBarry Smith ierr = PetscMemzero(b->ilen,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 39182ee49352SLisandro Dalcin } 3919846b4da1SFande Kong if (!b->ipre) { 3920846b4da1SFande Kong ierr = PetscMalloc1(B->rmap->n,&b->ipre);CHKERRQ(ierr); 3921846b4da1SFande Kong ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3922846b4da1SFande Kong } 3923273d9f13SBarry Smith if (!nnz) { 3924435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3925c62bd62aSJed Brown else if (nz < 0) nz = 1; 39265d2a9ed1SStefano Zampini nz = PetscMin(nz,B->cmap->n); 3927d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 3928d0f46423SBarry Smith nz = nz*B->rmap->n; 3929273d9f13SBarry Smith } else { 3930c73702f5SBarry Smith PetscInt64 nz64 = 0; 3931c73702f5SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz64 += nnz[i];} 3932c73702f5SBarry Smith ierr = PetscIntCast(nz64,&nz);CHKERRQ(ierr); 3933273d9f13SBarry Smith } 3934ab93d7beSBarry Smith 3935273d9f13SBarry Smith /* allocate the matrix space */ 393653dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39372ee49352SLisandro Dalcin ierr = MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i);CHKERRQ(ierr); 3938396832f4SHong Zhang if (B->structure_only) { 39395848002fSHong Zhang ierr = PetscMalloc1(nz,&b->j);CHKERRQ(ierr); 39405848002fSHong Zhang ierr = PetscMalloc1(B->rmap->n+1,&b->i);CHKERRQ(ierr); 3941396832f4SHong Zhang ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*sizeof(PetscInt));CHKERRQ(ierr); 3942396832f4SHong Zhang } else { 3943dcca6d9dSJed Brown ierr = PetscMalloc3(nz,&b->a,nz,&b->j,B->rmap->n+1,&b->i);CHKERRQ(ierr); 39443bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)));CHKERRQ(ierr); 3945396832f4SHong Zhang } 3946bfeeae90SHong Zhang b->i[0] = 0; 3947d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 39485da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 39495da197adSKris Buschelman } 3950396832f4SHong Zhang if (B->structure_only) { 3951396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 3952396832f4SHong Zhang b->free_a = PETSC_FALSE; 3953396832f4SHong Zhang } else { 3954273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3955e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3956396832f4SHong Zhang } 3957e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3958c461c341SBarry Smith } else { 3959e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3960e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3961c461c341SBarry Smith } 3962273d9f13SBarry Smith 3963846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 3964846b4da1SFande Kong /* reserve user-requested sparsity */ 3965580bdb30SBarry Smith ierr = PetscArraycpy(b->ipre,b->imax,B->rmap->n);CHKERRQ(ierr); 3966846b4da1SFande Kong } 3967846b4da1SFande Kong 3968846b4da1SFande Kong 3969273d9f13SBarry Smith b->nz = 0; 3970273d9f13SBarry Smith b->maxnz = nz; 3971273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 39722205254eSKarl Rupp if (realalloc) { 39732205254eSKarl Rupp ierr = 
MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 39742205254eSKarl Rupp } 3975cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 3976cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 3977273d9f13SBarry Smith PetscFunctionReturn(0); 3978273d9f13SBarry Smith } 3979273d9f13SBarry Smith 3980846b4da1SFande Kong 3981846b4da1SFande Kong PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 3982846b4da1SFande Kong { 3983846b4da1SFande Kong Mat_SeqAIJ *a; 3984a5bbaf83SFande Kong PetscInt i; 3985846b4da1SFande Kong PetscErrorCode ierr; 3986846b4da1SFande Kong 3987846b4da1SFande Kong PetscFunctionBegin; 3988846b4da1SFande Kong PetscValidHeaderSpecific(A,MAT_CLASSID,1); 398914d0e64fSAlex Lindsay 399014d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 399114d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 399214d0e64fSAlex Lindsay 3993846b4da1SFande Kong a = (Mat_SeqAIJ*)A->data; 39942c814fdeSFande Kong /* if no saved info, we error out */ 3995fb4dc15dSAlex Lindsay if (!a->ipre) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"No saved preallocation info \n"); 39962c814fdeSFande Kong 3997fb4dc15dSAlex Lindsay if (!a->i || !a->j || !a->a || !a->imax || !a->ilen) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Memory info is incomplete, and can not reset preallocation \n"); 39982c814fdeSFande Kong 3999580bdb30SBarry Smith ierr = PetscArraycpy(a->imax,a->ipre,A->rmap->n);CHKERRQ(ierr); 4000580bdb30SBarry Smith ierr = PetscArrayzero(a->ilen,A->rmap->n);CHKERRQ(ierr); 4001846b4da1SFande Kong a->i[0] = 0; 4002846b4da1SFande Kong for (i=1; i<A->rmap->n+1; i++) { 4003846b4da1SFande Kong a->i[i] = a->i[i-1] + a->imax[i-1]; 4004846b4da1SFande Kong } 4005846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4006846b4da1SFande Kong a->nz = 0; 4007846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4008846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4009846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4010846b4da1SFande Kong A->assembled = 
PETSC_FALSE; 4011846b4da1SFande Kong PetscFunctionReturn(0); 4012846b4da1SFande Kong } 4013846b4da1SFande Kong 401458d36128SBarry Smith /*@ 4015a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 4016a1661176SMatthew Knepley 4017a1661176SMatthew Knepley Input Parameters: 4018a1661176SMatthew Knepley + B - the matrix 4019a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4020a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4021a1661176SMatthew Knepley - v - optional values in the matrix 4022a1661176SMatthew Knepley 4023a1661176SMatthew Knepley Level: developer 4024a1661176SMatthew Knepley 402558d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 402658d36128SBarry Smith 4027c1c1d628SHong Zhang .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatSeqAIJSetPreallocation(), MatCreateSeqAIJ(), MATSEQAIJ 4028a1661176SMatthew Knepley @*/ 4029a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 4030a1661176SMatthew Knepley { 4031a1661176SMatthew Knepley PetscErrorCode ierr; 4032a1661176SMatthew Knepley 4033a1661176SMatthew Knepley PetscFunctionBegin; 40340700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 40356ba663aaSJed Brown PetscValidType(B,1); 40364ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v));CHKERRQ(ierr); 4037a1661176SMatthew Knepley PetscFunctionReturn(0); 4038a1661176SMatthew Knepley } 4039a1661176SMatthew Knepley 40407087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 4041a1661176SMatthew Knepley { 4042a1661176SMatthew Knepley PetscInt 
i; 4043a1661176SMatthew Knepley PetscInt m,n; 4044a1661176SMatthew Knepley PetscInt nz; 4045a1661176SMatthew Knepley PetscInt *nnz, nz_max = 0; 4046a1661176SMatthew Knepley PetscErrorCode ierr; 4047a1661176SMatthew Knepley 4048a1661176SMatthew Knepley PetscFunctionBegin; 404965e19b50SBarry Smith if (Ii[0]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %D", Ii[0]); 4050779a8d59SSatish Balay 4051779a8d59SSatish Balay ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 4052779a8d59SSatish Balay ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 4053779a8d59SSatish Balay 4054779a8d59SSatish Balay ierr = MatGetSize(B, &m, &n);CHKERRQ(ierr); 4055854ce69bSBarry Smith ierr = PetscMalloc1(m+1, &nnz);CHKERRQ(ierr); 4056a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4057b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 4058a1661176SMatthew Knepley nz_max = PetscMax(nz_max, nz); 405965e19b50SBarry Smith if (nz < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %D has a negative number of columns %D", i, nnz); 4060a1661176SMatthew Knepley nnz[i] = nz; 4061a1661176SMatthew Knepley } 4062a1661176SMatthew Knepley ierr = MatSeqAIJSetPreallocation(B, 0, nnz);CHKERRQ(ierr); 4063a1661176SMatthew Knepley ierr = PetscFree(nnz);CHKERRQ(ierr); 4064a1661176SMatthew Knepley 4065a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4066071fcb05SBarry Smith ierr = MatSetValues_SeqAIJ(B, 1, &i, Ii[i+1] - Ii[i], J+Ii[i], v ? 
v + Ii[i] : NULL, INSERT_VALUES);CHKERRQ(ierr); 4067a1661176SMatthew Knepley } 4068a1661176SMatthew Knepley 4069a1661176SMatthew Knepley ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4070a1661176SMatthew Knepley ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4071a1661176SMatthew Knepley 40727827cd58SJed Brown ierr = MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 4073a1661176SMatthew Knepley PetscFunctionReturn(0); 4074a1661176SMatthew Knepley } 4075a1661176SMatthew Knepley 4076c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4077af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4078170fe5c8SBarry Smith 4079170fe5c8SBarry Smith /* 4080170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4081170fe5c8SBarry Smith 4082170fe5c8SBarry Smith n p p 4083170fe5c8SBarry Smith ( ) ( ) ( ) 4084170fe5c8SBarry Smith m ( A ) * n ( B ) = m ( C ) 4085170fe5c8SBarry Smith ( ) ( ) ( ) 4086170fe5c8SBarry Smith 4087170fe5c8SBarry Smith */ 4088170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 4089170fe5c8SBarry Smith { 4090170fe5c8SBarry Smith PetscErrorCode ierr; 4091170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 4092170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 4093170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 40941de00fd4SBarry Smith PetscInt i,n,m,q,p; 4095170fe5c8SBarry Smith const PetscInt *ii,*idx; 4096170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 4097170fe5c8SBarry Smith PetscScalar *c,*c_q; 4098170fe5c8SBarry Smith 4099170fe5c8SBarry Smith PetscFunctionBegin; 4100d0f46423SBarry Smith m = A->rmap->n; 4101d0f46423SBarry Smith n = A->cmap->n; 4102d0f46423SBarry Smith p = B->cmap->n; 4103170fe5c8SBarry Smith a = sub_a->v; 4104170fe5c8SBarry Smith b = sub_b->a; 4105170fe5c8SBarry Smith c = sub_c->v; 4106580bdb30SBarry Smith ierr = PetscArrayzero(c,m*p);CHKERRQ(ierr); 
4107170fe5c8SBarry Smith 4108170fe5c8SBarry Smith ii = sub_b->i; 4109170fe5c8SBarry Smith idx = sub_b->j; 4110170fe5c8SBarry Smith for (i=0; i<n; i++) { 4111170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 4112170fe5c8SBarry Smith while (q-->0) { 4113170fe5c8SBarry Smith c_q = c + m*(*idx); 4114170fe5c8SBarry Smith a_q = a + m*i; 4115854c7f52SBarry Smith PetscKernelAXPY(c_q,*b,a_q,m); 4116170fe5c8SBarry Smith idx++; 4117170fe5c8SBarry Smith b++; 4118170fe5c8SBarry Smith } 4119170fe5c8SBarry Smith } 4120170fe5c8SBarry Smith PetscFunctionReturn(0); 4121170fe5c8SBarry Smith } 4122170fe5c8SBarry Smith 41234222ddf1SHong Zhang PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat C) 4124170fe5c8SBarry Smith { 4125170fe5c8SBarry Smith PetscErrorCode ierr; 4126d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 4127170fe5c8SBarry Smith 4128170fe5c8SBarry Smith PetscFunctionBegin; 412960e0710aSBarry Smith if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %D != B->rmap->n %D\n",A->cmap->n,B->rmap->n); 41304222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 41314222ddf1SHong Zhang ierr = MatSetBlockSizesFromMats(C,A,B);CHKERRQ(ierr); 41324222ddf1SHong Zhang ierr = MatSetType(C,MATSEQDENSE);CHKERRQ(ierr); 41334222ddf1SHong Zhang ierr = MatSeqDenseSetPreallocation(C,NULL);CHKERRQ(ierr); 4134d73949e8SHong Zhang 41354222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4136170fe5c8SBarry Smith PetscFunctionReturn(0); 4137170fe5c8SBarry Smith } 4138170fe5c8SBarry Smith 4139170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 41400bad9183SKris Buschelman /*MC 4141fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 41420bad9183SKris Buschelman based on compressed sparse row format. 

   Options Database Keys:
. -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()

   Level: beginner

   Notes:
    MatSetValues() may be called for this matrix type with a NULL argument for the numerical values,
    in this case the values associated with the rows and columns one passes in are set to zero
    in the matrix

    MatSetOption(mat,MAT_STRUCTURE_ONLY,PETSC_TRUE) may be called for this matrix type. In this case no
    space is allocated for the nonzero entries and any entries passed with MatSetValues() are ignored

  Developer Notes:
    It would be nice if all matrix formats supported passing NULL in for the numerical values

.seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType
M*/

/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to MATSEQAIJ when constructed with a single process communicator,
   and MATMPIAIJ otherwise.  As a result, for single process communicators,
   MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.
4171ccd284c7SBarry Smith 4172ccd284c7SBarry Smith Options Database Keys: 4173ccd284c7SBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to MatSetFromOptions() 4174ccd284c7SBarry Smith 417595452b02SPatrick Sanan Developer Notes: 4176ca9cdca7SRichard Tran Mills Subclasses include MATAIJCUSPARSE, MATAIJPERM, MATAIJSELL, MATAIJMKL, MATAIJCRL, and also automatically switches over to use inodes when 4177ccd284c7SBarry Smith enough exist. 4178ccd284c7SBarry Smith 4179ccd284c7SBarry Smith Level: beginner 4180ccd284c7SBarry Smith 4181ccd284c7SBarry Smith .seealso: MatCreateAIJ(), MatCreateSeqAIJ(), MATSEQAIJ,MATMPIAIJ 4182ccd284c7SBarry Smith M*/ 4183ccd284c7SBarry Smith 4184ccd284c7SBarry Smith /*MC 4185ccd284c7SBarry Smith MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices. 4186ccd284c7SBarry Smith 4187ccd284c7SBarry Smith This matrix type is identical to MATSEQAIJCRL when constructed with a single process communicator, 4188ccd284c7SBarry Smith and MATMPIAIJCRL otherwise. As a result, for single process communicators, 4189ccd284c7SBarry Smith MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported 4190ccd284c7SBarry Smith for communicators controlling multiple processes. It is recommended that you call both of 4191ccd284c7SBarry Smith the above preallocation routines for simplicity. 4192ccd284c7SBarry Smith 4193ccd284c7SBarry Smith Options Database Keys: 4194ccd284c7SBarry Smith . 
-mat_type aijcrl - sets the matrix type to "aijcrl" during a call to MatSetFromOptions() 4195ccd284c7SBarry Smith 4196ccd284c7SBarry Smith Level: beginner 4197ccd284c7SBarry Smith 4198ccd284c7SBarry Smith .seealso: MatCreateMPIAIJCRL,MATSEQAIJCRL,MATMPIAIJCRL, MATSEQAIJCRL, MATMPIAIJCRL 4199ccd284c7SBarry Smith M*/ 4200ccd284c7SBarry Smith 42017906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*); 42027906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 42037906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat,MatType,MatReuse,Mat*); 42047906f579SHong Zhang #endif 42057906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE) 42067906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A,MatType,MatReuse,Mat*); 42077906f579SHong Zhang #endif 42087906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqDense(Mat,MatType,MatReuse,Mat*); 42097906f579SHong Zhang 4210d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat,MatType,MatReuse,Mat*); 4211c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat,MatType,MatReuse,Mat*); 42124222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat); 42137906f579SHong Zhang 42148c778c55SBarry Smith /*@C 42158f1ea47aSStefano Zampini MatSeqAIJGetArray - gives read/write access to the array where the data for a MATSEQAIJ matrix is stored 42168c778c55SBarry Smith 42178c778c55SBarry Smith Not Collective 42188c778c55SBarry Smith 42198c778c55SBarry Smith Input Parameter: 4220579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 42218c778c55SBarry Smith 42228c778c55SBarry Smith Output Parameter: 42238c778c55SBarry Smith . 
array - pointer to the data 42248c778c55SBarry Smith 42258c778c55SBarry Smith Level: intermediate 42268c778c55SBarry Smith 4227774cf152SJed Brown .seealso: MatSeqAIJRestoreArray(), MatSeqAIJGetArrayF90() 42288c778c55SBarry Smith @*/ 42298c778c55SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A,PetscScalar **array) 42308c778c55SBarry Smith { 42318c778c55SBarry Smith PetscErrorCode ierr; 42328c778c55SBarry Smith 42338c778c55SBarry Smith PetscFunctionBegin; 42348c778c55SBarry Smith ierr = PetscUseMethod(A,"MatSeqAIJGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 42358c778c55SBarry Smith PetscFunctionReturn(0); 42368c778c55SBarry Smith } 42378c778c55SBarry Smith 423821e72a00SBarry Smith /*@C 42398f1ea47aSStefano Zampini MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a MATSEQAIJ matrix is stored 42408f1ea47aSStefano Zampini 42418f1ea47aSStefano Zampini Not Collective 42428f1ea47aSStefano Zampini 42438f1ea47aSStefano Zampini Input Parameter: 42448f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 42458f1ea47aSStefano Zampini 42468f1ea47aSStefano Zampini Output Parameter: 42478f1ea47aSStefano Zampini . 
array - pointer to the data 42488f1ea47aSStefano Zampini 42498f1ea47aSStefano Zampini Level: intermediate 42508f1ea47aSStefano Zampini 42518f1ea47aSStefano Zampini .seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayRead() 42528f1ea47aSStefano Zampini @*/ 42538f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJGetArrayRead(Mat A,const PetscScalar **array) 42548f1ea47aSStefano Zampini { 42558f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4256c70f7ee4SJunchao Zhang PetscOffloadMask oval; 42578f1ea47aSStefano Zampini #endif 42588f1ea47aSStefano Zampini PetscErrorCode ierr; 42598f1ea47aSStefano Zampini 42608f1ea47aSStefano Zampini PetscFunctionBegin; 42618f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4262c70f7ee4SJunchao Zhang oval = A->offloadmask; 42638f1ea47aSStefano Zampini #endif 42648f1ea47aSStefano Zampini ierr = MatSeqAIJGetArray(A,(PetscScalar**)array);CHKERRQ(ierr); 42658f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4266c70f7ee4SJunchao Zhang if (oval == PETSC_OFFLOAD_GPU || oval == PETSC_OFFLOAD_BOTH) A->offloadmask = PETSC_OFFLOAD_BOTH; 42678f1ea47aSStefano Zampini #endif 42688f1ea47aSStefano Zampini PetscFunctionReturn(0); 42698f1ea47aSStefano Zampini } 42708f1ea47aSStefano Zampini 42718f1ea47aSStefano Zampini /*@C 42728f1ea47aSStefano Zampini MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from MatSeqAIJGetArrayRead 42738f1ea47aSStefano Zampini 42748f1ea47aSStefano Zampini Not Collective 42758f1ea47aSStefano Zampini 42768f1ea47aSStefano Zampini Input Parameter: 42778f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 42788f1ea47aSStefano Zampini 42798f1ea47aSStefano Zampini Output Parameter: 42808f1ea47aSStefano Zampini . 
array - pointer to the data 42818f1ea47aSStefano Zampini 42828f1ea47aSStefano Zampini Level: intermediate 42838f1ea47aSStefano Zampini 42848f1ea47aSStefano Zampini .seealso: MatSeqAIJGetArray(), MatSeqAIJGetArrayRead() 42858f1ea47aSStefano Zampini @*/ 42868f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A,const PetscScalar **array) 42878f1ea47aSStefano Zampini { 42888f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4289c70f7ee4SJunchao Zhang PetscOffloadMask oval; 42908f1ea47aSStefano Zampini #endif 42918f1ea47aSStefano Zampini PetscErrorCode ierr; 42928f1ea47aSStefano Zampini 42938f1ea47aSStefano Zampini PetscFunctionBegin; 42948f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4295c70f7ee4SJunchao Zhang oval = A->offloadmask; 42968f1ea47aSStefano Zampini #endif 42978f1ea47aSStefano Zampini ierr = MatSeqAIJRestoreArray(A,(PetscScalar**)array);CHKERRQ(ierr); 42988f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4299c70f7ee4SJunchao Zhang A->offloadmask = oval; 43008f1ea47aSStefano Zampini #endif 43018f1ea47aSStefano Zampini PetscFunctionReturn(0); 43028f1ea47aSStefano Zampini } 43038f1ea47aSStefano Zampini 43048f1ea47aSStefano Zampini /*@C 430521e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 430621e72a00SBarry Smith 430721e72a00SBarry Smith Not Collective 430821e72a00SBarry Smith 430921e72a00SBarry Smith Input Parameter: 4310579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 431121e72a00SBarry Smith 431221e72a00SBarry Smith Output Parameter: 431321e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row 431421e72a00SBarry Smith 431521e72a00SBarry Smith Level: intermediate 431621e72a00SBarry Smith 431721e72a00SBarry Smith .seealso: MatSeqAIJRestoreArray(), MatSeqAIJGetArrayF90() 431821e72a00SBarry Smith @*/ 431921e72a00SBarry Smith PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A,PetscInt *nz) 432021e72a00SBarry Smith { 432121e72a00SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 432221e72a00SBarry Smith 432321e72a00SBarry Smith PetscFunctionBegin; 432421e72a00SBarry Smith *nz = aij->rmax; 432521e72a00SBarry Smith PetscFunctionReturn(0); 432621e72a00SBarry Smith } 432721e72a00SBarry Smith 43288c778c55SBarry Smith /*@C 4329579dbff0SBarry Smith MatSeqAIJRestoreArray - returns access to the array where the data for a MATSEQAIJ matrix is stored obtained by MatSeqAIJGetArray() 43308c778c55SBarry Smith 43318c778c55SBarry Smith Not Collective 43328c778c55SBarry Smith 43338c778c55SBarry Smith Input Parameters: 4334a2b725a8SWilliam Gropp + mat - a MATSEQAIJ matrix 4335a2b725a8SWilliam Gropp - array - pointer to the data 43368c778c55SBarry Smith 43378c778c55SBarry Smith Level: intermediate 43388c778c55SBarry Smith 4339774cf152SJed Brown .seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayF90() 43408c778c55SBarry Smith @*/ 43418c778c55SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A,PetscScalar **array) 43428c778c55SBarry Smith { 43438c778c55SBarry Smith PetscErrorCode ierr; 43448c778c55SBarry Smith 43458c778c55SBarry Smith PetscFunctionBegin; 43468c778c55SBarry Smith ierr = PetscUseMethod(A,"MatSeqAIJRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 43478c778c55SBarry Smith PetscFunctionReturn(0); 43488c778c55SBarry Smith } 43498c778c55SBarry Smith 435034b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 4351*0ce8acdeSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat); 435202fe1965SBarry Smith #endif 435302fe1965SBarry Smith 43548cc058d9SJed Brown PETSC_EXTERN PetscErrorCode 
MatCreate_SeqAIJ(Mat B) 4355273d9f13SBarry Smith { 4356273d9f13SBarry Smith Mat_SeqAIJ *b; 4357dfbe8321SBarry Smith PetscErrorCode ierr; 435838baddfdSBarry Smith PetscMPIInt size; 4359273d9f13SBarry Smith 4360273d9f13SBarry Smith PetscFunctionBegin; 4361ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr); 4362e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 4363273d9f13SBarry Smith 4364b00a9115SJed Brown ierr = PetscNewLog(B,&b);CHKERRQ(ierr); 43652205254eSKarl Rupp 4366b0a32e0cSBarry Smith B->data = (void*)b; 43672205254eSKarl Rupp 4368549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 4369071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 43702205254eSKarl Rupp 4371416022c9SBarry Smith b->row = 0; 4372416022c9SBarry Smith b->col = 0; 437382bf6240SBarry Smith b->icol = 0; 4374b810aeb4SBarry Smith b->reallocs = 0; 437536db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4376f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4377416022c9SBarry Smith b->nonew = 0; 4378416022c9SBarry Smith b->diag = 0; 4379416022c9SBarry Smith b->solve_work = 0; 43802a1b7f2aSHong Zhang B->spptr = 0; 4381be6bf707SBarry Smith b->saved_values = 0; 4382d7f994e1SBarry Smith b->idiag = 0; 438371f1c65dSBarry Smith b->mdiag = 0; 438471f1c65dSBarry Smith b->ssor_work = 0; 438571f1c65dSBarry Smith b->omega = 1.0; 438671f1c65dSBarry Smith b->fshift = 0.0; 438771f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4388bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4389a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 439017ab2063SBarry Smith 439135d8aa7fSBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 4392bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJGetArray_C",MatSeqAIJGetArray_SeqAIJ);CHKERRQ(ierr); 4393bdf89e91SBarry 
Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJRestoreArray_C",MatSeqAIJRestoreArray_SeqAIJ);CHKERRQ(ierr); 43948c778c55SBarry Smith 4395b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 4396bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEnginePut_C",MatlabEnginePut_SeqAIJ);CHKERRQ(ierr); 4397bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEngineGet_C",MatlabEngineGet_SeqAIJ);CHKERRQ(ierr); 4398b3866ffcSBarry Smith #endif 439917f1a0eaSHong Zhang 4400bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetColumnIndices_C",MatSeqAIJSetColumnIndices_SeqAIJ);CHKERRQ(ierr); 4401bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqAIJ);CHKERRQ(ierr); 4402bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqAIJ);CHKERRQ(ierr); 4403bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsbaij_C",MatConvert_SeqAIJ_SeqSBAIJ);CHKERRQ(ierr); 4404bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqbaij_C",MatConvert_SeqAIJ_SeqBAIJ);CHKERRQ(ierr); 4405bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijperm_C",MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 44064dfdc2d9SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijsell_C",MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr); 44079779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 44084a2a386eSRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijmkl_C",MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr); 4409191b95cbSRichard Tran Mills #endif 441034b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 441102fe1965SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcusparse_C",MatConvert_SeqAIJ_SeqAIJCUSPARSE);CHKERRQ(ierr); 44124222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",MatProductSetFromOptions_SeqAIJ);CHKERRQ(ierr); 441302fe1965SBarry Smith #endif 4414bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C",MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 4415af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 4416af8000cdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_elemental_C",MatConvert_SeqAIJ_Elemental);CHKERRQ(ierr); 4417af8000cdSHong Zhang #endif 441863c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 441963c07aadSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_hypre_C",MatConvert_AIJ_HYPRE);CHKERRQ(ierr); 44204222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",MatProductSetFromOptions_Transpose_AIJ_AIJ);CHKERRQ(ierr); 442163c07aadSStefano Zampini #endif 4422b49cda9fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqdense_C",MatConvert_SeqAIJ_SeqDense);CHKERRQ(ierr); 4423d4002b98SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsell_C",MatConvert_SeqAIJ_SeqSELL);CHKERRQ(ierr); 4424c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_is_C",MatConvert_XAIJ_IS);CHKERRQ(ierr); 4425bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatIsTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 4426bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatIsHermitianTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 4427bdf89e91SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",MatSeqAIJSetPreallocation_SeqAIJ);CHKERRQ(ierr); 4428846b4da1SFande Kong ierr = PetscObjectComposeFunction((PetscObject)B,"MatResetPreallocation_C",MatResetPreallocation_SeqAIJ);CHKERRQ(ierr); 4429bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C",MatSeqAIJSetPreallocationCSR_SeqAIJ);CHKERRQ(ierr); 4430bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatReorderForNonzeroDiagonal_C",MatReorderForNonzeroDiagonal_SeqAIJ);CHKERRQ(ierr); 4431bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultSymbolic_seqdense_seqaij_C",MatMatMultSymbolic_SeqDense_SeqAIJ);CHKERRQ(ierr); 4432bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMatMultNumeric_seqdense_seqaij_C",MatMatMultNumeric_SeqDense_SeqAIJ);CHKERRQ(ierr); 44334222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_is_seqaij_C",MatProductSetFromOptions_IS_XAIJ);CHKERRQ(ierr); 44344222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqaij_C",MatProductSetFromOptions_SeqDense_SeqAIJ);CHKERRQ(ierr); 44354222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaij_C",MatProductSetFromOptions_SeqAIJ);CHKERRQ(ierr); 44364108e4d5SBarry Smith ierr = MatCreate_SeqAIJ_Inode(B);CHKERRQ(ierr); 443717667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 44384099cc6bSBarry Smith ierr = MatSeqAIJSetTypeFromOptions(B);CHKERRQ(ierr); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 44393a40ed3dSBarry Smith PetscFunctionReturn(0); 444017ab2063SBarry Smith } 444117ab2063SBarry Smith 4442b24902e0SBarry Smith /* 4443b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 4444b24902e0SBarry Smith */ 
4445ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 444617ab2063SBarry Smith { 4447416022c9SBarry Smith Mat_SeqAIJ *c,*a = (Mat_SeqAIJ*)A->data; 44486849ba73SBarry Smith PetscErrorCode ierr; 4449071fcb05SBarry Smith PetscInt m = A->rmap->n,i; 445017ab2063SBarry Smith 44513a40ed3dSBarry Smith PetscFunctionBegin; 4452273d9f13SBarry Smith c = (Mat_SeqAIJ*)C->data; 4453273d9f13SBarry Smith 4454d5f3da31SBarry Smith C->factortype = A->factortype; 4455416022c9SBarry Smith c->row = 0; 4456416022c9SBarry Smith c->col = 0; 445782bf6240SBarry Smith c->icol = 0; 44586ad4291fSHong Zhang c->reallocs = 0; 445917ab2063SBarry Smith 44606ad4291fSHong Zhang C->assembled = PETSC_TRUE; 446117ab2063SBarry Smith 4462aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&C->rmap);CHKERRQ(ierr); 4463aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&C->cmap);CHKERRQ(ierr); 4464eec197d1SBarry Smith 4465071fcb05SBarry Smith ierr = PetscMalloc1(m,&c->imax);CHKERRQ(ierr); 4466071fcb05SBarry Smith ierr = PetscMemcpy(c->imax,a->imax,m*sizeof(PetscInt));CHKERRQ(ierr); 4467071fcb05SBarry Smith ierr = PetscMalloc1(m,&c->ilen);CHKERRQ(ierr); 4468071fcb05SBarry Smith ierr = PetscMemcpy(c->ilen,a->ilen,m*sizeof(PetscInt));CHKERRQ(ierr); 44693bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C, 2*m*sizeof(PetscInt));CHKERRQ(ierr); 447017ab2063SBarry Smith 447117ab2063SBarry Smith /* allocate the matrix space */ 4472f77e22a1SHong Zhang if (mallocmatspace) { 4473dcca6d9dSJed Brown ierr = PetscMalloc3(a->i[m],&c->a,a->i[m],&c->j,m+1,&c->i);CHKERRQ(ierr); 44743bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 44752205254eSKarl Rupp 4476f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 44772205254eSKarl Rupp 4478580bdb30SBarry Smith ierr = PetscArraycpy(c->i,a->i,m+1);CHKERRQ(ierr); 447917ab2063SBarry Smith 
if (m > 0) { 4480580bdb30SBarry Smith ierr = PetscArraycpy(c->j,a->j,a->i[m]);CHKERRQ(ierr); 4481be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 4482580bdb30SBarry Smith ierr = PetscArraycpy(c->a,a->a,a->i[m]);CHKERRQ(ierr); 4483be6bf707SBarry Smith } else { 4484580bdb30SBarry Smith ierr = PetscArrayzero(c->a,a->i[m]);CHKERRQ(ierr); 448517ab2063SBarry Smith } 448608480c60SBarry Smith } 4487f77e22a1SHong Zhang } 448817ab2063SBarry Smith 44896ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4490416022c9SBarry Smith c->roworiented = a->roworiented; 4491416022c9SBarry Smith c->nonew = a->nonew; 4492416022c9SBarry Smith if (a->diag) { 4493854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&c->diag);CHKERRQ(ierr); 4494071fcb05SBarry Smith ierr = PetscMemcpy(c->diag,a->diag,m*sizeof(PetscInt));CHKERRQ(ierr); 44953bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 4496071fcb05SBarry Smith } else c->diag = NULL; 44972205254eSKarl Rupp 44986ad4291fSHong Zhang c->solve_work = 0; 44996ad4291fSHong Zhang c->saved_values = 0; 45006ad4291fSHong Zhang c->idiag = 0; 450171f1c65dSBarry Smith c->ssor_work = 0; 4502a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4503e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4504e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 45056ad4291fSHong Zhang 4506893ad86cSHong Zhang c->rmax = a->rmax; 4507416022c9SBarry Smith c->nz = a->nz; 45088ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4509273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 4510754ec7b1SSatish Balay 45116ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 45126ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4513cd6b891eSBarry Smith if (a->compressedrow.use) { 45146ad4291fSHong Zhang i = a->compressedrow.nrows; 4515dcca6d9dSJed Brown ierr = PetscMalloc2(i+1,&c->compressedrow.i,i,&c->compressedrow.rindex);CHKERRQ(ierr); 
4516580bdb30SBarry Smith ierr = PetscArraycpy(c->compressedrow.i,a->compressedrow.i,i+1);CHKERRQ(ierr); 4517580bdb30SBarry Smith ierr = PetscArraycpy(c->compressedrow.rindex,a->compressedrow.rindex,i);CHKERRQ(ierr); 451827ea64f8SHong Zhang } else { 451927ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 45200298fd71SBarry Smith c->compressedrow.i = NULL; 45210298fd71SBarry Smith c->compressedrow.rindex = NULL; 45226ad4291fSHong Zhang } 4523ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4524e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 45254846f1f5SKris Buschelman 45262205254eSKarl Rupp ierr = MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C);CHKERRQ(ierr); 4527140e18c1SBarry Smith ierr = PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist);CHKERRQ(ierr); 45283a40ed3dSBarry Smith PetscFunctionReturn(0); 452917ab2063SBarry Smith } 453017ab2063SBarry Smith 4531b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 4532b24902e0SBarry Smith { 4533b24902e0SBarry Smith PetscErrorCode ierr; 4534b24902e0SBarry Smith 4535b24902e0SBarry Smith PetscFunctionBegin; 4536ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 45374b6263acSBarry Smith ierr = MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 4538cfd3f464SBarry Smith if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) { 453933d57670SJed Brown ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr); 4540cfd3f464SBarry Smith } 4541a54f2f98SBarry Smith ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 4542f77e22a1SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE);CHKERRQ(ierr); 4543b24902e0SBarry Smith PetscFunctionReturn(0); 4544b24902e0SBarry Smith } 4545b24902e0SBarry Smith 4546112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4547fbdbba38SShri Abhyankar { 454852f91c60SVaclav Hapla PetscBool 
isbinary, ishdf5; 454952f91c60SVaclav Hapla PetscErrorCode ierr; 455052f91c60SVaclav Hapla 455152f91c60SVaclav Hapla PetscFunctionBegin; 455252f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 455352f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 4554c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 4555c27b3999SVaclav Hapla ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 455652f91c60SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 455752f91c60SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5);CHKERRQ(ierr); 455852f91c60SVaclav Hapla if (isbinary) { 455952f91c60SVaclav Hapla ierr = MatLoad_SeqAIJ_Binary(newMat,viewer);CHKERRQ(ierr); 456052f91c60SVaclav Hapla } else if (ishdf5) { 456152f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 456252f91c60SVaclav Hapla ierr = MatLoad_AIJ_HDF5(newMat,viewer);CHKERRQ(ierr); 456352f91c60SVaclav Hapla #else 456452f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 456552f91c60SVaclav Hapla #endif 456652f91c60SVaclav Hapla } else { 456752f91c60SVaclav Hapla SETERRQ2(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 456852f91c60SVaclav Hapla } 456952f91c60SVaclav Hapla PetscFunctionReturn(0); 457052f91c60SVaclav Hapla } 457152f91c60SVaclav Hapla 45723ea6fe3dSLisandro Dalcin PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 457352f91c60SVaclav Hapla { 45743ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ*)mat->data; 4575fbdbba38SShri Abhyankar PetscErrorCode ierr; 45763ea6fe3dSLisandro Dalcin PetscInt header[4],*rowlens,M,N,nz,sum,rows,cols,i; 4577fbdbba38SShri Abhyankar 4578fbdbba38SShri Abhyankar 
PetscFunctionBegin; 45793ea6fe3dSLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 4580bbead8a2SBarry Smith 45813ea6fe3dSLisandro Dalcin /* read in matrix header */ 45823ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT);CHKERRQ(ierr); 45833ea6fe3dSLisandro Dalcin if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file"); 4584fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 45853ea6fe3dSLisandro Dalcin if (M < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%D) in file is negative",M); 45863ea6fe3dSLisandro Dalcin if (N < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%D) in file is negative",N); 4587bbead8a2SBarry Smith if (nz < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk, cannot load as SeqAIJ"); 4588fbdbba38SShri Abhyankar 45893ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 45903ea6fe3dSLisandro Dalcin ierr = MatLoad_Binary_BlockSizes(mat,viewer);CHKERRQ(ierr); 45913ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 45923ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 45933ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 45943ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 45953ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 45963ea6fe3dSLisandro Dalcin ierr = PetscLayoutSetUp(mat->rmap);CHKERRQ(ierr); 45973ea6fe3dSLisandro Dalcin ierr = PetscLayoutSetUp(mat->cmap);CHKERRQ(ierr); 45983ea6fe3dSLisandro Dalcin 45993ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 46003ea6fe3dSLisandro Dalcin ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr); 46013ea6fe3dSLisandro Dalcin if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of 
different sizes (%D, %D) than the input matrix (%D, %D)",M,N,rows,cols); 46023ea6fe3dSLisandro Dalcin 4603fbdbba38SShri Abhyankar /* read in row lengths */ 46043ea6fe3dSLisandro Dalcin ierr = PetscMalloc1(M,&rowlens);CHKERRQ(ierr); 46053ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,rowlens,M,NULL,PETSC_INT);CHKERRQ(ierr); 46063ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 46073ea6fe3dSLisandro Dalcin sum = 0; for (i=0; i<M; i++) sum += rowlens[i]; 46083ea6fe3dSLisandro Dalcin if (sum != nz) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Inconsistent matrix data in file: nonzeros = %D, sum-row-lengths = %D\n",nz,sum); 46093ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 46103ea6fe3dSLisandro Dalcin ierr = MatSeqAIJSetPreallocation_SeqAIJ(mat,0,rowlens);CHKERRQ(ierr); 46113ea6fe3dSLisandro Dalcin ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr); 461260e0710aSBarry Smith if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%D, %D) than the input matrix (%D, %D)",M,N,rows,cols); 46133ea6fe3dSLisandro Dalcin /* store row lengths */ 46143ea6fe3dSLisandro Dalcin ierr = PetscArraycpy(a->ilen,rowlens,M);CHKERRQ(ierr); 46153ea6fe3dSLisandro Dalcin ierr = PetscFree(rowlens);CHKERRQ(ierr); 4616fbdbba38SShri Abhyankar 46173ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 46183ea6fe3dSLisandro Dalcin a->i[0] = 0; for (i=0; i<M; i++) a->i[i+1] = a->i[i] + a->ilen[i]; 46193ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 46203ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,a->j,nz,NULL,PETSC_INT);CHKERRQ(ierr); 46213ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 46223ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,a->a,nz,NULL,PETSC_SCALAR);CHKERRQ(ierr); 4623fbdbba38SShri Abhyankar 46243ea6fe3dSLisandro Dalcin ierr = MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 46253ea6fe3dSLisandro Dalcin ierr = 
MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4626fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4627fbdbba38SShri Abhyankar } 4628fbdbba38SShri Abhyankar 4629ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 46307264ac53SSatish Balay { 46317264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*b = (Mat_SeqAIJ*)B->data; 4632dfbe8321SBarry Smith PetscErrorCode ierr; 4633eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4634eeffb40dSHong Zhang PetscInt k; 4635eeffb40dSHong Zhang #endif 46367264ac53SSatish Balay 46373a40ed3dSBarry Smith PetscFunctionBegin; 4638bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 4639d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 4640ca44d042SBarry Smith *flg = PETSC_FALSE; 4641ca44d042SBarry Smith PetscFunctionReturn(0); 4642bcd2baecSBarry Smith } 46437264ac53SSatish Balay 46447264ac53SSatish Balay /* if the a->i are the same */ 4645580bdb30SBarry Smith ierr = PetscArraycmp(a->i,b->i,A->rmap->n+1,flg);CHKERRQ(ierr); 4646abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 46477264ac53SSatish Balay 46487264ac53SSatish Balay /* if a->j are the same */ 4649580bdb30SBarry Smith ierr = PetscArraycmp(a->j,b->j,a->nz,flg);CHKERRQ(ierr); 4650abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 4651bcd2baecSBarry Smith 4652bcd2baecSBarry Smith /* if a->a are the same */ 4653eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4654eeffb40dSHong Zhang for (k=0; k<a->nz; k++) { 4655eeffb40dSHong Zhang if (PetscRealPart(a->a[k]) != PetscRealPart(b->a[k]) || PetscImaginaryPart(a->a[k]) != PetscImaginaryPart(b->a[k])) { 4656eeffb40dSHong Zhang *flg = PETSC_FALSE; 46573a40ed3dSBarry Smith PetscFunctionReturn(0); 4658eeffb40dSHong Zhang } 4659eeffb40dSHong Zhang } 4660eeffb40dSHong Zhang #else 4661580bdb30SBarry Smith ierr = PetscArraycmp(a->a,b->a,a->nz,flg);CHKERRQ(ierr); 4662eeffb40dSHong Zhang #endif 
4663eeffb40dSHong Zhang PetscFunctionReturn(0); 46647264ac53SSatish Balay } 466536db0b34SBarry Smith 466605869f15SSatish Balay /*@ 466736db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 466836db0b34SBarry Smith provided by the user. 466936db0b34SBarry Smith 4670d083f849SBarry Smith Collective 467136db0b34SBarry Smith 467236db0b34SBarry Smith Input Parameters: 467336db0b34SBarry Smith + comm - must be an MPI communicator of size 1 467436db0b34SBarry Smith . m - number of rows 467536db0b34SBarry Smith . n - number of columns 4676483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 467736db0b34SBarry Smith . j - column indices 467836db0b34SBarry Smith - a - matrix values 467936db0b34SBarry Smith 468036db0b34SBarry Smith Output Parameter: 468136db0b34SBarry Smith . mat - the matrix 468236db0b34SBarry Smith 468336db0b34SBarry Smith Level: intermediate 468436db0b34SBarry Smith 468536db0b34SBarry Smith Notes: 46860551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 4687292fb18eSBarry Smith once the matrix is destroyed and not before 468836db0b34SBarry Smith 468936db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 469036db0b34SBarry Smith 4691bfeeae90SHong Zhang The i and j indices are 0 based 469236db0b34SBarry Smith 4693a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 4694a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 46958eef79e4SBarry Smith as shown 4696a4552177SSatish Balay 46978eef79e4SBarry Smith $ 1 0 0 46988eef79e4SBarry Smith $ 2 0 3 46998eef79e4SBarry Smith $ 4 5 6 47008eef79e4SBarry Smith $ 47018eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 47028eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 47038eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 4704a4552177SSatish Balay 47059985e31cSBarry Smith 470669b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateMPIAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 470736db0b34SBarry Smith 470836db0b34SBarry Smith @*/ 4709c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat) 471036db0b34SBarry Smith { 4711dfbe8321SBarry Smith PetscErrorCode ierr; 4712cbcfb4deSHong Zhang PetscInt ii; 471336db0b34SBarry Smith Mat_SeqAIJ *aij; 4714cbcfb4deSHong Zhang PetscInt jj; 471536db0b34SBarry Smith 471636db0b34SBarry Smith PetscFunctionBegin; 471741096f02SStefano Zampini if (m > 0 && i[0]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 4718f69a0ea3SMatthew Knepley ierr = MatCreate(comm,mat);CHKERRQ(ierr); 4719f69a0ea3SMatthew Knepley ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 4720a2f3521dSMark F. 
Adams /* ierr = MatSetBlockSizes(*mat,,);CHKERRQ(ierr); */ 4721ab93d7beSBarry Smith ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 4722ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,0);CHKERRQ(ierr); 4723ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 4724071fcb05SBarry Smith ierr = PetscMalloc1(m,&aij->imax);CHKERRQ(ierr); 4725071fcb05SBarry Smith ierr = PetscMalloc1(m,&aij->ilen);CHKERRQ(ierr); 4726ab93d7beSBarry Smith 472736db0b34SBarry Smith aij->i = i; 472836db0b34SBarry Smith aij->j = j; 472936db0b34SBarry Smith aij->a = a; 473036db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 473136db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 4732e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 4733e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 473436db0b34SBarry Smith 473536db0b34SBarry Smith for (ii=0; ii<m; ii++) { 473636db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 473776bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 473860e0710aSBarry Smith if (i[ii+1] - i[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %D length = %D",ii,i[ii+1] - i[ii]); 47399985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 4740a061629eSStefano Zampini if (j[jj] < j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is not sorted",jj-i[ii],j[jj],ii); 4741a061629eSStefano Zampini if (j[jj] == j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is identical to previous entry",jj-i[ii],j[jj],ii); 47429985e31cSBarry Smith } 474336db0b34SBarry Smith } 474476bd3646SJed Brown } 474576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 474636db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 474760e0710aSBarry Smith if (j[ii] < 0) 
SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %D index = %D",ii,j[ii]); 474860e0710aSBarry Smith if (j[ii] > n - 1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %D index = %D",ii,j[ii]); 474936db0b34SBarry Smith } 475076bd3646SJed Brown } 475136db0b34SBarry Smith 4752b65db4caSBarry Smith ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4753b65db4caSBarry Smith ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 475436db0b34SBarry Smith PetscFunctionReturn(0); 475536db0b34SBarry Smith } 475680ef6e79SMatthew G Knepley /*@C 4757d021a1c5SVictor Minden MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format) 47588a0b0e6bSVictor Minden provided by the user. 47598a0b0e6bSVictor Minden 4760d083f849SBarry Smith Collective 47618a0b0e6bSVictor Minden 47628a0b0e6bSVictor Minden Input Parameters: 47638a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 47648a0b0e6bSVictor Minden . m - number of rows 47658a0b0e6bSVictor Minden . n - number of columns 47668a0b0e6bSVictor Minden . i - row indices 47678a0b0e6bSVictor Minden . j - column indices 47681230e6d1SVictor Minden . a - matrix values 47691230e6d1SVictor Minden . nz - number of nonzeros 47701230e6d1SVictor Minden - idx - 0 or 1 based 47718a0b0e6bSVictor Minden 47728a0b0e6bSVictor Minden Output Parameter: 47738a0b0e6bSVictor Minden . mat - the matrix 47748a0b0e6bSVictor Minden 47758a0b0e6bSVictor Minden Level: intermediate 47768a0b0e6bSVictor Minden 47778a0b0e6bSVictor Minden Notes: 47788a0b0e6bSVictor Minden The i and j indices are 0 based 47798a0b0e6bSVictor Minden 47808a0b0e6bSVictor Minden The format which is used for the sparse matrix input, is equivalent to a 47818a0b0e6bSVictor Minden row-major ordering.. 
i.e for the following matrix, the input data expected is 47828a0b0e6bSVictor Minden as shown: 47838a0b0e6bSVictor Minden 47848a0b0e6bSVictor Minden 1 0 0 47858a0b0e6bSVictor Minden 2 0 3 47868a0b0e6bSVictor Minden 4 5 6 47878a0b0e6bSVictor Minden 47888a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 47898a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 47908a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 47918a0b0e6bSVictor Minden 47928a0b0e6bSVictor Minden 479369b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateSeqAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 47948a0b0e6bSVictor Minden 47958a0b0e6bSVictor Minden @*/ 4796c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat,PetscInt nz,PetscBool idx) 47978a0b0e6bSVictor Minden { 47988a0b0e6bSVictor Minden PetscErrorCode ierr; 4799d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1,row,col; 48008a0b0e6bSVictor Minden 48018a0b0e6bSVictor Minden 48028a0b0e6bSVictor Minden PetscFunctionBegin; 48031795a4d1SJed Brown ierr = PetscCalloc1(m,&nnz);CHKERRQ(ierr); 48041230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 4805c8d679ebSHong Zhang nnz[i[ii] - !!idx] += 1; 48061230e6d1SVictor Minden } 48078a0b0e6bSVictor Minden ierr = MatCreate(comm,mat);CHKERRQ(ierr); 48088a0b0e6bSVictor Minden ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 48098a0b0e6bSVictor Minden ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 48101230e6d1SVictor Minden ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz);CHKERRQ(ierr); 48111230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 48121230e6d1SVictor Minden if (idx) { 48131230e6d1SVictor Minden row = i[ii] - 1; 48141230e6d1SVictor Minden col = j[ii] - 1; 48151230e6d1SVictor Minden } else { 48161230e6d1SVictor Minden row = i[ii]; 48171230e6d1SVictor Minden col = j[ii]; 48188a0b0e6bSVictor Minden } 48191230e6d1SVictor Minden ierr = 
MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES);CHKERRQ(ierr); 48208a0b0e6bSVictor Minden } 48218a0b0e6bSVictor Minden ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 48228a0b0e6bSVictor Minden ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4823d021a1c5SVictor Minden ierr = PetscFree(nnz);CHKERRQ(ierr); 48248a0b0e6bSVictor Minden PetscFunctionReturn(0); 48258a0b0e6bSVictor Minden } 482636db0b34SBarry Smith 4827acf2f550SJed Brown PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 4828acf2f550SJed Brown { 4829acf2f550SJed Brown Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data; 4830acf2f550SJed Brown PetscErrorCode ierr; 4831acf2f550SJed Brown 4832acf2f550SJed Brown PetscFunctionBegin; 4833acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 4834acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 48352205254eSKarl Rupp 4836acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal_Inode(A);CHKERRQ(ierr); 4837acf2f550SJed Brown PetscFunctionReturn(0); 4838acf2f550SJed Brown } 4839acf2f550SJed Brown 48409c8f2541SHong Zhang PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 48419c8f2541SHong Zhang { 48429c8f2541SHong Zhang PetscErrorCode ierr; 48438761c3d6SHong Zhang PetscMPIInt size; 48449c8f2541SHong Zhang 48459c8f2541SHong Zhang PetscFunctionBegin; 48468761c3d6SHong Zhang ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 48477bbdc51dSHong Zhang if (size == 1) { 48487bbdc51dSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 48497bbdc51dSHong Zhang ierr = MatDuplicate(inmat,MAT_COPY_VALUES,outmat);CHKERRQ(ierr); 48507bbdc51dSHong Zhang } else { 48518761c3d6SHong Zhang ierr = MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 48527bbdc51dSHong Zhang } 48538761c3d6SHong Zhang } else { 48549c8f2541SHong Zhang ierr = MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm,inmat,n,scall,outmat);CHKERRQ(ierr); 48558761c3d6SHong Zhang } 48569c8f2541SHong Zhang PetscFunctionReturn(0); 48579c8f2541SHong Zhang } 
48589c8f2541SHong Zhang 485981824310SBarry Smith /* 486053dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 486153dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 486253dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 486353dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 486453dd7562SDmitry Karpeev */ 486553dd7562SDmitry Karpeev PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B) 486653dd7562SDmitry Karpeev { 486753dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 486853dd7562SDmitry Karpeev PetscErrorCode ierr; 486953dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 487053dd7562SDmitry Karpeev PetscBool seqaij; 487153dd7562SDmitry Karpeev PetscInt m,n,*nz,i,j,count; 487253dd7562SDmitry Karpeev PetscScalar v; 487353dd7562SDmitry Karpeev const PetscInt *rowindices,*colindices; 487453dd7562SDmitry Karpeev 487553dd7562SDmitry Karpeev PetscFunctionBegin; 487653dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 487753dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 48784099cc6bSBarry Smith ierr = PetscObjectBaseTypeCompare((PetscObject)B,MATSEQAIJ,&seqaij);CHKERRQ(ierr); 487953dd7562SDmitry Karpeev if (!seqaij) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is of wrong type"); 488053dd7562SDmitry Karpeev if (rowemb) { 488153dd7562SDmitry Karpeev ierr = ISGetLocalSize(rowemb,&m);CHKERRQ(ierr); 488253dd7562SDmitry Karpeev if (m != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Row IS of size %D is incompatible with matrix row size %D",m,B->rmap->n); 488353dd7562SDmitry Karpeev } else { 48846c4ed002SBarry Smith if (C->rmap->n != B->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is row-incompatible with the target matrix"); 488553dd7562SDmitry Karpeev } 488653dd7562SDmitry Karpeev if (colemb) { 488753dd7562SDmitry Karpeev ierr = ISGetLocalSize(colemb,&n);CHKERRQ(ierr); 488853dd7562SDmitry Karpeev if (n != B->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diag col IS of size %D is incompatible with input matrix col size %D",n,B->cmap->n); 488953dd7562SDmitry Karpeev } else { 489053dd7562SDmitry Karpeev if (C->cmap->n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is col-incompatible with the target matrix"); 489153dd7562SDmitry Karpeev } 489253dd7562SDmitry Karpeev 489353dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ*)(B->data); 489453dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 489553dd7562SDmitry Karpeev ierr = PetscMalloc1(B->rmap->n,&nz);CHKERRQ(ierr); 489653dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 489753dd7562SDmitry Karpeev nz[i] = Baij->i[i+1] - Baij->i[i]; 489853dd7562SDmitry Karpeev } 489953dd7562SDmitry Karpeev ierr = MatSeqAIJSetPreallocation(C,0,nz);CHKERRQ(ierr); 490053dd7562SDmitry Karpeev ierr = PetscFree(nz);CHKERRQ(ierr); 490153dd7562SDmitry Karpeev } 490253dd7562SDmitry Karpeev if (pattern == SUBSET_NONZERO_PATTERN) { 490353dd7562SDmitry Karpeev ierr = MatZeroEntries(C);CHKERRQ(ierr); 490453dd7562SDmitry Karpeev } 490553dd7562SDmitry 
Karpeev count = 0; 490653dd7562SDmitry Karpeev rowindices = NULL; 490753dd7562SDmitry Karpeev colindices = NULL; 490853dd7562SDmitry Karpeev if (rowemb) { 490953dd7562SDmitry Karpeev ierr = ISGetIndices(rowemb,&rowindices);CHKERRQ(ierr); 491053dd7562SDmitry Karpeev } 491153dd7562SDmitry Karpeev if (colemb) { 491253dd7562SDmitry Karpeev ierr = ISGetIndices(colemb,&colindices);CHKERRQ(ierr); 491353dd7562SDmitry Karpeev } 491453dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 491553dd7562SDmitry Karpeev PetscInt row; 491653dd7562SDmitry Karpeev row = i; 491753dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 491853dd7562SDmitry Karpeev for (j=Baij->i[i]; j<Baij->i[i+1]; j++) { 491953dd7562SDmitry Karpeev PetscInt col; 492053dd7562SDmitry Karpeev col = Baij->j[count]; 492153dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 492253dd7562SDmitry Karpeev v = Baij->a[count]; 492353dd7562SDmitry Karpeev ierr = MatSetValues(C,1,&row,1,&col,&v,INSERT_VALUES);CHKERRQ(ierr); 492453dd7562SDmitry Karpeev ++count; 492553dd7562SDmitry Karpeev } 492653dd7562SDmitry Karpeev } 492753dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 492853dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 492953dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 493053dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 493153dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 493253dd7562SDmitry Karpeev PetscFunctionReturn(0); 493353dd7562SDmitry Karpeev } 493453dd7562SDmitry Karpeev 49354099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 49364099cc6bSBarry Smith 49374099cc6bSBarry Smith /*@C 49384099cc6bSBarry Smith MatSeqAIJSetType - Converts a MATSEQAIJ matrix to a subtype 49394099cc6bSBarry Smith 49404099cc6bSBarry Smith Collective on Mat 49414099cc6bSBarry Smith 49424099cc6bSBarry Smith Input Parameters: 49434099cc6bSBarry Smith + mat - the matrix object 49444099cc6bSBarry Smith - matype - matrix type 49454099cc6bSBarry Smith 49464099cc6bSBarry Smith Options Database Key: 49474099cc6bSBarry Smith . -mat_seqai_type <method> - for example seqaijcrl 49484099cc6bSBarry Smith 49494099cc6bSBarry Smith 49504099cc6bSBarry Smith Level: intermediate 49514099cc6bSBarry Smith 49524099cc6bSBarry Smith .seealso: PCSetType(), VecSetType(), MatCreate(), MatType, Mat 49534099cc6bSBarry Smith @*/ 49544099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 49554099cc6bSBarry Smith { 4956fd9d3c67SJed Brown PetscErrorCode ierr,(*r)(Mat,MatType,MatReuse,Mat*); 49574099cc6bSBarry Smith PetscBool sametype; 49584099cc6bSBarry Smith 49594099cc6bSBarry Smith PetscFunctionBegin; 49604099cc6bSBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 49614099cc6bSBarry Smith ierr = PetscObjectTypeCompare((PetscObject)mat,matype,&sametype);CHKERRQ(ierr); 49624099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 49634099cc6bSBarry Smith 49644099cc6bSBarry Smith ierr = PetscFunctionListFind(MatSeqAIJList,matype,&r);CHKERRQ(ierr); 49654099cc6bSBarry Smith if (!r) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown Mat type given: %s",matype); 49664099cc6bSBarry Smith ierr = (*r)(mat,matype,MAT_INPLACE_MATRIX,&mat);CHKERRQ(ierr); 49674099cc6bSBarry 
Smith PetscFunctionReturn(0); 49684099cc6bSBarry Smith } 49694099cc6bSBarry Smith 49704099cc6bSBarry Smith 49714099cc6bSBarry Smith /*@C 49724099cc6bSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential AIJ matrices 49734099cc6bSBarry Smith 49744099cc6bSBarry Smith Not Collective 49754099cc6bSBarry Smith 49764099cc6bSBarry Smith Input Parameters: 49774099cc6bSBarry Smith + name - name of a new user-defined matrix type, for example MATSEQAIJCRL 49784099cc6bSBarry Smith - function - routine to convert to subtype 49794099cc6bSBarry Smith 49804099cc6bSBarry Smith Notes: 49814099cc6bSBarry Smith MatSeqAIJRegister() may be called multiple times to add several user-defined solvers. 49824099cc6bSBarry Smith 49834099cc6bSBarry Smith 49844099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 49854099cc6bSBarry Smith $ -mat_seqaij_type my_mat 49864099cc6bSBarry Smith 49874099cc6bSBarry Smith Level: advanced 49884099cc6bSBarry Smith 49894099cc6bSBarry Smith .seealso: MatSeqAIJRegisterAll() 49904099cc6bSBarry Smith 49914099cc6bSBarry Smith 49924099cc6bSBarry Smith Level: advanced 49934099cc6bSBarry Smith @*/ 4994388d47a6SSatish Balay PetscErrorCode MatSeqAIJRegister(const char sname[],PetscErrorCode (*function)(Mat,MatType,MatReuse,Mat *)) 49954099cc6bSBarry Smith { 49964099cc6bSBarry Smith PetscErrorCode ierr; 49974099cc6bSBarry Smith 49984099cc6bSBarry Smith PetscFunctionBegin; 49999cc31a68SJed Brown ierr = MatInitializePackage();CHKERRQ(ierr); 50004099cc6bSBarry Smith ierr = PetscFunctionListAdd(&MatSeqAIJList,sname,function);CHKERRQ(ierr); 50014099cc6bSBarry Smith PetscFunctionReturn(0); 50024099cc6bSBarry Smith } 50034099cc6bSBarry Smith 50044099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 50054099cc6bSBarry Smith 50064099cc6bSBarry Smith /*@C 50074099cc6bSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of SeqAIJ 50084099cc6bSBarry Smith 
50094099cc6bSBarry Smith Not Collective 50104099cc6bSBarry Smith 50114099cc6bSBarry Smith Level: advanced 50124099cc6bSBarry Smith 50134099cc6bSBarry Smith Developers Note: CUSP and CUSPARSE do not yet support the MatConvert_SeqAIJ..() paradigm and thus cannot be registered here 50144099cc6bSBarry Smith 50154099cc6bSBarry Smith .seealso: MatRegisterAll(), MatSeqAIJRegister() 50164099cc6bSBarry Smith @*/ 50174099cc6bSBarry Smith PetscErrorCode MatSeqAIJRegisterAll(void) 50184099cc6bSBarry Smith { 50194099cc6bSBarry Smith PetscErrorCode ierr; 50204099cc6bSBarry Smith 50214099cc6bSBarry Smith PetscFunctionBegin; 50224099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 50234099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 50244099cc6bSBarry Smith 50254099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 50264099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 50274dfdc2d9SRichard Tran Mills ierr = MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr); 50289779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 50296b62b571SRichard Tran Mills ierr = MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr); 5030485f9817SRichard Tran Mills #endif 50314099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 50324099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL);CHKERRQ(ierr); 50334099cc6bSBarry Smith #endif 50344099cc6bSBarry Smith PetscFunctionReturn(0); 50354099cc6bSBarry Smith } 503653dd7562SDmitry Karpeev 503753dd7562SDmitry Karpeev /* 503881824310SBarry Smith Special version for direct calls from Fortran 503981824310SBarry Smith */ 5040af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 504181824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 504281824310SBarry Smith #define matsetvaluesseqaij_ 
MATSETVALUESSEQAIJ 504381824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 504481824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 504581824310SBarry Smith #endif 504681824310SBarry Smith 504781824310SBarry Smith /* Change these macros so can be used in void function */ 504881824310SBarry Smith #undef CHKERRQ 5049ce94432eSBarry Smith #define CHKERRQ(ierr) CHKERRABORT(PetscObjectComm((PetscObject)A),ierr) 505081824310SBarry Smith #undef SETERRQ2 5051e32f2f54SBarry Smith #define SETERRQ2(comm,ierr,b,c,d) CHKERRABORT(comm,ierr) 50524994cf47SJed Brown #undef SETERRQ3 50534994cf47SJed Brown #define SETERRQ3(comm,ierr,b,c,d,e) CHKERRABORT(comm,ierr) 505481824310SBarry Smith 505519caf8f3SSatish Balay PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 505681824310SBarry Smith { 505781824310SBarry Smith Mat A = *AA; 505881824310SBarry Smith PetscInt m = *mm, n = *nn; 505981824310SBarry Smith InsertMode is = *isis; 506081824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 506181824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 506281824310SBarry Smith PetscInt *imax,*ai,*ailen; 506381824310SBarry Smith PetscErrorCode ierr; 506481824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 506554f21887SBarry Smith MatScalar *ap,value,*aa; 5066ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5067ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 506881824310SBarry Smith 506981824310SBarry Smith PetscFunctionBegin; 50704994cf47SJed Brown MatCheckPreallocated(A,1); 507181824310SBarry Smith imax = a->imax; 507281824310SBarry Smith ai = a->i; 507381824310SBarry Smith ailen = a->ilen; 507481824310SBarry Smith aj = a->j; 507581824310SBarry Smith aa = a->a; 507681824310SBarry Smith 507781824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 
507881824310SBarry Smith row = im[k]; 507981824310SBarry Smith if (row < 0) continue; 5080cf9c20a2SJed Brown if (PetscUnlikelyDebug(row >= A->rmap->n)) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 508181824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 508281824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 508381824310SBarry Smith low = 0; 508481824310SBarry Smith high = nrow; 508581824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 508681824310SBarry Smith if (in[l] < 0) continue; 5087cf9c20a2SJed Brown if (PetscUnlikelyDebug(in[l] >= A->cmap->n)) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 508881824310SBarry Smith col = in[l]; 50892205254eSKarl Rupp if (roworiented) value = v[l + k*n]; 50902205254eSKarl Rupp else value = v[k + l*m]; 50912205254eSKarl Rupp 509281824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 509381824310SBarry Smith 50942205254eSKarl Rupp if (col <= lastcol) low = 0; 50952205254eSKarl Rupp else high = nrow; 509681824310SBarry Smith lastcol = col; 509781824310SBarry Smith while (high-low > 5) { 509881824310SBarry Smith t = (low+high)/2; 509981824310SBarry Smith if (rp[t] > col) high = t; 510081824310SBarry Smith else low = t; 510181824310SBarry Smith } 510281824310SBarry Smith for (i=low; i<high; i++) { 510381824310SBarry Smith if (rp[i] > col) break; 510481824310SBarry Smith if (rp[i] == col) { 510581824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 510681824310SBarry Smith else ap[i] = value; 510781824310SBarry Smith goto noinsert; 510881824310SBarry Smith } 510981824310SBarry Smith } 511081824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 511181824310SBarry Smith if (nonew == 1) goto noinsert; 5112ce94432eSBarry Smith if (nonew == -1) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 
5113fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 511481824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 511581824310SBarry Smith /* shift up all the later entries in this row */ 511681824310SBarry Smith for (ii=N; ii>=i; ii--) { 511781824310SBarry Smith rp[ii+1] = rp[ii]; 511881824310SBarry Smith ap[ii+1] = ap[ii]; 511981824310SBarry Smith } 512081824310SBarry Smith rp[i] = col; 512181824310SBarry Smith ap[i] = value; 5122e56f5c9eSBarry Smith A->nonzerostate++; 512381824310SBarry Smith noinsert:; 512481824310SBarry Smith low = i + 1; 512581824310SBarry Smith } 512681824310SBarry Smith ailen[row] = nrow; 512781824310SBarry Smith } 512881824310SBarry Smith PetscFunctionReturnVoid(); 512981824310SBarry Smith } 5130