1d5d45c9bSBarry Smith /* 23369ce9aSBarry Smith Defines the basic matrix operations for the AIJ (compressed row) 3d5d45c9bSBarry Smith matrix storage format. 4d5d45c9bSBarry Smith */ 53369ce9aSBarry Smith 67c4f633dSBarry Smith 7c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/ 8c6db04a5SJed Brown #include <petscblaslapack.h> 9c6db04a5SJed Brown #include <petscbt.h> 10af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h> 110716a85fSBarry Smith 124099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A) 134099cc6bSBarry Smith { 144099cc6bSBarry Smith PetscErrorCode ierr; 154099cc6bSBarry Smith PetscBool flg; 164099cc6bSBarry Smith char type[256]; 174099cc6bSBarry Smith 184099cc6bSBarry Smith PetscFunctionBegin; 194099cc6bSBarry Smith ierr = PetscObjectOptionsBegin((PetscObject)A); 204099cc6bSBarry Smith ierr = PetscOptionsFList("-mat_seqaij_type","Matrix SeqAIJ type","MatSeqAIJSetType",MatSeqAIJList,"seqaij",type,256,&flg);CHKERRQ(ierr); 214099cc6bSBarry Smith if (flg) { 224099cc6bSBarry Smith ierr = MatSeqAIJSetType(A,type);CHKERRQ(ierr); 234099cc6bSBarry Smith } 244099cc6bSBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 254099cc6bSBarry Smith PetscFunctionReturn(0); 264099cc6bSBarry Smith } 274099cc6bSBarry Smith 280716a85fSBarry Smith PetscErrorCode MatGetColumnNorms_SeqAIJ(Mat A,NormType type,PetscReal *norms) 290716a85fSBarry Smith { 300716a85fSBarry Smith PetscErrorCode ierr; 310716a85fSBarry Smith PetscInt i,m,n; 320716a85fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data; 330716a85fSBarry Smith 340716a85fSBarry Smith PetscFunctionBegin; 350716a85fSBarry Smith ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr); 36580bdb30SBarry Smith ierr = PetscArrayzero(norms,n);CHKERRQ(ierr); 370716a85fSBarry Smith if (type == NORM_2) { 380716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 390716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]); 400716a85fSBarry Smith } 410716a85fSBarry Smith } 
else if (type == NORM_1) { 420716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 430716a85fSBarry Smith norms[aij->j[i]] += PetscAbsScalar(aij->a[i]); 440716a85fSBarry Smith } 450716a85fSBarry Smith } else if (type == NORM_INFINITY) { 460716a85fSBarry Smith for (i=0; i<aij->i[m]; i++) { 470716a85fSBarry Smith norms[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),norms[aij->j[i]]); 480716a85fSBarry Smith } 490716a85fSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown NormType"); 500716a85fSBarry Smith 510716a85fSBarry Smith if (type == NORM_2) { 528f1a2a5eSBarry Smith for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]); 530716a85fSBarry Smith } 540716a85fSBarry Smith PetscFunctionReturn(0); 550716a85fSBarry Smith } 560716a85fSBarry Smith 573a062f41SBarry Smith PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS *is) 583a062f41SBarry Smith { 593a062f41SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 603a062f41SBarry Smith PetscInt i,m=A->rmap->n,cnt = 0, bs = A->rmap->bs; 613a062f41SBarry Smith const PetscInt *jj = a->j,*ii = a->i; 623a062f41SBarry Smith PetscInt *rows; 633a062f41SBarry Smith PetscErrorCode ierr; 643a062f41SBarry Smith 653a062f41SBarry Smith PetscFunctionBegin; 663a062f41SBarry Smith for (i=0; i<m; i++) { 673a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 683a062f41SBarry Smith cnt++; 693a062f41SBarry Smith } 703a062f41SBarry Smith } 713a062f41SBarry Smith ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr); 723a062f41SBarry Smith cnt = 0; 733a062f41SBarry Smith for (i=0; i<m; i++) { 743a062f41SBarry Smith if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) { 753a062f41SBarry Smith rows[cnt] = i; 763a062f41SBarry Smith cnt++; 773a062f41SBarry Smith } 783a062f41SBarry Smith } 793a062f41SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,is);CHKERRQ(ierr); 803a062f41SBarry Smith 
PetscFunctionReturn(0); 813a062f41SBarry Smith } 823a062f41SBarry Smith 83f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt *nrows,PetscInt **zrows) 846ce1633cSBarry Smith { 856ce1633cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 866ce1633cSBarry Smith const MatScalar *aa = a->a; 876ce1633cSBarry Smith PetscInt i,m=A->rmap->n,cnt = 0; 88b2db7409Sstefano_zampini const PetscInt *ii = a->i,*jj = a->j,*diag; 896ce1633cSBarry Smith PetscInt *rows; 906ce1633cSBarry Smith PetscErrorCode ierr; 916ce1633cSBarry Smith 926ce1633cSBarry Smith PetscFunctionBegin; 936ce1633cSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 946ce1633cSBarry Smith diag = a->diag; 956ce1633cSBarry Smith for (i=0; i<m; i++) { 96b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 976ce1633cSBarry Smith cnt++; 986ce1633cSBarry Smith } 996ce1633cSBarry Smith } 100785e854fSJed Brown ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr); 1016ce1633cSBarry Smith cnt = 0; 1026ce1633cSBarry Smith for (i=0; i<m; i++) { 103b2db7409Sstefano_zampini if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) { 1046ce1633cSBarry Smith rows[cnt++] = i; 1056ce1633cSBarry Smith } 1066ce1633cSBarry Smith } 107f1f41ecbSJed Brown *nrows = cnt; 108f1f41ecbSJed Brown *zrows = rows; 109f1f41ecbSJed Brown PetscFunctionReturn(0); 110f1f41ecbSJed Brown } 111f1f41ecbSJed Brown 112f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows) 113f1f41ecbSJed Brown { 114f1f41ecbSJed Brown PetscInt nrows,*rows; 115f1f41ecbSJed Brown PetscErrorCode ierr; 116f1f41ecbSJed Brown 117f1f41ecbSJed Brown PetscFunctionBegin; 1180298fd71SBarry Smith *zrows = NULL; 119f1f41ecbSJed Brown ierr = MatFindZeroDiagonals_SeqAIJ_Private(A,&nrows,&rows);CHKERRQ(ierr); 120ce94432eSBarry Smith ierr = ISCreateGeneral(PetscObjectComm((PetscObject)A),nrows,rows,PETSC_OWN_POINTER,zrows);CHKERRQ(ierr); 1216ce1633cSBarry Smith 
PetscFunctionReturn(0); 1226ce1633cSBarry Smith } 1236ce1633cSBarry Smith 124b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows) 125b3a44c85SBarry Smith { 126b3a44c85SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 127b3a44c85SBarry Smith const MatScalar *aa; 128b3a44c85SBarry Smith PetscInt m=A->rmap->n,cnt = 0; 129b3a44c85SBarry Smith const PetscInt *ii; 130b3a44c85SBarry Smith PetscInt n,i,j,*rows; 131b3a44c85SBarry Smith PetscErrorCode ierr; 132b3a44c85SBarry Smith 133b3a44c85SBarry Smith PetscFunctionBegin; 134b3a44c85SBarry Smith *keptrows = 0; 135b3a44c85SBarry Smith ii = a->i; 136b3a44c85SBarry Smith for (i=0; i<m; i++) { 137b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 138b3a44c85SBarry Smith if (!n) { 139b3a44c85SBarry Smith cnt++; 140b3a44c85SBarry Smith goto ok1; 141b3a44c85SBarry Smith } 142b3a44c85SBarry Smith aa = a->a + ii[i]; 143b3a44c85SBarry Smith for (j=0; j<n; j++) { 144b3a44c85SBarry Smith if (aa[j] != 0.0) goto ok1; 145b3a44c85SBarry Smith } 146b3a44c85SBarry Smith cnt++; 147b3a44c85SBarry Smith ok1:; 148b3a44c85SBarry Smith } 149b3a44c85SBarry Smith if (!cnt) PetscFunctionReturn(0); 150854ce69bSBarry Smith ierr = PetscMalloc1(A->rmap->n-cnt,&rows);CHKERRQ(ierr); 151b3a44c85SBarry Smith cnt = 0; 152b3a44c85SBarry Smith for (i=0; i<m; i++) { 153b3a44c85SBarry Smith n = ii[i+1] - ii[i]; 154b3a44c85SBarry Smith if (!n) continue; 155b3a44c85SBarry Smith aa = a->a + ii[i]; 156b3a44c85SBarry Smith for (j=0; j<n; j++) { 157b3a44c85SBarry Smith if (aa[j] != 0.0) { 158b3a44c85SBarry Smith rows[cnt++] = i; 159b3a44c85SBarry Smith break; 160b3a44c85SBarry Smith } 161b3a44c85SBarry Smith } 162b3a44c85SBarry Smith } 163b3a44c85SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows);CHKERRQ(ierr); 164b3a44c85SBarry Smith PetscFunctionReturn(0); 165b3a44c85SBarry Smith } 166b3a44c85SBarry Smith 1677087cfbeSBarry Smith PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is) 
16879299369SBarry Smith { 16979299369SBarry Smith PetscErrorCode ierr; 17079299369SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) Y->data; 17199e65526SBarry Smith PetscInt i,m = Y->rmap->n; 17299e65526SBarry Smith const PetscInt *diag; 17354f21887SBarry Smith MatScalar *aa = aij->a; 17499e65526SBarry Smith const PetscScalar *v; 175ace3abfcSBarry Smith PetscBool missing; 176837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 177837a59e1SRichard Tran Mills PetscBool inserted = PETSC_FALSE; 178837a59e1SRichard Tran Mills #endif 17979299369SBarry Smith 18079299369SBarry Smith PetscFunctionBegin; 18109f38230SBarry Smith if (Y->assembled) { 1820298fd71SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(Y,&missing,NULL);CHKERRQ(ierr); 18309f38230SBarry Smith if (!missing) { 18479299369SBarry Smith diag = aij->diag; 18599e65526SBarry Smith ierr = VecGetArrayRead(D,&v);CHKERRQ(ierr); 18679299369SBarry Smith if (is == INSERT_VALUES) { 187837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 188837a59e1SRichard Tran Mills inserted = PETSC_TRUE; 189837a59e1SRichard Tran Mills #endif 19079299369SBarry Smith for (i=0; i<m; i++) { 19179299369SBarry Smith aa[diag[i]] = v[i]; 19279299369SBarry Smith } 19379299369SBarry Smith } else { 19479299369SBarry Smith for (i=0; i<m; i++) { 195837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 196837a59e1SRichard Tran Mills if (v[i] != 0.0) inserted = PETSC_TRUE; 197837a59e1SRichard Tran Mills #endif 19879299369SBarry Smith aa[diag[i]] += v[i]; 19979299369SBarry Smith } 20079299369SBarry Smith } 201837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 202837a59e1SRichard Tran Mills if (inserted) Y->offloadmask = PETSC_OFFLOAD_CPU; 203837a59e1SRichard Tran Mills #endif 20499e65526SBarry Smith ierr = VecRestoreArrayRead(D,&v);CHKERRQ(ierr); 20579299369SBarry Smith PetscFunctionReturn(0); 20679299369SBarry Smith 
} 207acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr); 20809f38230SBarry Smith } 20909f38230SBarry Smith ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr); 21009f38230SBarry Smith PetscFunctionReturn(0); 21109f38230SBarry Smith } 21279299369SBarry Smith 2131a83f524SJed Brown PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 21417ab2063SBarry Smith { 215416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 216dfbe8321SBarry Smith PetscErrorCode ierr; 21797f1f81fSBarry Smith PetscInt i,ishift; 21817ab2063SBarry Smith 2193a40ed3dSBarry Smith PetscFunctionBegin; 220d0f46423SBarry Smith *m = A->rmap->n; 2213a40ed3dSBarry Smith if (!ia) PetscFunctionReturn(0); 222bfeeae90SHong Zhang ishift = 0; 22353e63a63SBarry Smith if (symmetric && !A->structurally_symmetric) { 2242462f5fdSStefano Zampini ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,ishift,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr); 225bfeeae90SHong Zhang } else if (oshift == 1) { 2261a83f524SJed Brown PetscInt *tia; 227d0f46423SBarry Smith PetscInt nz = a->i[A->rmap->n]; 2283b2fbd54SBarry Smith /* malloc space and add 1 to i and j indices */ 229854ce69bSBarry Smith ierr = PetscMalloc1(A->rmap->n+1,&tia);CHKERRQ(ierr); 2301a83f524SJed Brown for (i=0; i<A->rmap->n+1; i++) tia[i] = a->i[i] + 1; 2311a83f524SJed Brown *ia = tia; 232ecc77c7aSBarry Smith if (ja) { 2331a83f524SJed Brown PetscInt *tja; 234854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&tja);CHKERRQ(ierr); 2351a83f524SJed Brown for (i=0; i<nz; i++) tja[i] = a->j[i] + 1; 2361a83f524SJed Brown *ja = tja; 237ecc77c7aSBarry Smith } 2386945ee14SBarry Smith } else { 239ecc77c7aSBarry Smith *ia = a->i; 240ecc77c7aSBarry Smith if (ja) *ja = a->j; 241a2ce50c7SBarry Smith } 2423a40ed3dSBarry Smith PetscFunctionReturn(0); 243a2744918SBarry Smith } 244a2744918SBarry Smith 2451a83f524SJed Brown 
/*
   MatRestoreRowIJ_SeqAIJ - Releases the arrays handed out by MatGetRowIJ_SeqAIJ().

   Input Parameters:
+  A               - the matrix
.  oshift          - the shift that was passed to the matching Get call
.  symmetric       - the flag that was passed to the matching Get call
.  inodecompressed - not used by this routine
.  n               - not used by this routine
.  ia              - row offsets; nothing is done when this argument is NULL
.  ja              - column indices (optional)
-  done            - not used by this routine

   *ia and *ja are freed only when symmetric is set on a matrix not flagged structurally
   symmetric, or when oshift == 1; in every other case nothing is freed.
*/
PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool  *done)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  if (!ia) PetscFunctionReturn(0);
  if ((symmetric && !A->structurally_symmetric) || oshift == 1) {
    ierr = PetscFree(*ia);CHKERRQ(ierr);
    if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);}
  }
  PetscFunctionReturn(0);
}

/*
   MatGetColumnIJ_SeqAIJ - Builds a column-oriented index structure of the matrix.

   Input Parameters:
+  A               - the matrix
.  oshift          - index shift applied to the produced offsets and row indices
.  symmetric       - when set, the arrays come from MatToSymmetricIJ_SeqAIJ() instead
.  inodecompressed - not used by this routine
-  done            - not used by this routine

   Output Parameters:
+  nn - number of local columns (always set)
.  ia - column offsets, n+1 entries; nothing more is done when this argument is NULL
-  ja - row indices grouped by column, nz entries

   In the non-symmetric case the entries per column are counted, a prefix sum gives the
   column offsets, and a second sweep over the rows scatters each row index into its
   column. Both arrays are newly allocated and are freed by MatRestoreColumnIJ_SeqAIJ().
*/
PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool  *done)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscErrorCode ierr;
  PetscInt       i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n;
  PetscInt       nz = a->i[m],row,*jj,mr,col;

  PetscFunctionBegin;
  *nn = n;
  if (!ia) PetscFunctionReturn(0);
  if (symmetric) {
    ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,0,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr);
  } else {
    ierr = PetscCalloc1(n,&collengths);CHKERRQ(ierr);
    ierr = PetscMalloc1(n+1,&cia);CHKERRQ(ierr);
    ierr = PetscMalloc1(nz,&cja);CHKERRQ(ierr);
    jj   = a->j;
    for (i=0; i<nz; i++) {
      collengths[jj[i]]++;
    }
    cia[0] = oshift;
    for (i=0; i<n; i++) {
      cia[i+1] = cia[i] + collengths[i];
    }
    /* collengths is reused below as the per-column fill position */
    ierr = PetscArrayzero(collengths,n);CHKERRQ(ierr);
    jj   = a->j;
    for (row=0; row<m; row++) {
      mr = a->i[row+1] - a->i[row];
      for (i=0; i<mr; i++) {
        col = *jj++;

        cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
      }
    }
    ierr = PetscFree(collengths);CHKERRQ(ierr);
    *ia  = cia; *ja = cja;
  }
  PetscFunctionReturn(0);
}

/*
   MatRestoreColumnIJ_SeqAIJ - Frees the arrays produced by MatGetColumnIJ_SeqAIJ().

   Input Parameters:
+  ia - column offsets; nothing is done when this argument is NULL
-  ja - row indices; dereferenced without a NULL check

   A, oshift, symmetric, inodecompressed, n and done are not used by this routine.
*/
PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool  *done)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  if (!ia) PetscFunctionReturn(0);

  ierr = PetscFree(*ia);CHKERRQ(ierr);
  ierr = PetscFree(*ja);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
 MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
 MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
 spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()

 Output Parameters:
+  nn    - number of local columns (always set)
.  ia    - column offsets, n+1 entries; nothing more is done when this argument is NULL
.  ja    - row indices grouped by column, nz entries
-  spidx - for each entry of ja, the position a->i[row] + i of that entry in the row storage

 The symmetric, inodecompressed and done arguments are not used by the Get routine.
*/
PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool  *done)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscErrorCode ierr;
  PetscInt       i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n;
  PetscInt       nz = a->i[m],row,mr,col,tmp;
  PetscInt       *cspidx;
  const PetscInt *jj;

  PetscFunctionBegin;
  *nn = n;
  if (!ia) PetscFunctionReturn(0);

  ierr = PetscCalloc1(n,&collengths);CHKERRQ(ierr);
  ierr = PetscMalloc1(n+1,&cia);CHKERRQ(ierr);
  ierr = PetscMalloc1(nz,&cja);CHKERRQ(ierr);
  ierr = PetscMalloc1(nz,&cspidx);CHKERRQ(ierr);
  jj   = a->j;
  for (i=0; i<nz; i++) {
    collengths[jj[i]]++;
  }
  cia[0] = oshift;
  for (i=0; i<n; i++) {
    cia[i+1] = cia[i] + collengths[i];
  }
  /* collengths is reused below as the per-column fill position */
  ierr = PetscArrayzero(collengths,n);CHKERRQ(ierr);
  jj   = a->j;
  for (row=0; row<m; row++) {
    mr = a->i[row+1] - a->i[row];
    for (i=0; i<mr; i++) {
      col         = *jj++;
      tmp         = cia[col] + collengths[col]++ - oshift;
      cspidx[tmp] = a->i[row] + i; /* index of a->j */
      cja[tmp]    = row + oshift;
    }
  }
  ierr   = PetscFree(collengths);CHKERRQ(ierr);
  *ia    = cia;
  *ja    = cja;
  *spidx = cspidx;
  PetscFunctionReturn(0);
}
3577cee066cSHong Zhang 3587cee066cSHong Zhang PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool *done) 3597cee066cSHong Zhang { 3607cee066cSHong Zhang PetscErrorCode ierr; 3617cee066cSHong Zhang 3627cee066cSHong Zhang PetscFunctionBegin; 3635243ef75SHong Zhang ierr = MatRestoreColumnIJ_SeqAIJ(A,oshift,symmetric,inodecompressed,n,ia,ja,done);CHKERRQ(ierr); 3647cee066cSHong Zhang ierr = PetscFree(*spidx);CHKERRQ(ierr); 3657cee066cSHong Zhang PetscFunctionReturn(0); 3667cee066cSHong Zhang } 3677cee066cSHong Zhang 36887d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[]) 36987d4246cSBarry Smith { 37087d4246cSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 37187d4246cSBarry Smith PetscInt *ai = a->i; 37287d4246cSBarry Smith PetscErrorCode ierr; 37387d4246cSBarry Smith 37487d4246cSBarry Smith PetscFunctionBegin; 375580bdb30SBarry Smith ierr = PetscArraycpy(a->a+ai[row],v,ai[row+1]-ai[row]);CHKERRQ(ierr); 376e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 377c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && ai[row+1]-ai[row]) A->offloadmask = PETSC_OFFLOAD_CPU; 378e2cf4d64SStefano Zampini #endif 37987d4246cSBarry Smith PetscFunctionReturn(0); 38087d4246cSBarry Smith } 38187d4246cSBarry Smith 382bd04181cSBarry Smith /* 383bd04181cSBarry Smith MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions 384bd04181cSBarry Smith 385bd04181cSBarry Smith - a single row of values is set with each call 386bd04181cSBarry Smith - no row or column indices are negative or (in error) larger than the number of rows or columns 387bd04181cSBarry Smith - the values are always added to the matrix, not set 388bd04181cSBarry Smith - no new locations are introduced in the nonzero 
structure of the matrix 389bd04181cSBarry Smith 3901f763a69SBarry Smith This does NOT assume the global column indices are sorted 391bd04181cSBarry Smith 3921f763a69SBarry Smith */ 393bd04181cSBarry Smith 394af0996ceSBarry Smith #include <petsc/private/isimpl.h> 395189e4007SBarry Smith PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 396189e4007SBarry Smith { 397189e4007SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3981f763a69SBarry Smith PetscInt low,high,t,row,nrow,i,col,l; 3991f763a69SBarry Smith const PetscInt *rp,*ai = a->i,*ailen = a->ilen,*aj = a->j; 4001f763a69SBarry Smith PetscInt lastcol = -1; 401189e4007SBarry Smith MatScalar *ap,value,*aa = a->a; 402189e4007SBarry Smith const PetscInt *ridx = A->rmap->mapping->indices,*cidx = A->cmap->mapping->indices; 403189e4007SBarry Smith 404f38dd0b8SBarry Smith row = ridx[im[0]]; 4051f763a69SBarry Smith rp = aj + ai[row]; 4061f763a69SBarry Smith ap = aa + ai[row]; 4071f763a69SBarry Smith nrow = ailen[row]; 408189e4007SBarry Smith low = 0; 409189e4007SBarry Smith high = nrow; 410189e4007SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 411189e4007SBarry Smith col = cidx[in[l]]; 412f38dd0b8SBarry Smith value = v[l]; 413189e4007SBarry Smith 414189e4007SBarry Smith if (col <= lastcol) low = 0; 415189e4007SBarry Smith else high = nrow; 416189e4007SBarry Smith lastcol = col; 417189e4007SBarry Smith while (high-low > 5) { 418189e4007SBarry Smith t = (low+high)/2; 419189e4007SBarry Smith if (rp[t] > col) high = t; 420189e4007SBarry Smith else low = t; 421189e4007SBarry Smith } 422189e4007SBarry Smith for (i=low; i<high; i++) { 423189e4007SBarry Smith if (rp[i] == col) { 4241f763a69SBarry Smith ap[i] += value; 425189e4007SBarry Smith low = i + 1; 4261f763a69SBarry Smith break; 427189e4007SBarry Smith } 428189e4007SBarry Smith } 429189e4007SBarry Smith } 430e2cf4d64SStefano Zampini #if 
defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 431c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && m && n) A->offloadmask = PETSC_OFFLOAD_CPU; 432e2cf4d64SStefano Zampini #endif 433f38dd0b8SBarry Smith return 0; 434189e4007SBarry Smith } 435189e4007SBarry Smith 43697f1f81fSBarry Smith PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 43717ab2063SBarry Smith { 438416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 439e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 44097f1f81fSBarry Smith PetscInt *imax = a->imax,*ai = a->i,*ailen = a->ilen; 4416849ba73SBarry Smith PetscErrorCode ierr; 442e2ee6c50SBarry Smith PetscInt *aj = a->j,nonew = a->nonew,lastcol = -1; 443d8cdefa3SHong Zhang MatScalar *ap=NULL,value=0.0,*aa = a->a; 444ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 445ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 446e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 447e2cf4d64SStefano Zampini PetscBool inserted = PETSC_FALSE; 448e2cf4d64SStefano Zampini #endif 44917ab2063SBarry Smith 4503a40ed3dSBarry Smith PetscFunctionBegin; 45117ab2063SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 452416022c9SBarry Smith row = im[k]; 4535ef9f2a5SBarry Smith if (row < 0) continue; 454cf9c20a2SJed Brown if (PetscUnlikelyDebug(row >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1); 455720833daSHong Zhang rp = aj + ai[row]; 456876c6284SHong Zhang if (!A->structure_only) ap = aa + ai[row]; 45717ab2063SBarry Smith rmax = imax[row]; nrow = ailen[row]; 458416022c9SBarry Smith low = 0; 459c71e6ed7SBarry Smith high = nrow; 46017ab2063SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 4615ef9f2a5SBarry Smith if (in[l] < 0) continue; 462cf9c20a2SJed Brown if 
(PetscUnlikelyDebug(in[l] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 463bfeeae90SHong Zhang col = in[l]; 464071fcb05SBarry Smith if (v && !A->structure_only) value = roworiented ? v[l + k*n] : v[k + l*m]; 465071fcb05SBarry Smith if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue; 46636db0b34SBarry Smith 4672205254eSKarl Rupp if (col <= lastcol) low = 0; 4682205254eSKarl Rupp else high = nrow; 469e2ee6c50SBarry Smith lastcol = col; 470416022c9SBarry Smith while (high-low > 5) { 471416022c9SBarry Smith t = (low+high)/2; 472416022c9SBarry Smith if (rp[t] > col) high = t; 473416022c9SBarry Smith else low = t; 47417ab2063SBarry Smith } 475416022c9SBarry Smith for (i=low; i<high; i++) { 47617ab2063SBarry Smith if (rp[i] > col) break; 47717ab2063SBarry Smith if (rp[i] == col) { 478876c6284SHong Zhang if (!A->structure_only) { 4790c0d7e18SFande Kong if (is == ADD_VALUES) { 4800c0d7e18SFande Kong ap[i] += value; 4810c0d7e18SFande Kong (void)PetscLogFlops(1.0); 4820c0d7e18SFande Kong } 48317ab2063SBarry Smith else ap[i] = value; 484e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 485e2cf4d64SStefano Zampini inserted = PETSC_TRUE; 486e2cf4d64SStefano Zampini #endif 487720833daSHong Zhang } 488e44c0bd4SBarry Smith low = i + 1; 48917ab2063SBarry Smith goto noinsert; 49017ab2063SBarry Smith } 49117ab2063SBarry Smith } 492dcd36c23SBarry Smith if (value == 0.0 && ignorezeroentries && row != col) goto noinsert; 493c2653b3dSLois Curfman McInnes if (nonew == 1) goto noinsert; 494e32f2f54SBarry Smith if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix",row,col); 495720833daSHong Zhang if (A->structure_only) { 496876c6284SHong Zhang MatSeqXAIJReallocateAIJ_structure_only(A,A->rmap->n,1,nrow,row,col,rmax,ai,aj,rp,imax,nonew,MatScalar); 497720833daSHong Zhang 
} else { 498fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 499720833daSHong Zhang } 500c03d1d03SSatish Balay N = nrow++ - 1; a->nz++; high++; 501416022c9SBarry Smith /* shift up all the later entries in this row */ 502580bdb30SBarry Smith ierr = PetscArraymove(rp+i+1,rp+i,N-i+1);CHKERRQ(ierr); 50317ab2063SBarry Smith rp[i] = col; 504580bdb30SBarry Smith if (!A->structure_only){ 505580bdb30SBarry Smith ierr = PetscArraymove(ap+i+1,ap+i,N-i+1);CHKERRQ(ierr); 506580bdb30SBarry Smith ap[i] = value; 507580bdb30SBarry Smith } 508416022c9SBarry Smith low = i + 1; 509e56f5c9eSBarry Smith A->nonzerostate++; 510e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 511e2cf4d64SStefano Zampini inserted = PETSC_TRUE; 512e2cf4d64SStefano Zampini #endif 513e44c0bd4SBarry Smith noinsert:; 51417ab2063SBarry Smith } 51517ab2063SBarry Smith ailen[row] = nrow; 51617ab2063SBarry Smith } 517e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 518c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && inserted) A->offloadmask = PETSC_OFFLOAD_CPU; 519e2cf4d64SStefano Zampini #endif 5203a40ed3dSBarry Smith PetscFunctionReturn(0); 52117ab2063SBarry Smith } 52217ab2063SBarry Smith 523071fcb05SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 524071fcb05SBarry Smith { 525071fcb05SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 526071fcb05SBarry Smith PetscInt *rp,k,row; 527071fcb05SBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 528071fcb05SBarry Smith PetscErrorCode ierr; 529071fcb05SBarry Smith PetscInt *aj = a->j; 530071fcb05SBarry Smith MatScalar *aa = a->a,*ap; 531071fcb05SBarry Smith 532071fcb05SBarry Smith PetscFunctionBegin; 533071fcb05SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 534071fcb05SBarry Smith 
row = im[k]; 535071fcb05SBarry Smith rp = aj + ai[row]; 536071fcb05SBarry Smith ap = aa + ai[row]; 537071fcb05SBarry Smith if (!A->was_assembled) { 538071fcb05SBarry Smith ierr = PetscMemcpy(rp,in,n*sizeof(PetscInt));CHKERRQ(ierr); 539071fcb05SBarry Smith } 540071fcb05SBarry Smith if (!A->structure_only) { 541071fcb05SBarry Smith if (v) { 542071fcb05SBarry Smith ierr = PetscMemcpy(ap,v,n*sizeof(PetscScalar));CHKERRQ(ierr); 543071fcb05SBarry Smith v += n; 544071fcb05SBarry Smith } else { 545071fcb05SBarry Smith ierr = PetscMemzero(ap,n*sizeof(PetscScalar));CHKERRQ(ierr); 546071fcb05SBarry Smith } 547071fcb05SBarry Smith } 548071fcb05SBarry Smith ailen[row] = n; 549071fcb05SBarry Smith a->nz += n; 550071fcb05SBarry Smith } 551e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 552c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && m && n) A->offloadmask = PETSC_OFFLOAD_CPU; 553e2cf4d64SStefano Zampini #endif 554071fcb05SBarry Smith PetscFunctionReturn(0); 555071fcb05SBarry Smith } 556071fcb05SBarry Smith 55781824310SBarry Smith 558a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 5597eb43aa7SLois Curfman McInnes { 5607eb43aa7SLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 56197f1f81fSBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 56297f1f81fSBarry Smith PetscInt *ai = a->i,*ailen = a->ilen; 56354f21887SBarry Smith MatScalar *ap,*aa = a->a; 5647eb43aa7SLois Curfman McInnes 5653a40ed3dSBarry Smith PetscFunctionBegin; 5667eb43aa7SLois Curfman McInnes for (k=0; k<m; k++) { /* loop over rows */ 5677eb43aa7SLois Curfman McInnes row = im[k]; 568e32f2f54SBarry Smith if (row < 0) {v += n; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); */ 569e32f2f54SBarry Smith if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max 
%D",row,A->rmap->n-1); 570bfeeae90SHong Zhang rp = aj + ai[row]; ap = aa + ai[row]; 5717eb43aa7SLois Curfman McInnes nrow = ailen[row]; 5727eb43aa7SLois Curfman McInnes for (l=0; l<n; l++) { /* loop over columns */ 573e32f2f54SBarry Smith if (in[l] < 0) {v++; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); */ 574e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 575bfeeae90SHong Zhang col = in[l]; 5767eb43aa7SLois Curfman McInnes high = nrow; low = 0; /* assume unsorted */ 5777eb43aa7SLois Curfman McInnes while (high-low > 5) { 5787eb43aa7SLois Curfman McInnes t = (low+high)/2; 5797eb43aa7SLois Curfman McInnes if (rp[t] > col) high = t; 5807eb43aa7SLois Curfman McInnes else low = t; 5817eb43aa7SLois Curfman McInnes } 5827eb43aa7SLois Curfman McInnes for (i=low; i<high; i++) { 5837eb43aa7SLois Curfman McInnes if (rp[i] > col) break; 5847eb43aa7SLois Curfman McInnes if (rp[i] == col) { 585b49de8d1SLois Curfman McInnes *v++ = ap[i]; 5867eb43aa7SLois Curfman McInnes goto finished; 5877eb43aa7SLois Curfman McInnes } 5887eb43aa7SLois Curfman McInnes } 58997e567efSBarry Smith *v++ = 0.0; 5907eb43aa7SLois Curfman McInnes finished:; 5917eb43aa7SLois Curfman McInnes } 5927eb43aa7SLois Curfman McInnes } 5933a40ed3dSBarry Smith PetscFunctionReturn(0); 5947eb43aa7SLois Curfman McInnes } 5957eb43aa7SLois Curfman McInnes 5963ea6fe3dSLisandro Dalcin PetscErrorCode MatView_SeqAIJ_Binary(Mat mat,PetscViewer viewer) 59717ab2063SBarry Smith { 5983ea6fe3dSLisandro Dalcin Mat_SeqAIJ *A = (Mat_SeqAIJ*)mat->data; 5993ea6fe3dSLisandro Dalcin PetscInt header[4],M,N,m,nz,i; 6003ea6fe3dSLisandro Dalcin PetscInt *rowlens; 6016849ba73SBarry Smith PetscErrorCode ierr; 60217ab2063SBarry Smith 6033a40ed3dSBarry Smith PetscFunctionBegin; 6043ea6fe3dSLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 6052205254eSKarl Rupp 6063ea6fe3dSLisandro 
Dalcin M = mat->rmap->N; 6073ea6fe3dSLisandro Dalcin N = mat->cmap->N; 6083ea6fe3dSLisandro Dalcin m = mat->rmap->n; 6093ea6fe3dSLisandro Dalcin nz = A->nz; 610416022c9SBarry Smith 6113ea6fe3dSLisandro Dalcin /* write matrix header */ 6123ea6fe3dSLisandro Dalcin header[0] = MAT_FILE_CLASSID; 6133ea6fe3dSLisandro Dalcin header[1] = M; header[2] = N; header[3] = nz; 6143ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryWrite(viewer,header,4,PETSC_INT);CHKERRQ(ierr); 615416022c9SBarry Smith 6163ea6fe3dSLisandro Dalcin /* fill in and store row lengths */ 6173ea6fe3dSLisandro Dalcin ierr = PetscMalloc1(m,&rowlens);CHKERRQ(ierr); 6183ea6fe3dSLisandro Dalcin for (i=0; i<m; i++) rowlens[i] = A->i[i+1] - A->i[i]; 6193ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryWrite(viewer,rowlens,m,PETSC_INT);CHKERRQ(ierr); 6203ea6fe3dSLisandro Dalcin ierr = PetscFree(rowlens);CHKERRQ(ierr); 6213ea6fe3dSLisandro Dalcin /* store column indices */ 6223ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryWrite(viewer,A->j,nz,PETSC_INT);CHKERRQ(ierr); 623416022c9SBarry Smith /* store nonzero values */ 6243ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryWrite(viewer,A->a,nz,PETSC_SCALAR);CHKERRQ(ierr); 625b37d52dbSMark F. 
Adams 6263ea6fe3dSLisandro Dalcin /* write block size option to the viewer's .info file */ 6273ea6fe3dSLisandro Dalcin ierr = MatView_Binary_BlockSizes(mat,viewer);CHKERRQ(ierr); 6283a40ed3dSBarry Smith PetscFunctionReturn(0); 62917ab2063SBarry Smith } 630416022c9SBarry Smith 6317dc0baabSHong Zhang static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer) 6327dc0baabSHong Zhang { 6337dc0baabSHong Zhang PetscErrorCode ierr; 6347dc0baabSHong Zhang Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 6357dc0baabSHong Zhang PetscInt i,k,m=A->rmap->N; 6367dc0baabSHong Zhang 6377dc0baabSHong Zhang PetscFunctionBegin; 6387dc0baabSHong Zhang ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 6397dc0baabSHong Zhang for (i=0; i<m; i++) { 6407dc0baabSHong Zhang ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 6417dc0baabSHong Zhang for (k=a->i[i]; k<a->i[i+1]; k++) { 6427dc0baabSHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (%D) ",a->j[k]);CHKERRQ(ierr); 6437dc0baabSHong Zhang } 6447dc0baabSHong Zhang ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 6457dc0baabSHong Zhang } 6467dc0baabSHong Zhang ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 6477dc0baabSHong Zhang PetscFunctionReturn(0); 6487dc0baabSHong Zhang } 6497dc0baabSHong Zhang 65009573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer); 651cd155464SBarry Smith 652dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer) 653416022c9SBarry Smith { 654416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 655dfbe8321SBarry Smith PetscErrorCode ierr; 65660e0710aSBarry Smith PetscInt i,j,m = A->rmap->n; 657e060cb09SBarry Smith const char *name; 658f3ef73ceSBarry Smith PetscViewerFormat format; 65917ab2063SBarry Smith 6603a40ed3dSBarry Smith PetscFunctionBegin; 6617dc0baabSHong Zhang if (A->structure_only) { 6627dc0baabSHong Zhang ierr = MatView_SeqAIJ_ASCII_structonly(A,viewer);CHKERRQ(ierr); 
6637dc0baabSHong Zhang PetscFunctionReturn(0); 6647dc0baabSHong Zhang } 66543e49210SHong Zhang 666b0a32e0cSBarry Smith /* the remaining output layout is chosen by the viewer's format; the MATLAB branch prints one "row column value" line per stored entry, with row and column shifted to start at 1 */ ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 66771c2f376SKris Buschelman if (format == PETSC_VIEWER_ASCII_MATLAB) { 66897f1f81fSBarry Smith PetscInt nofinalvalue = 0; 66960e0710aSBarry Smith /* true when the last row stores nothing, or the last stored column index is not the final column */ if (m && ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-1))) { 670c337ccceSJed Brown /* Need a dummy value to ensure the dimension of the matrix. */ 671d00d2cf4SBarry Smith nofinalvalue = 1; 672d00d2cf4SBarry Smith } 673d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 674d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",m,A->cmap->n);CHKERRQ(ierr); 67577431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %D \n",a->nz);CHKERRQ(ierr); 676fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX) 677fbfe6fa7SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,4);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 678fbfe6fa7SJed Brown #else 67977431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,3);\n",a->nz+nofinalvalue);CHKERRQ(ierr); 680fbfe6fa7SJed Brown #endif 681b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"zzz = [\n");CHKERRQ(ierr); 68217ab2063SBarry Smith 68317ab2063SBarry Smith /* one output line per stored entry; complex builds print real and imaginary parts as two columns */ for (i=0; i<m; i++) { 68460e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 685aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 686a9bf72d8SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e %18.16e\n",i+1,a->j[j]+1,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 68717ab2063SBarry Smith #else 68860e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",i+1,a->j[j]+1,(double)a->a[j]);CHKERRQ(ierr); 68917ab2063SBarry Smith #endif 69017ab2063SBarry Smith } 69117ab2063SBarry Smith } 692d00d2cf4SBarry Smith if (nofinalvalue) { 693c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
694c337ccceSJed Brown ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e %18.16e\n",m,A->cmap->n,0.,0.);CHKERRQ(ierr); 695c337ccceSJed Brown #else 696d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %18.16e\n",m,A->cmap->n,0.0);CHKERRQ(ierr); 697c337ccceSJed Brown #endif 698d00d2cf4SBarry Smith } 699317d6ea6SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr); 700fb9695e5SSatish Balay ierr = PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name);CHKERRQ(ierr); 701d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 7022950ac48SStefano Zampini } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 703cd155464SBarry Smith PetscFunctionReturn(0); 704fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 705d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 70644cd7ae7SLois Curfman McInnes for (i=0; i<m; i++) { 70777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 70860e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 709aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 71036db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) { 71160e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 71236db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) { 71360e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 71436db0b34SBarry Smith } else if (PetscRealPart(a->a[j]) != 0.0) { 71560e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 
7166831982aSBarry Smith } 71744cd7ae7SLois Curfman McInnes #else 71860e0710aSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr);} 71944cd7ae7SLois Curfman McInnes #endif 72044cd7ae7SLois Curfman McInnes } 721b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 72244cd7ae7SLois Curfman McInnes } 723d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 724fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_SYMMODU) { 72597f1f81fSBarry Smith PetscInt nzd=0,fshift=1,*sptr; 726d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 727854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&sptr);CHKERRQ(ierr); 728496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 729496be53dSLois Curfman McInnes sptr[i] = nzd+1; 73060e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 731496be53dSLois Curfman McInnes if (a->j[j] >= i) { 732aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 73336db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++; 734496be53dSLois Curfman McInnes #else 735496be53dSLois Curfman McInnes if (a->a[j] != 0.0) nzd++; 736496be53dSLois Curfman McInnes #endif 737496be53dSLois Curfman McInnes } 738496be53dSLois Curfman McInnes } 739496be53dSLois Curfman McInnes } 7402e44a96cSLois Curfman McInnes sptr[m] = nzd+1; 74177431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %D %D\n\n",m,nzd);CHKERRQ(ierr); 7422e44a96cSLois Curfman McInnes for (i=0; i<m+1; i+=6) { 7432205254eSKarl Rupp if (i+4<m) { 7442205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5]);CHKERRQ(ierr); 7452205254eSKarl Rupp } else if (i+3<m) { 7462205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4]);CHKERRQ(ierr); 7472205254eSKarl Rupp } 
else if (i+2<m) { 7482205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3]);CHKERRQ(ierr); 7492205254eSKarl Rupp } else if (i+1<m) { 7502205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2]);CHKERRQ(ierr); 7512205254eSKarl Rupp } else if (i<m) { 7522205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D %D\n",sptr[i],sptr[i+1]);CHKERRQ(ierr); 7532205254eSKarl Rupp } else { 7542205254eSKarl Rupp ierr = PetscViewerASCIIPrintf(viewer," %D\n",sptr[i]);CHKERRQ(ierr); 7552205254eSKarl Rupp } 756496be53dSLois Curfman McInnes } 757b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 758606d414cSSatish Balay ierr = PetscFree(sptr);CHKERRQ(ierr); 759496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 76060e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 76177431f27SBarry Smith if (a->j[j] >= i) {ierr = PetscViewerASCIIPrintf(viewer," %D ",a->j[j]+fshift);CHKERRQ(ierr);} 762496be53dSLois Curfman McInnes } 763b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 764496be53dSLois Curfman McInnes } 765b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 766496be53dSLois Curfman McInnes for (i=0; i<m; i++) { 76760e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 768496be53dSLois Curfman McInnes if (a->j[j] >= i) { 769aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 77036db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) { 77160e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 7726831982aSBarry Smith } 773496be53dSLois Curfman McInnes #else 77460e0710aSBarry Smith if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," %18.16e ",(double)a->a[j]);CHKERRQ(ierr);} 775496be53dSLois Curfman McInnes #endif 776496be53dSLois Curfman McInnes } 
777496be53dSLois Curfman McInnes } 778b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 779496be53dSLois Curfman McInnes } 780d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 781fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_DENSE) { 78297f1f81fSBarry Smith PetscInt cnt = 0,jcnt; 78387828ca2SBarry Smith PetscScalar value; 78468f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX) 78568f1ed48SBarry Smith PetscBool realonly = PETSC_TRUE; 78668f1ed48SBarry Smith 78768f1ed48SBarry Smith for (i=0; i<a->i[m]; i++) { 78868f1ed48SBarry Smith if (PetscImaginaryPart(a->a[i]) != 0.0) { 78968f1ed48SBarry Smith realonly = PETSC_FALSE; 79068f1ed48SBarry Smith break; 79168f1ed48SBarry Smith } 79268f1ed48SBarry Smith } 79368f1ed48SBarry Smith #endif 79402594712SBarry Smith 795d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 79602594712SBarry Smith for (i=0; i<m; i++) { 79702594712SBarry Smith jcnt = 0; 798d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 799e24b481bSBarry Smith if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) { 80002594712SBarry Smith value = a->a[cnt++]; 801e24b481bSBarry Smith jcnt++; 80202594712SBarry Smith } else { 80302594712SBarry Smith value = 0.0; 80402594712SBarry Smith } 805aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 80668f1ed48SBarry Smith if (realonly) { 80760e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)PetscRealPart(value));CHKERRQ(ierr); 80868f1ed48SBarry Smith } else { 80960e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",(double)PetscRealPart(value),(double)PetscImaginaryPart(value));CHKERRQ(ierr); 81068f1ed48SBarry Smith } 81102594712SBarry Smith #else 81260e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)value);CHKERRQ(ierr); 81302594712SBarry Smith #endif 81402594712SBarry Smith } 815b0a32e0cSBarry Smith ierr = 
PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 81602594712SBarry Smith } 817d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 8183c215bfdSMatthew Knepley } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) { 819150b93efSMatthew G. Knepley PetscInt fshift=1; 820d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 8213c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 82219303e72SJonathan Guyer ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate complex general\n");CHKERRQ(ierr); 8233c215bfdSMatthew Knepley #else 82419303e72SJonathan Guyer ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate real general\n");CHKERRQ(ierr); 8253c215bfdSMatthew Knepley #endif 826d0f46423SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"%D %D %D\n", m, A->cmap->n, a->nz);CHKERRQ(ierr); 8273c215bfdSMatthew Knepley for (i=0; i<m; i++) { 82860e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 8293c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX) 830a9a0e077SKarl Rupp ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g %g\n", i+fshift,a->j[j]+fshift,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 8313c215bfdSMatthew Knepley #else 832150b93efSMatthew G. 
Knepley ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g\n", i+fshift, a->j[j]+fshift, (double)a->a[j]);CHKERRQ(ierr); 8333c215bfdSMatthew Knepley #endif 8343c215bfdSMatthew Knepley } 8353c215bfdSMatthew Knepley } 836d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 8373a40ed3dSBarry Smith } else { 838d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 839d5f3da31SBarry Smith if (A->factortype) { 84016cd7e1dSShri Abhyankar for (i=0; i<m; i++) { 84116cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 84216cd7e1dSShri Abhyankar /* L part */ 84360e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 84416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 84516cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 84660e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 84716cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8486712e2f1SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr); 84916cd7e1dSShri Abhyankar } else { 85060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 85116cd7e1dSShri Abhyankar } 85216cd7e1dSShri Abhyankar #else 85360e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 85416cd7e1dSShri Abhyankar #endif 85516cd7e1dSShri Abhyankar } 85616cd7e1dSShri Abhyankar /* diagonal */ 85716cd7e1dSShri Abhyankar j = a->diag[i]; 85816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 85916cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 86060e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g 
i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr); 86116cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 8626712e2f1SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)(-PetscImaginaryPart(1.0/a->a[j])));CHKERRQ(ierr); 86316cd7e1dSShri Abhyankar } else { 86460e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(1.0/a->a[j]));CHKERRQ(ierr); 86516cd7e1dSShri Abhyankar } 86616cd7e1dSShri Abhyankar #else 86760e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)(1.0/a->a[j]));CHKERRQ(ierr); 86816cd7e1dSShri Abhyankar #endif 86916cd7e1dSShri Abhyankar 87016cd7e1dSShri Abhyankar /* U part */ 87160e0710aSBarry Smith for (j=a->diag[i+1]+1; j<a->diag[i]; j++) { 87216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 87316cd7e1dSShri Abhyankar if (PetscImaginaryPart(a->a[j]) > 0.0) { 87460e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 87516cd7e1dSShri Abhyankar } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 87622ab088eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr); 87716cd7e1dSShri Abhyankar } else { 87860e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 87916cd7e1dSShri Abhyankar } 88016cd7e1dSShri Abhyankar #else 88160e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 88216cd7e1dSShri Abhyankar #endif 88316cd7e1dSShri Abhyankar } 88416cd7e1dSShri Abhyankar ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 88516cd7e1dSShri Abhyankar } 88616cd7e1dSShri Abhyankar } else { 88717ab2063SBarry 
Smith for (i=0; i<m; i++) { 88877431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 88960e0710aSBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 890aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX) 89136db0b34SBarry Smith if (PetscImaginaryPart(a->a[j]) > 0.0) { 89260e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 89336db0b34SBarry Smith } else if (PetscImaginaryPart(a->a[j]) < 0.0) { 89460e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr); 8953a40ed3dSBarry Smith } else { 89660e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr); 89717ab2063SBarry Smith } 89817ab2063SBarry Smith #else 89960e0710aSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr); 90017ab2063SBarry Smith #endif 90117ab2063SBarry Smith } 902b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 90317ab2063SBarry Smith } 90416cd7e1dSShri Abhyankar } 905d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 90617ab2063SBarry Smith } 907b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 9083a40ed3dSBarry Smith PetscFunctionReturn(0); 909416022c9SBarry Smith } 910416022c9SBarry Smith 9119804daf3SBarry Smith #include <petscdraw.h> 912dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 913416022c9SBarry Smith { 914480ef9eaSBarry Smith Mat A = (Mat) Aa; 915416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 916dfbe8321SBarry Smith PetscErrorCode ierr; 917383922c3SLisandro Dalcin PetscInt i,j,m = A->rmap->n; 918383922c3SLisandro Dalcin int color; 919b05fc000SLisandro Dalcin PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 
920b0a32e0cSBarry Smith PetscViewer viewer; 921f3ef73ceSBarry Smith PetscViewerFormat format; 922cddf8d76SBarry Smith 9233a40ed3dSBarry Smith PetscFunctionBegin; 924480ef9eaSBarry Smith ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 925b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 926b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 927383922c3SLisandro Dalcin 928416022c9SBarry Smith /* loop over matrix elements drawing boxes */ 9290513a670SBarry Smith 930fb9695e5SSatish Balay if (format != PETSC_VIEWER_DRAW_CONTOUR) { 931383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 9320513a670SBarry Smith /* Blue for negative, Cyan for zero and Red for positive */ 933b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 934416022c9SBarry Smith for (i=0; i<m; i++) { 935cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 936bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 937bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 93836db0b34SBarry Smith if (PetscRealPart(a->a[j]) >= 0.) continue; 939b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 940cddf8d76SBarry Smith } 941cddf8d76SBarry Smith } 942b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 943cddf8d76SBarry Smith for (i=0; i<m; i++) { 944cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 945bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 946bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 947cddf8d76SBarry Smith if (a->a[j] != 0.) 
continue; 948b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 949cddf8d76SBarry Smith } 950cddf8d76SBarry Smith } 951b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 952cddf8d76SBarry Smith for (i=0; i<m; i++) { 953cddf8d76SBarry Smith y_l = m - i - 1.0; y_r = y_l + 1.0; 954bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 955bfeeae90SHong Zhang x_l = a->j[j]; x_r = x_l + 1.0; 95636db0b34SBarry Smith if (PetscRealPart(a->a[j]) <= 0.) continue; 957b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 958416022c9SBarry Smith } 959416022c9SBarry Smith } 960383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 9610513a670SBarry Smith } else { 9620513a670SBarry Smith /* use contour shading to indicate magnitude of values */ 9630513a670SBarry Smith /* first determine max of all nonzero values */ 964b05fc000SLisandro Dalcin PetscReal minv = 0.0, maxv = 0.0; 965383922c3SLisandro Dalcin PetscInt nz = a->nz, count = 0; 966b0a32e0cSBarry Smith PetscDraw popup; 9670513a670SBarry Smith 9680513a670SBarry Smith for (i=0; i<nz; i++) { 9690513a670SBarry Smith if (PetscAbsScalar(a->a[i]) > maxv) maxv = PetscAbsScalar(a->a[i]); 9700513a670SBarry Smith } 971383922c3SLisandro Dalcin if (minv >= maxv) maxv = minv + PETSC_SMALL; 972b0a32e0cSBarry Smith ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr); 97345f3bb6eSLisandro Dalcin ierr = PetscDrawScalePopup(popup,minv,maxv);CHKERRQ(ierr); 974383922c3SLisandro Dalcin 975383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 9760513a670SBarry Smith for (i=0; i<m; i++) { 977383922c3SLisandro Dalcin y_l = m - i - 1.0; 978383922c3SLisandro Dalcin y_r = y_l + 1.0; 979bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 980383922c3SLisandro Dalcin x_l = a->j[j]; 981383922c3SLisandro Dalcin x_r = x_l + 1.0; 982b05fc000SLisandro Dalcin color = 
PetscDrawRealToColor(PetscAbsScalar(a->a[count]),minv,maxv); 983b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr); 9840513a670SBarry Smith count++; 9850513a670SBarry Smith } 9860513a670SBarry Smith } 987383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 9880513a670SBarry Smith } 989480ef9eaSBarry Smith PetscFunctionReturn(0); 990480ef9eaSBarry Smith } 991cddf8d76SBarry Smith 9929804daf3SBarry Smith #include <petscdraw.h> 993dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer) 994480ef9eaSBarry Smith { 995dfbe8321SBarry Smith PetscErrorCode ierr; 996b0a32e0cSBarry Smith PetscDraw draw; 99736db0b34SBarry Smith PetscReal xr,yr,xl,yl,h,w; 998ace3abfcSBarry Smith PetscBool isnull; 999480ef9eaSBarry Smith 1000480ef9eaSBarry Smith PetscFunctionBegin; 1001b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 1002b0a32e0cSBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 1003480ef9eaSBarry Smith if (isnull) PetscFunctionReturn(0); 1004480ef9eaSBarry Smith 1005d0f46423SBarry Smith xr = A->cmap->n; yr = A->rmap->n; h = yr/10.0; w = xr/10.0; 1006480ef9eaSBarry Smith xr += w; yr += h; xl = -w; yl = -h; 1007b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 1008832b7cebSLisandro Dalcin ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 1009b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A);CHKERRQ(ierr); 10100298fd71SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr); 1011832b7cebSLisandro Dalcin ierr = PetscDrawSave(draw);CHKERRQ(ierr); 10123a40ed3dSBarry Smith PetscFunctionReturn(0); 1013416022c9SBarry Smith } 1014416022c9SBarry Smith 1015dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer) 1016416022c9SBarry Smith { 1017dfbe8321SBarry Smith PetscErrorCode ierr; 
1018ace3abfcSBarry Smith PetscBool iascii,isbinary,isdraw; 1019416022c9SBarry Smith 10203a40ed3dSBarry Smith PetscFunctionBegin; 1021251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 1022251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 1023251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 1024c45a1595SBarry Smith if (iascii) { 10253a40ed3dSBarry Smith ierr = MatView_SeqAIJ_ASCII(A,viewer);CHKERRQ(ierr); 10260f5bd95cSBarry Smith } else if (isbinary) { 10273a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Binary(A,viewer);CHKERRQ(ierr); 10280f5bd95cSBarry Smith } else if (isdraw) { 10293a40ed3dSBarry Smith ierr = MatView_SeqAIJ_Draw(A,viewer);CHKERRQ(ierr); 103011aeaf0aSBarry Smith } 10314108e4d5SBarry Smith ierr = MatView_SeqAIJ_Inode(A,viewer);CHKERRQ(ierr); 10323a40ed3dSBarry Smith PetscFunctionReturn(0); 103317ab2063SBarry Smith } 103419bcc07fSBarry Smith

/*
   MatAssemblyEnd_SeqAIJ - Finishes assembly of a SeqAIJ matrix by squeezing out the
   unused slots that were preallocated in each row.

   Input Parameters:
+  A    - the matrix
-  mode - MAT_FLUSH_ASSEMBLY returns at once; any other value performs the compaction

   Nothing beyond invalidating the cached diagonal is done when the matrix was
   already assembled and its nonzero state has not changed since.

   Errors with PETSC_ERR_PLIB when unused space is found while a->nounused is -1.
*/
PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode)
{
  Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
  PetscErrorCode ierr;
  PetscInt       *ai = a->i,*aj = a->j,*imax = a->imax,*ailen = a->ilen;
  MatScalar      *aa = a->a;
  PetscInt       m = A->rmap->n,fshift = 0,rmax = 0,row;
  PetscReal      ratio = 0.6;

  PetscFunctionBegin;
  if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0);
  ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr);
  if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) PetscFunctionReturn(0);

  /* determine row with most nonzeros while compacting */
  if (m) rmax = ailen[0];
  for (row=1; row<m; row++) {
    /* move each row back by the amount of empty slots (fshift) before it */
    fshift += imax[row-1] - ailen[row-1];
    rmax    = PetscMax(rmax,ailen[row]);
    if (fshift) {
      /* ai[row] still holds the old (preallocated) offset at this point */
      PetscInt  *cols = aj + ai[row];
      MatScalar *vals = aa + ai[row];
      PetscInt  len   = ailen[row];

      ierr = PetscArraymove(cols-fshift,cols,len);CHKERRQ(ierr);
      if (!A->structure_only) {
        ierr = PetscArraymove(vals-fshift,vals,len);CHKERRQ(ierr);
      }
    }
    ai[row] = ai[row-1] + ailen[row-1];
  }
  if (m) {
    fshift += imax[m-1] - ailen[m-1];
    ai[m]   = ai[m-1] + ailen[m-1];
  }

  /* reset ilen and imax for each row */
  a->nonzerorowcnt = 0;
  if (A->structure_only) {
    ierr = PetscFree(a->imax);CHKERRQ(ierr);
    ierr = PetscFree(a->ilen);CHKERRQ(ierr);
  } else { /* !A->structure_only */
    for (row=0; row<m; row++) {
      const PetscInt len = ai[row+1] - ai[row];

      ailen[row] = imax[row] = len;
      if (len > 0) a->nonzerorowcnt++;
    }
  }
  a->nz = ai[m];
  if (fshift && a->nounused == -1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %D X %D, %D unneeded", m, A->cmap->n, fshift);

  ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr);
  ierr = PetscInfo4(A,"Matrix size: %D X %D; storage space: %D unneeded,%D used\n",m,A->cmap->n,fshift,a->nz);CHKERRQ(ierr);
  ierr = PetscInfo1(A,"Number of mallocs during MatSetValues() is %D\n",a->reallocs);CHKERRQ(ierr);
  ierr = PetscInfo1(A,"Maximum nonzeros in any row is %D\n",rmax);CHKERRQ(ierr);

  /* fold the per-assembly counters into the matrix info and reset them */
  A->info.mallocs    += a->reallocs;
  a->reallocs         = 0;
  A->info.nz_unneeded = (PetscReal)fshift;
  a->rmax             = rmax;

  if (!A->structure_only) {
    ierr = MatCheckCompressedRow(A,a->nonzerorowcnt,&a->compressedrow,a->i,m,ratio);CHKERRQ(ierr);
  }
  ierr = MatAssemblyEnd_SeqAIJ_Inode(A,mode);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   MatRealPart_SeqAIJ - Replaces every stored value by its real part, in place.

   The cached diagonal is invalidated afterwards and, in ViennaCL/CUDA builds, an
   allocated matrix is marked as having its current data on the CPU.
*/
PetscErrorCode MatRealPart_SeqAIJ(Mat A)
{
  Mat_SeqAIJ     *aij  = (Mat_SeqAIJ*)A->data;
  MatScalar      *vals = aij->a;
  PetscInt       k,nnz = aij->nz;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  for (k=0; k<nnz; k++) {
    vals[k] = PetscRealPart(vals[k]);
  }
  ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr);
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
  if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU;
#endif
  PetscFunctionReturn(0);
}

/*
   MatImaginaryPart_SeqAIJ - Replaces every stored value by its imaginary part, in place.

   The cached diagonal is invalidated afterwards and, in ViennaCL/CUDA builds, an
   allocated matrix is marked as having its current data on the CPU.
*/
PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
{
  Mat_SeqAIJ     *aij  = (Mat_SeqAIJ*)A->data;
  MatScalar      *vals = aij->a;
  PetscInt       k,nnz = aij->nz;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  for (k=0; k<nnz; k++) {
    vals[k] = PetscImaginaryPart(vals[k]);
  }
  ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr);
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
  if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU;
#endif
  PetscFunctionReturn(0);
}

/*
   MatZeroEntries_SeqAIJ - Zeros the stored values while leaving the nonzero pattern untouched.

   The number of values cleared is the final row offset, a->i[number of local rows].
   The cached diagonal is invalidated afterwards and, in ViennaCL/CUDA builds, an
   allocated matrix is marked as having its current data on the CPU.
*/
PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
{
  Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)A->data;
  PetscErrorCode ierr;

  PetscFunctionBegin;
  ierr = PetscArrayzero(aij->a,aij->i[A->rmap->n]);CHKERRQ(ierr);
  ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr);
#if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
  if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU;
#endif
  PetscFunctionReturn(0);
}

/* unchanged: head of MatDestroy_SeqAIJ, which continues on the following source lines */
1147dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A) 114817ab2063SBarry Smith { 1149416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1150dfbe8321SBarry Smith PetscErrorCode ierr; 1151d5d45c9bSBarry Smith 11523a40ed3dSBarry Smith PetscFunctionBegin; 1153aa482453SBarry Smith #if defined(PETSC_USE_LOG) 1154d0f46423SBarry Smith PetscLogObjectState((PetscObject)A,"Rows=%D, Cols=%D, NZ=%D",A->rmap->n,A->cmap->n,a->nz); 115517ab2063SBarry Smith #endif 1156e6b907acSBarry Smith ierr = MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i);CHKERRQ(ierr);
11576bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 11586bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 115905b42c5fSBarry Smith ierr = PetscFree(a->diag);CHKERRQ(ierr); 1160d48dcb14SBarry Smith ierr = PetscFree(a->ibdiag);CHKERRQ(ierr); 1161071fcb05SBarry Smith ierr = PetscFree(a->imax);CHKERRQ(ierr); 1162071fcb05SBarry Smith ierr = PetscFree(a->ilen);CHKERRQ(ierr); 1163846b4da1SFande Kong ierr = PetscFree(a->ipre);CHKERRQ(ierr); 116471f1c65dSBarry Smith ierr = PetscFree3(a->idiag,a->mdiag,a->ssor_work);CHKERRQ(ierr); 116505b42c5fSBarry Smith ierr = PetscFree(a->solve_work);CHKERRQ(ierr); 11666bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 116705b42c5fSBarry Smith ierr = PetscFree(a->saved_values);CHKERRQ(ierr); 1168cd6b891eSBarry Smith ierr = PetscFree2(a->compressedrow.i,a->compressedrow.rindex);CHKERRQ(ierr); 1169a30b2313SHong Zhang 11704108e4d5SBarry Smith ierr = MatDestroy_SeqAIJ_Inode(A);CHKERRQ(ierr); 1171bf0cc555SLisandro Dalcin ierr = PetscFree(A->data);CHKERRQ(ierr); 1172901853e0SKris Buschelman 11736718818eSStefano Zampini /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this. 11746718818eSStefano Zampini That function is so heavily used (sometimes in an hidden way through multnumeric function pointers) 11756718818eSStefano Zampini that is hard to properly add this data to the MatProduct data. 
We free it here to avoid 11766718818eSStefano Zampini users reusing the matrix object with different data to incur in obscure segmentation faults 11776718818eSStefano Zampini due to different matrix sizes */ 11786718818eSStefano Zampini ierr = PetscObjectCompose((PetscObject)A,"__PETSc__ab_dense",NULL);CHKERRQ(ierr); 11796718818eSStefano Zampini 1180dbd8c25aSHong Zhang ierr = PetscObjectChangeTypeName((PetscObject)A,0);CHKERRQ(ierr); 1181bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetColumnIndices_C",NULL);CHKERRQ(ierr); 1182bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL);CHKERRQ(ierr); 1183bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL);CHKERRQ(ierr); 1184bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsbaij_C",NULL);CHKERRQ(ierr); 1185bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqbaij_C",NULL);CHKERRQ(ierr); 1186bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijperm_C",NULL);CHKERRQ(ierr); 11874222ddf1SHong Zhang 11884222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA) 11894222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcusparse_C",NULL);CHKERRQ(ierr); 1190*e6e9a74fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",NULL);CHKERRQ(ierr); 11914222ddf1SHong Zhang #endif 11924222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcrl_C",NULL);CHKERRQ(ierr); 1193af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 1194af8000cdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_elemental_C",NULL);CHKERRQ(ierr); 1195af8000cdSHong Zhang #endif 1196d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 1197d24d4204SJose E. 
Roman ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_scalapack_C",NULL);CHKERRQ(ierr); 1198d24d4204SJose E. Roman #endif 119963c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 120063c07aadSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_hypre_C",NULL);CHKERRQ(ierr); 12014222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",NULL);CHKERRQ(ierr); 120263c07aadSStefano Zampini #endif 1203b49cda9fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqdense_C",NULL);CHKERRQ(ierr); 1204c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsell_C",NULL);CHKERRQ(ierr); 1205c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_is_C",NULL);CHKERRQ(ierr); 1206bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatIsTranspose_C",NULL);CHKERRQ(ierr); 1207bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",NULL);CHKERRQ(ierr); 1208846b4da1SFande Kong ierr = PetscObjectComposeFunction((PetscObject)A,"MatResetPreallocation_C",NULL);CHKERRQ(ierr); 1209bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C",NULL);CHKERRQ(ierr); 1210bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatReorderForNonzeroDiagonal_C",NULL);CHKERRQ(ierr); 12114222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_is_seqaij_C",NULL);CHKERRQ(ierr); 12124222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqdense_seqaij_C",NULL);CHKERRQ(ierr); 12134222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaij_C",NULL);CHKERRQ(ierr); 12143a40ed3dSBarry Smith PetscFunctionReturn(0); 121517ab2063SBarry Smith } 
121617ab2063SBarry Smith 1217ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg) 121817ab2063SBarry Smith { 1219416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12204846f1f5SKris Buschelman PetscErrorCode ierr; 12213a40ed3dSBarry Smith 12223a40ed3dSBarry Smith PetscFunctionBegin; 1223a65d3064SKris Buschelman switch (op) { 1224a65d3064SKris Buschelman case MAT_ROW_ORIENTED: 12254e0d8c25SBarry Smith a->roworiented = flg; 1226a65d3064SKris Buschelman break; 1227a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 1228a9817697SBarry Smith a->keepnonzeropattern = flg; 1229a65d3064SKris Buschelman break; 1230512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 1231512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 1232a65d3064SKris Buschelman break; 1233a65d3064SKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 12344e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 1235a65d3064SKris Buschelman break; 1236a65d3064SKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 12374e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 1238a65d3064SKris Buschelman break; 123928b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 124028b2fa4aSMatthew Knepley a->nounused = (flg ? 
-1 : 0); 124128b2fa4aSMatthew Knepley break; 1242a65d3064SKris Buschelman case MAT_IGNORE_ZERO_ENTRIES: 12434e0d8c25SBarry Smith a->ignorezeroentries = flg; 12440df259c2SBarry Smith break; 12453d472b54SHong Zhang case MAT_SPD: 1246b1646e73SJed Brown case MAT_SYMMETRIC: 1247b1646e73SJed Brown case MAT_STRUCTURALLY_SYMMETRIC: 1248b1646e73SJed Brown case MAT_HERMITIAN: 1249b1646e73SJed Brown case MAT_SYMMETRY_ETERNAL: 1250957cac9fSHong Zhang case MAT_STRUCTURE_ONLY: 12515021d80fSJed Brown /* These options are handled directly by MatSetOption() */ 12525021d80fSJed Brown break; 12534e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 1254a65d3064SKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 1255a65d3064SKris Buschelman case MAT_USE_HASH_TABLE: 1256290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 1257a65d3064SKris Buschelman break; 1258b87ac2d8SJed Brown case MAT_USE_INODES: 1259b87ac2d8SJed Brown /* Not an error because MatSetOption_SeqAIJ_Inode handles this one */ 1260b87ac2d8SJed Brown break; 1261c10200c1SHong Zhang case MAT_SUBMAT_SINGLEIS: 1262c10200c1SHong Zhang A->submat_singleis = flg; 1263c10200c1SHong Zhang break; 1264071fcb05SBarry Smith case MAT_SORTED_FULL: 1265071fcb05SBarry Smith if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 1266071fcb05SBarry Smith else A->ops->setvalues = MatSetValues_SeqAIJ; 1267071fcb05SBarry Smith break; 1268a65d3064SKris Buschelman default: 1269e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 1270a65d3064SKris Buschelman } 12714108e4d5SBarry Smith ierr = MatSetOption_SeqAIJ_Inode(A,op,flg);CHKERRQ(ierr); 12723a40ed3dSBarry Smith PetscFunctionReturn(0); 127317ab2063SBarry Smith } 127417ab2063SBarry Smith 1275dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v) 127617ab2063SBarry Smith { 1277416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 12786849ba73SBarry Smith PetscErrorCode ierr; 1279fdc842d1SBarry Smith 
PetscInt i,j,n,*ai=a->i,*aj=a->j; 1280fdc842d1SBarry Smith PetscScalar *aa=a->a,*x; 128117ab2063SBarry Smith 12823a40ed3dSBarry Smith PetscFunctionBegin; 1283d3e70bfaSHong Zhang ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 1284e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 128535e7444dSHong Zhang 1286d5f3da31SBarry Smith if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) { 1287d3e70bfaSHong Zhang PetscInt *diag=a->diag; 1288fdc842d1SBarry Smith ierr = VecGetArrayWrite(v,&x);CHKERRQ(ierr); 12892c990fa1SHong Zhang for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]]; 1290fdc842d1SBarry Smith ierr = VecRestoreArrayWrite(v,&x);CHKERRQ(ierr); 129135e7444dSHong Zhang PetscFunctionReturn(0); 129235e7444dSHong Zhang } 129335e7444dSHong Zhang 1294fdc842d1SBarry Smith ierr = VecGetArrayWrite(v,&x);CHKERRQ(ierr); 129535e7444dSHong Zhang for (i=0; i<n; i++) { 1296fdc842d1SBarry Smith x[i] = 0.0; 129735e7444dSHong Zhang for (j=ai[i]; j<ai[i+1]; j++) { 129835e7444dSHong Zhang if (aj[j] == i) { 129935e7444dSHong Zhang x[i] = aa[j]; 130017ab2063SBarry Smith break; 130117ab2063SBarry Smith } 130217ab2063SBarry Smith } 130317ab2063SBarry Smith } 1304fdc842d1SBarry Smith ierr = VecRestoreArrayWrite(v,&x);CHKERRQ(ierr); 13053a40ed3dSBarry Smith PetscFunctionReturn(0); 130617ab2063SBarry Smith } 130717ab2063SBarry Smith 1308c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 1309dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy) 131017ab2063SBarry Smith { 1311416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1312d9ca1df4SBarry Smith PetscScalar *y; 1313d9ca1df4SBarry Smith const PetscScalar *x; 1314dfbe8321SBarry Smith PetscErrorCode ierr; 1315d0f46423SBarry Smith PetscInt m = A->rmap->n; 13165c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1317d9ca1df4SBarry Smith const MatScalar *v; 1318a77337e4SBarry 
Smith PetscScalar alpha; 1319d9ca1df4SBarry Smith PetscInt n,i,j; 1320d9ca1df4SBarry Smith const PetscInt *idx,*ii,*ridx=NULL; 13213447b6efSHong Zhang Mat_CompressedRow cprow = a->compressedrow; 1322ace3abfcSBarry Smith PetscBool usecprow = cprow.use; 13235c897100SBarry Smith #endif 132417ab2063SBarry Smith 13253a40ed3dSBarry Smith PetscFunctionBegin; 13262e8a6d31SBarry Smith if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);} 1327d9ca1df4SBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13281ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 13295c897100SBarry Smith 13305c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ) 1331bfeeae90SHong Zhang fortranmulttransposeaddaij_(&m,x,a->i,a->j,a->a,y); 13325c897100SBarry Smith #else 13333447b6efSHong Zhang if (usecprow) { 13343447b6efSHong Zhang m = cprow.nrows; 13353447b6efSHong Zhang ii = cprow.i; 13367b2bb3b9SHong Zhang ridx = cprow.rindex; 13373447b6efSHong Zhang } else { 13383447b6efSHong Zhang ii = a->i; 13393447b6efSHong Zhang } 134017ab2063SBarry Smith for (i=0; i<m; i++) { 13413447b6efSHong Zhang idx = a->j + ii[i]; 13423447b6efSHong Zhang v = a->a + ii[i]; 13433447b6efSHong Zhang n = ii[i+1] - ii[i]; 13443447b6efSHong Zhang if (usecprow) { 13457b2bb3b9SHong Zhang alpha = x[ridx[i]]; 13463447b6efSHong Zhang } else { 134717ab2063SBarry Smith alpha = x[i]; 13483447b6efSHong Zhang } 134904fbf559SBarry Smith for (j=0; j<n; j++) y[idx[j]] += alpha*v[j]; 135017ab2063SBarry Smith } 13515c897100SBarry Smith #endif 1352dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1353d9ca1df4SBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 13541ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 13553a40ed3dSBarry Smith PetscFunctionReturn(0); 135617ab2063SBarry Smith } 135717ab2063SBarry Smith 1358dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy) 13595c897100SBarry Smith { 1360dfbe8321SBarry Smith PetscErrorCode 
ierr; 13615c897100SBarry Smith 13625c897100SBarry Smith PetscFunctionBegin; 1363170fe5c8SBarry Smith ierr = VecSet(yy,0.0);CHKERRQ(ierr); 13645c897100SBarry Smith ierr = MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy);CHKERRQ(ierr); 13655c897100SBarry Smith PetscFunctionReturn(0); 13665c897100SBarry Smith } 13675c897100SBarry Smith 1368c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h> 136978b84d54SShri Abhyankar 1370dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy) 137117ab2063SBarry Smith { 1372416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1373d9fead3dSBarry Smith PetscScalar *y; 137454f21887SBarry Smith const PetscScalar *x; 137554f21887SBarry Smith const MatScalar *aa; 1376dfbe8321SBarry Smith PetscErrorCode ierr; 1377003131ecSBarry Smith PetscInt m=A->rmap->n; 13780298fd71SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 13797b083b7cSBarry Smith PetscInt n,i; 1380362ced78SSatish Balay PetscScalar sum; 1381ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 138217ab2063SBarry Smith 1383b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 138497952fefSHong Zhang #pragma disjoint(*x,*y,*aa) 1385fee21e36SBarry Smith #endif 1386fee21e36SBarry Smith 13873a40ed3dSBarry Smith PetscFunctionBegin; 13883649974fSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 13891ebc52fbSHong Zhang ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 1390416022c9SBarry Smith ii = a->i; 13914eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 1392580bdb30SBarry Smith ierr = PetscArrayzero(y,m);CHKERRQ(ierr); 139397952fefSHong Zhang m = a->compressedrow.nrows; 139497952fefSHong Zhang ii = a->compressedrow.i; 139597952fefSHong Zhang ridx = a->compressedrow.rindex; 139697952fefSHong Zhang for (i=0; i<m; i++) { 139797952fefSHong Zhang n = ii[i+1] - ii[i]; 139897952fefSHong Zhang aj = a->j + ii[i]; 139997952fefSHong Zhang aa = a->a + ii[i]; 140097952fefSHong Zhang sum = 0.0; 1401003131ecSBarry Smith 
PetscSparseDensePlusDot(sum,x,aa,aj,n); 1402003131ecSBarry Smith /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 140397952fefSHong Zhang y[*ridx++] = sum; 140497952fefSHong Zhang } 140597952fefSHong Zhang } else { /* do not use compressed row format */ 1406b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ) 14073d3eaba7SBarry Smith aj = a->j; 14083d3eaba7SBarry Smith aa = a->a; 1409b05257ddSBarry Smith fortranmultaij_(&m,x,ii,aj,aa,y); 1410b05257ddSBarry Smith #else 141117ab2063SBarry Smith for (i=0; i<m; i++) { 1412003131ecSBarry Smith n = ii[i+1] - ii[i]; 1413003131ecSBarry Smith aj = a->j + ii[i]; 1414003131ecSBarry Smith aa = a->a + ii[i]; 141517ab2063SBarry Smith sum = 0.0; 1416003131ecSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 141717ab2063SBarry Smith y[i] = sum; 141817ab2063SBarry Smith } 14198d195f9aSBarry Smith #endif 1420b05257ddSBarry Smith } 14217b083b7cSBarry Smith ierr = PetscLogFlops(2.0*a->nz - a->nonzerorowcnt);CHKERRQ(ierr); 14223649974fSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 14231ebc52fbSHong Zhang ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 14243a40ed3dSBarry Smith PetscFunctionReturn(0); 142517ab2063SBarry Smith } 142617ab2063SBarry Smith 1427b434eb95SMatthew G. Knepley PetscErrorCode MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy) 1428b434eb95SMatthew G. Knepley { 1429b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1430b434eb95SMatthew G. Knepley PetscScalar *y; 1431b434eb95SMatthew G. Knepley const PetscScalar *x; 1432b434eb95SMatthew G. Knepley const MatScalar *aa; 1433b434eb95SMatthew G. Knepley PetscErrorCode ierr; 1434b434eb95SMatthew G. Knepley PetscInt m=A->rmap->n; 1435b434eb95SMatthew G. Knepley const PetscInt *aj,*ii,*ridx=NULL; 1436b434eb95SMatthew G. Knepley PetscInt n,i,nonzerorow=0; 1437b434eb95SMatthew G. Knepley PetscScalar sum; 1438b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1439b434eb95SMatthew G. Knepley 1440b434eb95SMatthew G. 
Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT) 1441b434eb95SMatthew G. Knepley #pragma disjoint(*x,*y,*aa) 1442b434eb95SMatthew G. Knepley #endif 1443b434eb95SMatthew G. Knepley 1444b434eb95SMatthew G. Knepley PetscFunctionBegin; 1445b434eb95SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1446b434eb95SMatthew G. Knepley ierr = VecGetArray(yy,&y);CHKERRQ(ierr); 1447b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1448b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1449b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1450b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1451b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1452b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1453b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1454b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1455b434eb95SMatthew G. Knepley sum = 0.0; 1456b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1457b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1458b434eb95SMatthew G. Knepley /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */ 1459b434eb95SMatthew G. Knepley y[*ridx++] = sum; 1460b434eb95SMatthew G. Knepley } 1461b434eb95SMatthew G. Knepley } else { /* do not use compressed row format */ 14623d3eaba7SBarry Smith ii = a->i; 1463b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1464b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1465b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1466b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1467b434eb95SMatthew G. Knepley sum = 0.0; 1468b434eb95SMatthew G. Knepley nonzerorow += (n>0); 1469b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1470b434eb95SMatthew G. Knepley y[i] = sum; 1471b434eb95SMatthew G. Knepley } 1472b434eb95SMatthew G. Knepley } 1473b434eb95SMatthew G. Knepley ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr); 1474b434eb95SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1475b434eb95SMatthew G. 
Knepley ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr); 1476b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1477b434eb95SMatthew G. Knepley } 1478b434eb95SMatthew G. Knepley 1479b434eb95SMatthew G. Knepley PetscErrorCode MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 1480b434eb95SMatthew G. Knepley { 1481b434eb95SMatthew G. Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1482b434eb95SMatthew G. Knepley PetscScalar *y,*z; 1483b434eb95SMatthew G. Knepley const PetscScalar *x; 1484b434eb95SMatthew G. Knepley const MatScalar *aa; 1485b434eb95SMatthew G. Knepley PetscErrorCode ierr; 1486b434eb95SMatthew G. Knepley PetscInt m = A->rmap->n,*aj,*ii; 1487b434eb95SMatthew G. Knepley PetscInt n,i,*ridx=NULL; 1488b434eb95SMatthew G. Knepley PetscScalar sum; 1489b434eb95SMatthew G. Knepley PetscBool usecprow=a->compressedrow.use; 1490b434eb95SMatthew G. Knepley 1491b434eb95SMatthew G. Knepley PetscFunctionBegin; 1492b434eb95SMatthew G. Knepley ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1493d9ca1df4SBarry Smith ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 1494b434eb95SMatthew G. Knepley if (usecprow) { /* use compressed row format */ 1495b434eb95SMatthew G. Knepley if (zz != yy) { 1496580bdb30SBarry Smith ierr = PetscArraycpy(z,y,m);CHKERRQ(ierr); 1497b434eb95SMatthew G. Knepley } 1498b434eb95SMatthew G. Knepley m = a->compressedrow.nrows; 1499b434eb95SMatthew G. Knepley ii = a->compressedrow.i; 1500b434eb95SMatthew G. Knepley ridx = a->compressedrow.rindex; 1501b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1502b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1503b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1504b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1505b434eb95SMatthew G. Knepley sum = y[*ridx]; 1506b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1507b434eb95SMatthew G. Knepley z[*ridx++] = sum; 1508b434eb95SMatthew G. Knepley } 1509b434eb95SMatthew G. 
Knepley } else { /* do not use compressed row format */ 15103d3eaba7SBarry Smith ii = a->i; 1511b434eb95SMatthew G. Knepley for (i=0; i<m; i++) { 1512b434eb95SMatthew G. Knepley n = ii[i+1] - ii[i]; 1513b434eb95SMatthew G. Knepley aj = a->j + ii[i]; 1514b434eb95SMatthew G. Knepley aa = a->a + ii[i]; 1515b434eb95SMatthew G. Knepley sum = y[i]; 1516b434eb95SMatthew G. Knepley PetscSparseDenseMaxDot(sum,x,aa,aj,n); 1517b434eb95SMatthew G. Knepley z[i] = sum; 1518b434eb95SMatthew G. Knepley } 1519b434eb95SMatthew G. Knepley } 1520b434eb95SMatthew G. Knepley ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1521b434eb95SMatthew G. Knepley ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1522d9ca1df4SBarry Smith ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 1523b434eb95SMatthew G. Knepley PetscFunctionReturn(0); 1524b434eb95SMatthew G. Knepley } 1525b434eb95SMatthew G. Knepley 1526c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h> 1527dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz) 152817ab2063SBarry Smith { 1529416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1530f15663dcSBarry Smith PetscScalar *y,*z; 1531f15663dcSBarry Smith const PetscScalar *x; 153254f21887SBarry Smith const MatScalar *aa; 1533dfbe8321SBarry Smith PetscErrorCode ierr; 1534d9ca1df4SBarry Smith const PetscInt *aj,*ii,*ridx=NULL; 1535d9ca1df4SBarry Smith PetscInt m = A->rmap->n,n,i; 1536362ced78SSatish Balay PetscScalar sum; 1537ace3abfcSBarry Smith PetscBool usecprow=a->compressedrow.use; 15389ea0dfa2SSatish Balay 15393a40ed3dSBarry Smith PetscFunctionBegin; 1540f15663dcSBarry Smith ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr); 1541d9ca1df4SBarry Smith ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 15424eb6d288SHong Zhang if (usecprow) { /* use compressed row format */ 15434eb6d288SHong Zhang if (zz != yy) { 1544580bdb30SBarry Smith ierr = PetscArraycpy(z,y,m);CHKERRQ(ierr); 15454eb6d288SHong Zhang } 154697952fefSHong 
Zhang m = a->compressedrow.nrows; 154797952fefSHong Zhang ii = a->compressedrow.i; 154897952fefSHong Zhang ridx = a->compressedrow.rindex; 154997952fefSHong Zhang for (i=0; i<m; i++) { 155097952fefSHong Zhang n = ii[i+1] - ii[i]; 155197952fefSHong Zhang aj = a->j + ii[i]; 155297952fefSHong Zhang aa = a->a + ii[i]; 155397952fefSHong Zhang sum = y[*ridx]; 1554f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 155597952fefSHong Zhang z[*ridx++] = sum; 155697952fefSHong Zhang } 155797952fefSHong Zhang } else { /* do not use compressed row format */ 15583d3eaba7SBarry Smith ii = a->i; 1559f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ) 15603d3eaba7SBarry Smith aj = a->j; 15613d3eaba7SBarry Smith aa = a->a; 1562f15663dcSBarry Smith fortranmultaddaij_(&m,x,ii,aj,aa,y,z); 1563f15663dcSBarry Smith #else 156417ab2063SBarry Smith for (i=0; i<m; i++) { 1565f15663dcSBarry Smith n = ii[i+1] - ii[i]; 1566f15663dcSBarry Smith aj = a->j + ii[i]; 1567f15663dcSBarry Smith aa = a->a + ii[i]; 156817ab2063SBarry Smith sum = y[i]; 1569f15663dcSBarry Smith PetscSparseDensePlusDot(sum,x,aa,aj,n); 157017ab2063SBarry Smith z[i] = sum; 157117ab2063SBarry Smith } 157202ab625aSSatish Balay #endif 1573f15663dcSBarry Smith } 1574dc0b31edSSatish Balay ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1575f15663dcSBarry Smith ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr); 1576d9ca1df4SBarry Smith ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr); 15773a40ed3dSBarry Smith PetscFunctionReturn(0); 157817ab2063SBarry Smith } 157917ab2063SBarry Smith 158017ab2063SBarry Smith /* 158117ab2063SBarry Smith Adds diagonal pointers to sparse matrix structure. 
158217ab2063SBarry Smith */ 1583dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A) 158417ab2063SBarry Smith { 1585416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 15866849ba73SBarry Smith PetscErrorCode ierr; 1587d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n; 158817ab2063SBarry Smith 15893a40ed3dSBarry Smith PetscFunctionBegin; 159009f38230SBarry Smith if (!a->diag) { 1591785e854fSJed Brown ierr = PetscMalloc1(m,&a->diag);CHKERRQ(ierr); 15923bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A, m*sizeof(PetscInt));CHKERRQ(ierr); 159309f38230SBarry Smith } 1594d0f46423SBarry Smith for (i=0; i<A->rmap->n; i++) { 159509f38230SBarry Smith a->diag[i] = a->i[i+1]; 1596bfeeae90SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 1597bfeeae90SHong Zhang if (a->j[j] == i) { 159809f38230SBarry Smith a->diag[i] = j; 159917ab2063SBarry Smith break; 160017ab2063SBarry Smith } 160117ab2063SBarry Smith } 160217ab2063SBarry Smith } 16033a40ed3dSBarry Smith PetscFunctionReturn(0); 160417ab2063SBarry Smith } 160517ab2063SBarry Smith 160661ecd0c6SBarry Smith PetscErrorCode MatShift_SeqAIJ(Mat A,PetscScalar v) 160761ecd0c6SBarry Smith { 160861ecd0c6SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 160961ecd0c6SBarry Smith const PetscInt *diag = (const PetscInt*)a->diag; 161061ecd0c6SBarry Smith const PetscInt *ii = (const PetscInt*) a->i; 161161ecd0c6SBarry Smith PetscInt i,*mdiag = NULL; 161261ecd0c6SBarry Smith PetscErrorCode ierr; 161361ecd0c6SBarry Smith PetscInt cnt = 0; /* how many diagonals are missing */ 161461ecd0c6SBarry Smith 161561ecd0c6SBarry Smith PetscFunctionBegin; 161661ecd0c6SBarry Smith if (!A->preallocated || !a->nz) { 161761ecd0c6SBarry Smith ierr = MatSeqAIJSetPreallocation(A,1,NULL);CHKERRQ(ierr); 161861ecd0c6SBarry Smith ierr = MatShift_Basic(A,v);CHKERRQ(ierr); 161961ecd0c6SBarry Smith PetscFunctionReturn(0); 162061ecd0c6SBarry Smith } 162161ecd0c6SBarry Smith 162261ecd0c6SBarry Smith if (a->diagonaldense) { 162361ecd0c6SBarry 
Smith cnt = 0; 162461ecd0c6SBarry Smith } else { 162561ecd0c6SBarry Smith ierr = PetscCalloc1(A->rmap->n,&mdiag);CHKERRQ(ierr); 162661ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 162761ecd0c6SBarry Smith if (diag[i] >= ii[i+1]) { 162861ecd0c6SBarry Smith cnt++; 162961ecd0c6SBarry Smith mdiag[i] = 1; 163061ecd0c6SBarry Smith } 163161ecd0c6SBarry Smith } 163261ecd0c6SBarry Smith } 163361ecd0c6SBarry Smith if (!cnt) { 163461ecd0c6SBarry Smith ierr = MatShift_Basic(A,v);CHKERRQ(ierr); 163561ecd0c6SBarry Smith } else { 1636b6f2aa54SBarry Smith PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */ 1637b6f2aa54SBarry Smith PetscInt *oldj = a->j, *oldi = a->i; 163861ecd0c6SBarry Smith PetscBool singlemalloc = a->singlemalloc,free_a = a->free_a,free_ij = a->free_ij; 163961ecd0c6SBarry Smith 164061ecd0c6SBarry Smith a->a = NULL; 164161ecd0c6SBarry Smith a->j = NULL; 164261ecd0c6SBarry Smith a->i = NULL; 164361ecd0c6SBarry Smith /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */ 164461ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 164561ecd0c6SBarry Smith a->imax[i] += mdiag[i]; 1646447d62f5SStefano Zampini a->imax[i] = PetscMin(a->imax[i],A->cmap->n); 164761ecd0c6SBarry Smith } 164861ecd0c6SBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,0,a->imax);CHKERRQ(ierr); 164961ecd0c6SBarry Smith 165061ecd0c6SBarry Smith /* copy old values into new matrix data structure */ 165161ecd0c6SBarry Smith for (i=0; i<A->rmap->n; i++) { 165261ecd0c6SBarry Smith ierr = MatSetValues(A,1,&i,a->imax[i] - mdiag[i],&oldj[oldi[i]],&olda[oldi[i]],ADD_VALUES);CHKERRQ(ierr); 1653447d62f5SStefano Zampini if (i < A->cmap->n) { 165461ecd0c6SBarry Smith ierr = MatSetValue(A,i,i,v,ADD_VALUES);CHKERRQ(ierr); 165561ecd0c6SBarry Smith } 1656447d62f5SStefano Zampini } 165761ecd0c6SBarry Smith ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 165861ecd0c6SBarry Smith ierr 
= MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 165961ecd0c6SBarry Smith if (singlemalloc) { 166061ecd0c6SBarry Smith ierr = PetscFree3(olda,oldj,oldi);CHKERRQ(ierr); 166161ecd0c6SBarry Smith } else { 166261ecd0c6SBarry Smith if (free_a) {ierr = PetscFree(olda);CHKERRQ(ierr);} 166361ecd0c6SBarry Smith if (free_ij) {ierr = PetscFree(oldj);CHKERRQ(ierr);} 166461ecd0c6SBarry Smith if (free_ij) {ierr = PetscFree(oldi);CHKERRQ(ierr);} 166561ecd0c6SBarry Smith } 166661ecd0c6SBarry Smith } 166761ecd0c6SBarry Smith ierr = PetscFree(mdiag);CHKERRQ(ierr); 166861ecd0c6SBarry Smith a->diagonaldense = PETSC_TRUE; 166961ecd0c6SBarry Smith PetscFunctionReturn(0); 167061ecd0c6SBarry Smith } 167161ecd0c6SBarry Smith 1672be5855fcSBarry Smith /* 1673be5855fcSBarry Smith Checks for missing diagonals 1674be5855fcSBarry Smith */ 1675ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool *missing,PetscInt *d) 1676be5855fcSBarry Smith { 1677be5855fcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 16787734d3b5SMatthew G. Knepley PetscInt *diag,*ii = a->i,i; 1679994fe344SLisandro Dalcin PetscErrorCode ierr; 1680be5855fcSBarry Smith 1681be5855fcSBarry Smith PetscFunctionBegin; 168209f38230SBarry Smith *missing = PETSC_FALSE; 16837734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 168409f38230SBarry Smith *missing = PETSC_TRUE; 168509f38230SBarry Smith if (d) *d = 0; 1686994fe344SLisandro Dalcin ierr = PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n");CHKERRQ(ierr); 168709f38230SBarry Smith } else { 168801445905SHong Zhang PetscInt n; 168901445905SHong Zhang n = PetscMin(A->rmap->n, A->cmap->n); 1690f1e2ffcdSBarry Smith diag = a->diag; 169101445905SHong Zhang for (i=0; i<n; i++) { 16927734d3b5SMatthew G. 
Knepley if (diag[i] >= ii[i+1]) { 169309f38230SBarry Smith *missing = PETSC_TRUE; 169409f38230SBarry Smith if (d) *d = i; 1695994fe344SLisandro Dalcin ierr = PetscInfo1(A,"Matrix is missing diagonal number %D\n",i);CHKERRQ(ierr); 1696358d2f5dSShri Abhyankar break; 169709f38230SBarry Smith } 1698be5855fcSBarry Smith } 1699be5855fcSBarry Smith } 1700be5855fcSBarry Smith PetscFunctionReturn(0); 1701be5855fcSBarry Smith } 1702be5855fcSBarry Smith 17030da83c2eSBarry Smith #include <petscblaslapack.h> 17040da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h> 17050da83c2eSBarry Smith 17060da83c2eSBarry Smith /* 17070da83c2eSBarry Smith Note that values is allocated externally by the PC and then passed into this routine 17080da83c2eSBarry Smith */ 17090da83c2eSBarry Smith PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt *bsizes,PetscScalar *diag) 17100da83c2eSBarry Smith { 17110da83c2eSBarry Smith PetscErrorCode ierr; 17120da83c2eSBarry Smith PetscInt n = A->rmap->n, i, ncnt = 0, *indx,j,bsizemax = 0,*v_pivots; 17130da83c2eSBarry Smith PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 17140da83c2eSBarry Smith const PetscReal shift = 0.0; 17150da83c2eSBarry Smith PetscInt ipvt[5]; 17160da83c2eSBarry Smith PetscScalar work[25],*v_work; 17170da83c2eSBarry Smith 17180da83c2eSBarry Smith PetscFunctionBegin; 17190da83c2eSBarry Smith allowzeropivot = PetscNot(A->erroriffailure); 17200da83c2eSBarry Smith for (i=0; i<nblocks; i++) ncnt += bsizes[i]; 17210da83c2eSBarry Smith if (ncnt != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Total blocksizes %D doesn't match number matrix rows %D",ncnt,n); 17220da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 17230da83c2eSBarry Smith bsizemax = PetscMax(bsizemax,bsizes[i]); 17240da83c2eSBarry Smith } 17250da83c2eSBarry Smith ierr = PetscMalloc1(bsizemax,&indx);CHKERRQ(ierr); 17260da83c2eSBarry Smith if (bsizemax > 7) { 17270da83c2eSBarry Smith ierr = 
PetscMalloc2(bsizemax,&v_work,bsizemax,&v_pivots);CHKERRQ(ierr); 17280da83c2eSBarry Smith } 17290da83c2eSBarry Smith ncnt = 0; 17300da83c2eSBarry Smith for (i=0; i<nblocks; i++) { 17310da83c2eSBarry Smith for (j=0; j<bsizes[i]; j++) indx[j] = ncnt+j; 17320da83c2eSBarry Smith ierr = MatGetValues(A,bsizes[i],indx,bsizes[i],indx,diag);CHKERRQ(ierr); 17330da83c2eSBarry Smith switch (bsizes[i]) { 17340da83c2eSBarry Smith case 1: 17350da83c2eSBarry Smith *diag = 1.0/(*diag); 17360da83c2eSBarry Smith break; 17370da83c2eSBarry Smith case 2: 17380da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17390da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17400da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr); 17410da83c2eSBarry Smith break; 17420da83c2eSBarry Smith case 3: 17430da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17440da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17450da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr); 17460da83c2eSBarry Smith break; 17470da83c2eSBarry Smith case 4: 17480da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17490da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17500da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr); 17510da83c2eSBarry Smith break; 17520da83c2eSBarry Smith case 5: 17530da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17540da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17550da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr); 17560da83c2eSBarry 
Smith break; 17570da83c2eSBarry Smith case 6: 17580da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17590da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17600da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr); 17610da83c2eSBarry Smith break; 17620da83c2eSBarry Smith case 7: 17630da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17640da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17650da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr); 17660da83c2eSBarry Smith break; 17670da83c2eSBarry Smith default: 17680da83c2eSBarry Smith ierr = PetscKernel_A_gets_inverse_A(bsizes[i],diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 17690da83c2eSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 17700da83c2eSBarry Smith ierr = PetscKernel_A_gets_transpose_A_N(diag,bsizes[i]);CHKERRQ(ierr); 17710da83c2eSBarry Smith } 17720da83c2eSBarry Smith ncnt += bsizes[i]; 17730da83c2eSBarry Smith diag += bsizes[i]*bsizes[i]; 17740da83c2eSBarry Smith } 17750da83c2eSBarry Smith if (bsizemax > 7) { 17760da83c2eSBarry Smith ierr = PetscFree2(v_work,v_pivots);CHKERRQ(ierr); 17770da83c2eSBarry Smith } 17780da83c2eSBarry Smith ierr = PetscFree(indx);CHKERRQ(ierr); 17790da83c2eSBarry Smith PetscFunctionReturn(0); 17800da83c2eSBarry Smith } 17810da83c2eSBarry Smith 1782422a814eSBarry Smith /* 1783422a814eSBarry Smith Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways 1784422a814eSBarry Smith */ 17857087cfbeSBarry Smith PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift) 178671f1c65dSBarry Smith { 178771f1c65dSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 178871f1c65dSBarry 
Smith PetscErrorCode ierr; 1789d0f46423SBarry Smith PetscInt i,*diag,m = A->rmap->n; 179054f21887SBarry Smith MatScalar *v = a->a; 179154f21887SBarry Smith PetscScalar *idiag,*mdiag; 179271f1c65dSBarry Smith 179371f1c65dSBarry Smith PetscFunctionBegin; 179471f1c65dSBarry Smith if (a->idiagvalid) PetscFunctionReturn(0); 179571f1c65dSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 179671f1c65dSBarry Smith diag = a->diag; 179771f1c65dSBarry Smith if (!a->idiag) { 1798dcca6d9dSJed Brown ierr = PetscMalloc3(m,&a->idiag,m,&a->mdiag,m,&a->ssor_work);CHKERRQ(ierr); 17993bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A, 3*m*sizeof(PetscScalar));CHKERRQ(ierr); 180071f1c65dSBarry Smith v = a->a; 180171f1c65dSBarry Smith } 180271f1c65dSBarry Smith mdiag = a->mdiag; 180371f1c65dSBarry Smith idiag = a->idiag; 180471f1c65dSBarry Smith 1805422a814eSBarry Smith if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) { 180671f1c65dSBarry Smith for (i=0; i<m; i++) { 180771f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 1808899639b0SHong Zhang if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */ 1809899639b0SHong Zhang if (PetscRealPart(fshift)) { 1810899639b0SHong Zhang ierr = PetscInfo1(A,"Zero diagonal on row %D\n",i);CHKERRQ(ierr); 18117b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 18127b6c816cSBarry Smith A->factorerror_zeropivot_value = 0.0; 18137b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 1814a6fa060aSHong Zhang } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %D",i); 1815899639b0SHong Zhang } 181671f1c65dSBarry Smith idiag[i] = 1.0/v[diag[i]]; 181771f1c65dSBarry Smith } 181871f1c65dSBarry Smith ierr = PetscLogFlops(m);CHKERRQ(ierr); 181971f1c65dSBarry Smith } else { 182071f1c65dSBarry Smith for (i=0; i<m; i++) { 182171f1c65dSBarry Smith mdiag[i] = v[diag[i]]; 182271f1c65dSBarry Smith idiag[i] = omega/(fshift + v[diag[i]]); 182371f1c65dSBarry Smith } 1824dc0b31edSSatish Balay ierr = 
PetscLogFlops(2.0*m);CHKERRQ(ierr); 182571f1c65dSBarry Smith } 182671f1c65dSBarry Smith a->idiagvalid = PETSC_TRUE; 182771f1c65dSBarry Smith PetscFunctionReturn(0); 182871f1c65dSBarry Smith } 182971f1c65dSBarry Smith 1830c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h> 183141f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx) 183217ab2063SBarry Smith { 1833416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 1834e6d1f457SBarry Smith PetscScalar *x,d,sum,*t,scale; 18353d3eaba7SBarry Smith const MatScalar *v,*idiag=0,*mdiag; 183654f21887SBarry Smith const PetscScalar *b, *bs,*xb, *ts; 1837dfbe8321SBarry Smith PetscErrorCode ierr; 18383d3eaba7SBarry Smith PetscInt n,m = A->rmap->n,i; 183997f1f81fSBarry Smith const PetscInt *idx,*diag; 184017ab2063SBarry Smith 18413a40ed3dSBarry Smith PetscFunctionBegin; 1842b965ef7fSBarry Smith its = its*lits; 184391723122SBarry Smith 184471f1c65dSBarry Smith if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */ 184571f1c65dSBarry Smith if (!a->idiagvalid) {ierr = MatInvertDiagonal_SeqAIJ(A,omega,fshift);CHKERRQ(ierr);} 184671f1c65dSBarry Smith a->fshift = fshift; 184771f1c65dSBarry Smith a->omega = omega; 1848ed480e8bSBarry Smith 184971f1c65dSBarry Smith diag = a->diag; 185071f1c65dSBarry Smith t = a->ssor_work; 1851ed480e8bSBarry Smith idiag = a->idiag; 185271f1c65dSBarry Smith mdiag = a->mdiag; 1853ed480e8bSBarry Smith 18541ebc52fbSHong Zhang ierr = VecGetArray(xx,&x);CHKERRQ(ierr); 18553649974fSBarry Smith ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr); 1856ed480e8bSBarry Smith /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */ 185717ab2063SBarry Smith if (flag == SOR_APPLY_UPPER) { 185817ab2063SBarry Smith /* apply (U + D/omega) to the vector */ 1859ed480e8bSBarry Smith bs = b; 186017ab2063SBarry 
Smith for (i=0; i<m; i++) { 186171f1c65dSBarry Smith d = fshift + mdiag[i]; 1862416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1863ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1864ed480e8bSBarry Smith v = a->a + diag[i] + 1; 186517ab2063SBarry Smith sum = b[i]*d/omega; 1866003131ecSBarry Smith PetscSparseDensePlusDot(sum,bs,v,idx,n); 186717ab2063SBarry Smith x[i] = sum; 186817ab2063SBarry Smith } 18691ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 18703649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1871efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 18723a40ed3dSBarry Smith PetscFunctionReturn(0); 187317ab2063SBarry Smith } 1874c783ea89SBarry Smith 18752205254eSKarl Rupp if (flag == SOR_APPLY_LOWER) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented"); 18762205254eSKarl Rupp else if (flag & SOR_EISENSTAT) { 18774c500f23SPierre Jolivet /* Let A = L + U + D; where L is lower triangular, 1878887ee2caSBarry Smith U is upper triangular, E = D/omega; This routine applies 187917ab2063SBarry Smith 188017ab2063SBarry Smith (L + E)^{-1} A (U + E)^{-1} 188117ab2063SBarry Smith 1882887ee2caSBarry Smith to a vector efficiently using Eisenstat's trick. 
188317ab2063SBarry Smith */ 188417ab2063SBarry Smith scale = (2.0/omega) - 1.0; 188517ab2063SBarry Smith 188617ab2063SBarry Smith /* x = (E + U)^{-1} b */ 188717ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1888416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1889ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1890ed480e8bSBarry Smith v = a->a + diag[i] + 1; 189117ab2063SBarry Smith sum = b[i]; 1892e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1893ed480e8bSBarry Smith x[i] = sum*idiag[i]; 189417ab2063SBarry Smith } 189517ab2063SBarry Smith 189617ab2063SBarry Smith /* t = b - (2*E - D)x */ 1897416022c9SBarry Smith v = a->a; 18982205254eSKarl Rupp for (i=0; i<m; i++) t[i] = b[i] - scale*(v[*diag++])*x[i]; 189917ab2063SBarry Smith 190017ab2063SBarry Smith /* t = (E + L)^{-1}t */ 1901ed480e8bSBarry Smith ts = t; 1902416022c9SBarry Smith diag = a->diag; 190317ab2063SBarry Smith for (i=0; i<m; i++) { 1904416022c9SBarry Smith n = diag[i] - a->i[i]; 1905ed480e8bSBarry Smith idx = a->j + a->i[i]; 1906ed480e8bSBarry Smith v = a->a + a->i[i]; 190717ab2063SBarry Smith sum = t[i]; 1908003131ecSBarry Smith PetscSparseDenseMinusDot(sum,ts,v,idx,n); 1909ed480e8bSBarry Smith t[i] = sum*idiag[i]; 1910733d66baSBarry Smith /* x = x + t */ 1911733d66baSBarry Smith x[i] += t[i]; 191217ab2063SBarry Smith } 191317ab2063SBarry Smith 1914dc0b31edSSatish Balay ierr = PetscLogFlops(6.0*m-1 + 2.0*a->nz);CHKERRQ(ierr); 19151ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 19163649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 19173a40ed3dSBarry Smith PetscFunctionReturn(0); 191817ab2063SBarry Smith } 191917ab2063SBarry Smith if (flag & SOR_ZERO_INITIAL_GUESS) { 192017ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 192117ab2063SBarry Smith for (i=0; i<m; i++) { 1922416022c9SBarry Smith n = diag[i] - a->i[i]; 1923ed480e8bSBarry Smith idx = a->j + a->i[i]; 1924ed480e8bSBarry Smith v = a->a + a->i[i]; 
192517ab2063SBarry Smith sum = b[i]; 1926e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 19275c99c7daSBarry Smith t[i] = sum; 1928ed480e8bSBarry Smith x[i] = sum*idiag[i]; 192917ab2063SBarry Smith } 19305c99c7daSBarry Smith xb = t; 1931efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 19323a40ed3dSBarry Smith } else xb = b; 193317ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 193417ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1935416022c9SBarry Smith n = a->i[i+1] - diag[i] - 1; 1936ed480e8bSBarry Smith idx = a->j + diag[i] + 1; 1937ed480e8bSBarry Smith v = a->a + diag[i] + 1; 193817ab2063SBarry Smith sum = xb[i]; 1939e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 19405c99c7daSBarry Smith if (xb == b) { 1941ed480e8bSBarry Smith x[i] = sum*idiag[i]; 19425c99c7daSBarry Smith } else { 1943b19a5dc2SMark Adams x[i] = (1-omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 194417ab2063SBarry Smith } 19455c99c7daSBarry Smith } 1946b19a5dc2SMark Adams ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */ 194717ab2063SBarry Smith } 194817ab2063SBarry Smith its--; 194917ab2063SBarry Smith } 195017ab2063SBarry Smith while (its--) { 195117ab2063SBarry Smith if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) { 195217ab2063SBarry Smith for (i=0; i<m; i++) { 1953b19a5dc2SMark Adams /* lower */ 1954b19a5dc2SMark Adams n = diag[i] - a->i[i]; 1955ed480e8bSBarry Smith idx = a->j + a->i[i]; 1956ed480e8bSBarry Smith v = a->a + a->i[i]; 195717ab2063SBarry Smith sum = b[i]; 1958e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1959b19a5dc2SMark Adams t[i] = sum; /* save application of the lower-triangular part */ 1960b19a5dc2SMark Adams /* upper */ 1961b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 1962b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 1963b19a5dc2SMark Adams v = a->a + diag[i] + 1; 1964b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 
1965b19a5dc2SMark Adams x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 196617ab2063SBarry Smith } 1967b19a5dc2SMark Adams xb = t; 19689f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1969b19a5dc2SMark Adams } else xb = b; 197017ab2063SBarry Smith if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) { 197117ab2063SBarry Smith for (i=m-1; i>=0; i--) { 1972b19a5dc2SMark Adams sum = xb[i]; 1973b19a5dc2SMark Adams if (xb == b) { 1974b19a5dc2SMark Adams /* whole matrix (no checkpointing available) */ 1975416022c9SBarry Smith n = a->i[i+1] - a->i[i]; 1976ed480e8bSBarry Smith idx = a->j + a->i[i]; 1977ed480e8bSBarry Smith v = a->a + a->i[i]; 1978e6d1f457SBarry Smith PetscSparseDenseMinusDot(sum,x,v,idx,n); 1979ed480e8bSBarry Smith x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i]; 1980b19a5dc2SMark Adams } else { /* lower-triangular part has been saved, so only apply upper-triangular */ 1981b19a5dc2SMark Adams n = a->i[i+1] - diag[i] - 1; 1982b19a5dc2SMark Adams idx = a->j + diag[i] + 1; 1983b19a5dc2SMark Adams v = a->a + diag[i] + 1; 1984b19a5dc2SMark Adams PetscSparseDenseMinusDot(sum,x,v,idx,n); 1985b19a5dc2SMark Adams x[i] = (1. 
- omega)*x[i] + sum*idiag[i]; /* omega in idiag */ 198617ab2063SBarry Smith } 1987b19a5dc2SMark Adams } 1988b19a5dc2SMark Adams if (xb == b) { 19899f863219SBarry Smith ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr); 1990b19a5dc2SMark Adams } else { 1991b19a5dc2SMark Adams ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */ 1992b19a5dc2SMark Adams } 199317ab2063SBarry Smith } 199417ab2063SBarry Smith } 19951ebc52fbSHong Zhang ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr); 19963649974fSBarry Smith ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr); 1997365a8a9eSBarry Smith PetscFunctionReturn(0); 199817ab2063SBarry Smith } 199917ab2063SBarry Smith 20002af78befSBarry Smith 2001dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info) 200217ab2063SBarry Smith { 2003416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 20044e220ebcSLois Curfman McInnes 20053a40ed3dSBarry Smith PetscFunctionBegin; 20064e220ebcSLois Curfman McInnes info->block_size = 1.0; 20073966268fSBarry Smith info->nz_allocated = a->maxnz; 20083966268fSBarry Smith info->nz_used = a->nz; 20093966268fSBarry Smith info->nz_unneeded = (a->maxnz - a->nz); 20103966268fSBarry Smith info->assemblies = A->num_ass; 20113966268fSBarry Smith info->mallocs = A->info.mallocs; 20127adad957SLisandro Dalcin info->memory = ((PetscObject)A)->mem; 2013d5f3da31SBarry Smith if (A->factortype) { 20144e220ebcSLois Curfman McInnes info->fill_ratio_given = A->info.fill_ratio_given; 20154e220ebcSLois Curfman McInnes info->fill_ratio_needed = A->info.fill_ratio_needed; 20164e220ebcSLois Curfman McInnes info->factor_mallocs = A->info.factor_mallocs; 20174e220ebcSLois Curfman McInnes } else { 20184e220ebcSLois Curfman McInnes info->fill_ratio_given = 0; 20194e220ebcSLois Curfman McInnes info->fill_ratio_needed = 0; 20204e220ebcSLois Curfman McInnes info->factor_mallocs = 0; 20214e220ebcSLois Curfman McInnes } 20223a40ed3dSBarry Smith PetscFunctionReturn(0); 202317ab2063SBarry 
Smith } 202417ab2063SBarry Smith 20252b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 202617ab2063SBarry Smith { 2027416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2028c7da8527SEric Chamberland PetscInt i,m = A->rmap->n - 1; 20296849ba73SBarry Smith PetscErrorCode ierr; 203097b48c8fSBarry Smith const PetscScalar *xx; 203197b48c8fSBarry Smith PetscScalar *bb; 2032c7da8527SEric Chamberland PetscInt d = 0; 203317ab2063SBarry Smith 20343a40ed3dSBarry Smith PetscFunctionBegin; 203597b48c8fSBarry Smith if (x && b) { 203697b48c8fSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 203797b48c8fSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 203897b48c8fSBarry Smith for (i=0; i<N; i++) { 203997b48c8fSBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2040447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 204197b48c8fSBarry Smith bb[rows[i]] = diag*xx[rows[i]]; 204297b48c8fSBarry Smith } 204397b48c8fSBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 204497b48c8fSBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 204597b48c8fSBarry Smith } 204697b48c8fSBarry Smith 2047a9817697SBarry Smith if (a->keepnonzeropattern) { 2048f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2049e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2050580bdb30SBarry Smith ierr = PetscArrayzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]);CHKERRQ(ierr); 2051f1e2ffcdSBarry Smith } 2052f4df32b1SMatthew Knepley if (diag != 0.0) { 2053c7da8527SEric Chamberland for (i=0; i<N; i++) { 2054c7da8527SEric Chamberland d = rows[i]; 2055447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 2056c7da8527SEric Chamberland if (a->diag[d] >= a->i[d+1]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in the 
zeroed row %D",d); 2057c7da8527SEric Chamberland } 2058f1e2ffcdSBarry Smith for (i=0; i<N; i++) { 2059447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) continue; 2060f4df32b1SMatthew Knepley a->a[a->diag[rows[i]]] = diag; 2061f1e2ffcdSBarry Smith } 2062f1e2ffcdSBarry Smith } 2063f1e2ffcdSBarry Smith } else { 2064f4df32b1SMatthew Knepley if (diag != 0.0) { 206517ab2063SBarry Smith for (i=0; i<N; i++) { 2066e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 20677ae801bdSBarry Smith if (a->ilen[rows[i]] > 0) { 2068447d62f5SStefano Zampini if (rows[i] >= A->cmap->n) { 2069447d62f5SStefano Zampini a->ilen[rows[i]] = 0; 2070447d62f5SStefano Zampini } else { 2071416022c9SBarry Smith a->ilen[rows[i]] = 1; 2072f4df32b1SMatthew Knepley a->a[a->i[rows[i]]] = diag; 2073bfeeae90SHong Zhang a->j[a->i[rows[i]]] = rows[i]; 2074447d62f5SStefano Zampini } 2075447d62f5SStefano Zampini } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */ 2076f4df32b1SMatthew Knepley ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 207717ab2063SBarry Smith } 207817ab2063SBarry Smith } 20793a40ed3dSBarry Smith } else { 208017ab2063SBarry Smith for (i=0; i<N; i++) { 2081e32f2f54SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2082416022c9SBarry Smith a->ilen[rows[i]] = 0; 208317ab2063SBarry Smith } 208417ab2063SBarry Smith } 2085e56f5c9eSBarry Smith A->nonzerostate++; 2086f1e2ffcdSBarry Smith } 2087e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2088c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU; 2089e2cf4d64SStefano Zampini #endif 20904099cc6bSBarry Smith ierr = (*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20913a40ed3dSBarry Smith PetscFunctionReturn(0); 
209217ab2063SBarry Smith } 209317ab2063SBarry Smith 20946e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b) 20956e169961SBarry Smith { 20966e169961SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 20976e169961SBarry Smith PetscInt i,j,m = A->rmap->n - 1,d = 0; 20986e169961SBarry Smith PetscErrorCode ierr; 20992b40b63fSBarry Smith PetscBool missing,*zeroed,vecs = PETSC_FALSE; 21006e169961SBarry Smith const PetscScalar *xx; 21016e169961SBarry Smith PetscScalar *bb; 21026e169961SBarry Smith 21036e169961SBarry Smith PetscFunctionBegin; 21046e169961SBarry Smith if (x && b) { 21056e169961SBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 21066e169961SBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 21072b40b63fSBarry Smith vecs = PETSC_TRUE; 21086e169961SBarry Smith } 21091795a4d1SJed Brown ierr = PetscCalloc1(A->rmap->n,&zeroed);CHKERRQ(ierr); 21106e169961SBarry Smith for (i=0; i<N; i++) { 21116e169961SBarry Smith if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]); 2112580bdb30SBarry Smith ierr = PetscArrayzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]);CHKERRQ(ierr); 21132205254eSKarl Rupp 21146e169961SBarry Smith zeroed[rows[i]] = PETSC_TRUE; 21156e169961SBarry Smith } 21166e169961SBarry Smith for (i=0; i<A->rmap->n; i++) { 21176e169961SBarry Smith if (!zeroed[i]) { 21186e169961SBarry Smith for (j=a->i[i]; j<a->i[i+1]; j++) { 21194cf107fdSStefano Zampini if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) { 21202b40b63fSBarry Smith if (vecs) bb[i] -= a->a[j]*xx[a->j[j]]; 21216e169961SBarry Smith a->a[j] = 0.0; 21226e169961SBarry Smith } 21236e169961SBarry Smith } 21244cf107fdSStefano Zampini } else if (vecs && i < A->cmap->N) bb[i] = diag*xx[i]; 21256e169961SBarry Smith } 21266e169961SBarry Smith if (x && b) { 21276e169961SBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 21286e169961SBarry Smith ierr = 
VecRestoreArray(b,&bb);CHKERRQ(ierr); 21296e169961SBarry Smith } 21306e169961SBarry Smith ierr = PetscFree(zeroed);CHKERRQ(ierr); 21316e169961SBarry Smith if (diag != 0.0) { 21326e169961SBarry Smith ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr); 21331d5a398dSstefano_zampini if (missing) { 21341d5a398dSstefano_zampini for (i=0; i<N; i++) { 21354cf107fdSStefano Zampini if (rows[i] >= A->cmap->N) continue; 21364cf107fdSStefano Zampini if (a->nonew && rows[i] >= d) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D (%D)",d,rows[i]); 21371d5a398dSstefano_zampini ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr); 21381d5a398dSstefano_zampini } 21391d5a398dSstefano_zampini } else { 21406e169961SBarry Smith for (i=0; i<N; i++) { 21416e169961SBarry Smith a->a[a->diag[rows[i]]] = diag; 21426e169961SBarry Smith } 21436e169961SBarry Smith } 21441d5a398dSstefano_zampini } 2145e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2146c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU; 2147e2cf4d64SStefano Zampini #endif 21484099cc6bSBarry Smith ierr = (*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 21496e169961SBarry Smith PetscFunctionReturn(0); 21506e169961SBarry Smith } 21516e169961SBarry Smith 2152a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 215317ab2063SBarry Smith { 2154416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 215597f1f81fSBarry Smith PetscInt *itmp; 215617ab2063SBarry Smith 21573a40ed3dSBarry Smith PetscFunctionBegin; 2158e32f2f54SBarry Smith if (row < 0 || row >= A->rmap->n) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D out of range",row); 215917ab2063SBarry Smith 2160416022c9SBarry Smith *nz = a->i[row+1] - a->i[row]; 2161bfeeae90SHong Zhang if (v) *v = a->a + a->i[row]; 
216217ab2063SBarry Smith if (idx) { 2163bfeeae90SHong Zhang itmp = a->j + a->i[row]; 216426fbe8dcSKarl Rupp if (*nz) *idx = itmp; 216517ab2063SBarry Smith else *idx = 0; 216617ab2063SBarry Smith } 21673a40ed3dSBarry Smith PetscFunctionReturn(0); 216817ab2063SBarry Smith } 216917ab2063SBarry Smith 2170bfeeae90SHong Zhang /* remove this function? */ 2171a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 217217ab2063SBarry Smith { 21733a40ed3dSBarry Smith PetscFunctionBegin; 21743a40ed3dSBarry Smith PetscFunctionReturn(0); 217517ab2063SBarry Smith } 217617ab2063SBarry Smith 2177dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm) 217817ab2063SBarry Smith { 2179416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 218054f21887SBarry Smith MatScalar *v = a->a; 218136db0b34SBarry Smith PetscReal sum = 0.0; 21826849ba73SBarry Smith PetscErrorCode ierr; 218397f1f81fSBarry Smith PetscInt i,j; 218417ab2063SBarry Smith 21853a40ed3dSBarry Smith PetscFunctionBegin; 218617ab2063SBarry Smith if (type == NORM_FROBENIUS) { 2187570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16) 2188570b7f6dSBarry Smith PetscBLASInt one = 1,nz = a->nz; 2189570b7f6dSBarry Smith *nrm = BLASnrm2_(&nz,v,&one); 2190570b7f6dSBarry Smith #else 2191416022c9SBarry Smith for (i=0; i<a->nz; i++) { 219236db0b34SBarry Smith sum += PetscRealPart(PetscConj(*v)*(*v)); v++; 219317ab2063SBarry Smith } 21948f1a2a5eSBarry Smith *nrm = PetscSqrtReal(sum); 2195570b7f6dSBarry Smith #endif 219651f70360SJed Brown ierr = PetscLogFlops(2*a->nz);CHKERRQ(ierr); 21973a40ed3dSBarry Smith } else if (type == NORM_1) { 219836db0b34SBarry Smith PetscReal *tmp; 219997f1f81fSBarry Smith PetscInt *jj = a->j; 22001795a4d1SJed Brown ierr = PetscCalloc1(A->cmap->n+1,&tmp);CHKERRQ(ierr); 2201064f8208SBarry Smith *nrm = 0.0; 2202416022c9SBarry Smith for (j=0; j<a->nz; j++) { 2203bfeeae90SHong Zhang tmp[*jj++] += 
PetscAbsScalar(*v); v++; 220417ab2063SBarry Smith } 2205d0f46423SBarry Smith for (j=0; j<A->cmap->n; j++) { 2206064f8208SBarry Smith if (tmp[j] > *nrm) *nrm = tmp[j]; 220717ab2063SBarry Smith } 2208606d414cSSatish Balay ierr = PetscFree(tmp);CHKERRQ(ierr); 220951f70360SJed Brown ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr); 22103a40ed3dSBarry Smith } else if (type == NORM_INFINITY) { 2211064f8208SBarry Smith *nrm = 0.0; 2212d0f46423SBarry Smith for (j=0; j<A->rmap->n; j++) { 2213bfeeae90SHong Zhang v = a->a + a->i[j]; 221417ab2063SBarry Smith sum = 0.0; 2215416022c9SBarry Smith for (i=0; i<a->i[j+1]-a->i[j]; i++) { 2216cddf8d76SBarry Smith sum += PetscAbsScalar(*v); v++; 221717ab2063SBarry Smith } 2218064f8208SBarry Smith if (sum > *nrm) *nrm = sum; 221917ab2063SBarry Smith } 222051f70360SJed Brown ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr); 2221f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm"); 22223a40ed3dSBarry Smith PetscFunctionReturn(0); 222317ab2063SBarry Smith } 222417ab2063SBarry Smith 22254e938277SHong Zhang /* Merged from MatGetSymbolicTranspose_SeqAIJ() - replace MatGetSymbolicTranspose_SeqAIJ()? 
*/ 22264e938277SHong Zhang PetscErrorCode MatTransposeSymbolic_SeqAIJ(Mat A,Mat *B) 22274e938277SHong Zhang { 22284e938277SHong Zhang PetscErrorCode ierr; 22294e938277SHong Zhang PetscInt i,j,anzj; 22304e938277SHong Zhang Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data,*b; 22314e938277SHong Zhang PetscInt an=A->cmap->N,am=A->rmap->N; 22324e938277SHong Zhang PetscInt *ati,*atj,*atfill,*ai=a->i,*aj=a->j; 22334e938277SHong Zhang 22344e938277SHong Zhang PetscFunctionBegin; 22354e938277SHong Zhang /* Allocate space for symbolic transpose info and work array */ 2236854ce69bSBarry Smith ierr = PetscCalloc1(an+1,&ati);CHKERRQ(ierr); 2237785e854fSJed Brown ierr = PetscMalloc1(ai[am],&atj);CHKERRQ(ierr); 2238785e854fSJed Brown ierr = PetscMalloc1(an,&atfill);CHKERRQ(ierr); 22394e938277SHong Zhang 22404e938277SHong Zhang /* Walk through aj and count ## of non-zeros in each row of A^T. */ 22414e938277SHong Zhang /* Note: offset by 1 for fast conversion into csr format. */ 224226fbe8dcSKarl Rupp for (i=0;i<ai[am];i++) ati[aj[i]+1] += 1; 22434e938277SHong Zhang /* Form ati for csr format of A^T. */ 224426fbe8dcSKarl Rupp for (i=0;i<an;i++) ati[i+1] += ati[i]; 22454e938277SHong Zhang 22464e938277SHong Zhang /* Copy ati into atfill so we have locations of the next free space in atj */ 2247580bdb30SBarry Smith ierr = PetscArraycpy(atfill,ati,an);CHKERRQ(ierr); 22484e938277SHong Zhang 22494e938277SHong Zhang /* Walk through A row-wise and mark nonzero entries of A^T. */ 22504e938277SHong Zhang for (i=0;i<am;i++) { 22514e938277SHong Zhang anzj = ai[i+1] - ai[i]; 22524e938277SHong Zhang for (j=0;j<anzj;j++) { 22534e938277SHong Zhang atj[atfill[*aj]] = i; 22544e938277SHong Zhang atfill[*aj++] += 1; 22554e938277SHong Zhang } 22564e938277SHong Zhang } 22574e938277SHong Zhang 22584e938277SHong Zhang /* Clean up temporary space and complete requests. 
*/ 22594e938277SHong Zhang ierr = PetscFree(atfill);CHKERRQ(ierr); 2260ce94432eSBarry Smith ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),an,am,ati,atj,NULL,B);CHKERRQ(ierr); 226133d57670SJed Brown ierr = MatSetBlockSizes(*B,PetscAbs(A->cmap->bs),PetscAbs(A->rmap->bs));CHKERRQ(ierr); 2262b5bb3eecSMark Adams ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2263a2f3521dSMark F. Adams 22644e938277SHong Zhang b = (Mat_SeqAIJ*)((*B)->data); 22654e938277SHong Zhang b->free_a = PETSC_FALSE; 22664e938277SHong Zhang b->free_ij = PETSC_TRUE; 22674e938277SHong Zhang b->nonew = 0; 22684e938277SHong Zhang PetscFunctionReturn(0); 22694e938277SHong Zhang } 22704e938277SHong Zhang 22717087cfbeSBarry Smith PetscErrorCode MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 2272cd0d46ebSvictorle { 22733d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 227454f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 227554f21887SBarry Smith MatScalar *va,*vb; 22766849ba73SBarry Smith PetscErrorCode ierr; 227797f1f81fSBarry Smith PetscInt ma,na,mb,nb, i; 2278cd0d46ebSvictorle 2279cd0d46ebSvictorle PetscFunctionBegin; 2280cd0d46ebSvictorle ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 2281cd0d46ebSvictorle ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 22825485867bSBarry Smith if (ma!=nb || na!=mb) { 22835485867bSBarry Smith *f = PETSC_FALSE; 22845485867bSBarry Smith PetscFunctionReturn(0); 22855485867bSBarry Smith } 2286cd0d46ebSvictorle aii = aij->i; bii = bij->i; 2287cd0d46ebSvictorle adx = aij->j; bdx = bij->j; 2288cd0d46ebSvictorle va = aij->a; vb = bij->a; 2289785e854fSJed Brown ierr = PetscMalloc1(ma,&aptr);CHKERRQ(ierr); 2290785e854fSJed Brown ierr = PetscMalloc1(mb,&bptr);CHKERRQ(ierr); 2291cd0d46ebSvictorle for (i=0; i<ma; i++) aptr[i] = aii[i]; 2292cd0d46ebSvictorle for (i=0; i<mb; i++) bptr[i] = bii[i]; 2293cd0d46ebSvictorle 2294cd0d46ebSvictorle *f = PETSC_TRUE; 2295cd0d46ebSvictorle for (i=0; 
i<ma; i++) { 2296cd0d46ebSvictorle while (aptr[i]<aii[i+1]) { 229797f1f81fSBarry Smith PetscInt idc,idr; 22985485867bSBarry Smith PetscScalar vc,vr; 2299cd0d46ebSvictorle /* column/row index/value */ 23005485867bSBarry Smith idc = adx[aptr[i]]; 23015485867bSBarry Smith idr = bdx[bptr[idc]]; 23025485867bSBarry Smith vc = va[aptr[i]]; 23035485867bSBarry Smith vr = vb[bptr[idc]]; 23045485867bSBarry Smith if (i!=idr || PetscAbsScalar(vc-vr) > tol) { 23055485867bSBarry Smith *f = PETSC_FALSE; 23065485867bSBarry Smith goto done; 2307cd0d46ebSvictorle } else { 23085485867bSBarry Smith aptr[i]++; 23095485867bSBarry Smith if (B || i!=idc) bptr[idc]++; 2310cd0d46ebSvictorle } 2311cd0d46ebSvictorle } 2312cd0d46ebSvictorle } 2313cd0d46ebSvictorle done: 2314cd0d46ebSvictorle ierr = PetscFree(aptr);CHKERRQ(ierr); 23153aeef889SHong Zhang ierr = PetscFree(bptr);CHKERRQ(ierr); 2316cd0d46ebSvictorle PetscFunctionReturn(0); 2317cd0d46ebSvictorle } 2318cd0d46ebSvictorle 23197087cfbeSBarry Smith PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool *f) 23201cbb95d3SBarry Smith { 23213d3eaba7SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data; 232254f21887SBarry Smith PetscInt *adx,*bdx,*aii,*bii,*aptr,*bptr; 232354f21887SBarry Smith MatScalar *va,*vb; 23241cbb95d3SBarry Smith PetscErrorCode ierr; 23251cbb95d3SBarry Smith PetscInt ma,na,mb,nb, i; 23261cbb95d3SBarry Smith 23271cbb95d3SBarry Smith PetscFunctionBegin; 23281cbb95d3SBarry Smith ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr); 23291cbb95d3SBarry Smith ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr); 23301cbb95d3SBarry Smith if (ma!=nb || na!=mb) { 23311cbb95d3SBarry Smith *f = PETSC_FALSE; 23321cbb95d3SBarry Smith PetscFunctionReturn(0); 23331cbb95d3SBarry Smith } 23341cbb95d3SBarry Smith aii = aij->i; bii = bij->i; 23351cbb95d3SBarry Smith adx = aij->j; bdx = bij->j; 23361cbb95d3SBarry Smith va = aij->a; vb = bij->a; 2337785e854fSJed Brown ierr = 
PetscMalloc1(ma,&aptr);CHKERRQ(ierr); 2338785e854fSJed Brown ierr = PetscMalloc1(mb,&bptr);CHKERRQ(ierr); 23391cbb95d3SBarry Smith for (i=0; i<ma; i++) aptr[i] = aii[i]; 23401cbb95d3SBarry Smith for (i=0; i<mb; i++) bptr[i] = bii[i]; 23411cbb95d3SBarry Smith 23421cbb95d3SBarry Smith *f = PETSC_TRUE; 23431cbb95d3SBarry Smith for (i=0; i<ma; i++) { 23441cbb95d3SBarry Smith while (aptr[i]<aii[i+1]) { 23451cbb95d3SBarry Smith PetscInt idc,idr; 23461cbb95d3SBarry Smith PetscScalar vc,vr; 23471cbb95d3SBarry Smith /* column/row index/value */ 23481cbb95d3SBarry Smith idc = adx[aptr[i]]; 23491cbb95d3SBarry Smith idr = bdx[bptr[idc]]; 23501cbb95d3SBarry Smith vc = va[aptr[i]]; 23511cbb95d3SBarry Smith vr = vb[bptr[idc]]; 23521cbb95d3SBarry Smith if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) > tol) { 23531cbb95d3SBarry Smith *f = PETSC_FALSE; 23541cbb95d3SBarry Smith goto done; 23551cbb95d3SBarry Smith } else { 23561cbb95d3SBarry Smith aptr[i]++; 23571cbb95d3SBarry Smith if (B || i!=idc) bptr[idc]++; 23581cbb95d3SBarry Smith } 23591cbb95d3SBarry Smith } 23601cbb95d3SBarry Smith } 23611cbb95d3SBarry Smith done: 23621cbb95d3SBarry Smith ierr = PetscFree(aptr);CHKERRQ(ierr); 23631cbb95d3SBarry Smith ierr = PetscFree(bptr);CHKERRQ(ierr); 23641cbb95d3SBarry Smith PetscFunctionReturn(0); 23651cbb95d3SBarry Smith } 23661cbb95d3SBarry Smith 2367ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 23689e29f15eSvictorle { 2369dfbe8321SBarry Smith PetscErrorCode ierr; 23706e111a19SKarl Rupp 23719e29f15eSvictorle PetscFunctionBegin; 23725485867bSBarry Smith ierr = MatIsTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 23739e29f15eSvictorle PetscFunctionReturn(0); 23749e29f15eSvictorle } 23759e29f15eSvictorle 2376ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool *f) 23771cbb95d3SBarry Smith { 23781cbb95d3SBarry Smith PetscErrorCode ierr; 23796e111a19SKarl Rupp 23801cbb95d3SBarry Smith PetscFunctionBegin; 
23811cbb95d3SBarry Smith ierr = MatIsHermitianTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr); 23821cbb95d3SBarry Smith PetscFunctionReturn(0); 23831cbb95d3SBarry Smith } 23841cbb95d3SBarry Smith 2385dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr) 238617ab2063SBarry Smith { 2387416022c9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2388fff8e43fSBarry Smith const PetscScalar *l,*r; 2389fff8e43fSBarry Smith PetscScalar x; 239054f21887SBarry Smith MatScalar *v; 2391dfbe8321SBarry Smith PetscErrorCode ierr; 2392fff8e43fSBarry Smith PetscInt i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz; 2393fff8e43fSBarry Smith const PetscInt *jj; 239417ab2063SBarry Smith 23953a40ed3dSBarry Smith PetscFunctionBegin; 239617ab2063SBarry Smith if (ll) { 23973ea7c6a1SSatish Balay /* The local size is used so that VecMPI can be passed to this routine 23983ea7c6a1SSatish Balay by MatDiagonalScale_MPIAIJ */ 2399e1311b90SBarry Smith ierr = VecGetLocalSize(ll,&m);CHKERRQ(ierr); 2400e32f2f54SBarry Smith if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length"); 2401fff8e43fSBarry Smith ierr = VecGetArrayRead(ll,&l);CHKERRQ(ierr); 2402416022c9SBarry Smith v = a->a; 240317ab2063SBarry Smith for (i=0; i<m; i++) { 240417ab2063SBarry Smith x = l[i]; 2405416022c9SBarry Smith M = a->i[i+1] - a->i[i]; 24062205254eSKarl Rupp for (j=0; j<M; j++) (*v++) *= x; 240717ab2063SBarry Smith } 2408fff8e43fSBarry Smith ierr = VecRestoreArrayRead(ll,&l);CHKERRQ(ierr); 2409efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 241017ab2063SBarry Smith } 241117ab2063SBarry Smith if (rr) { 2412e1311b90SBarry Smith ierr = VecGetLocalSize(rr,&n);CHKERRQ(ierr); 2413e32f2f54SBarry Smith if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length"); 2414fff8e43fSBarry Smith ierr = VecGetArrayRead(rr,&r);CHKERRQ(ierr); 2415416022c9SBarry Smith v = a->a; jj = a->j; 24162205254eSKarl Rupp for (i=0; i<nz; i++) 
(*v++) *= r[*jj++]; 2417fff8e43fSBarry Smith ierr = VecRestoreArrayRead(rr,&r);CHKERRQ(ierr); 2418efee365bSSatish Balay ierr = PetscLogFlops(nz);CHKERRQ(ierr); 241917ab2063SBarry Smith } 2420acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr); 2421e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2422c70f7ee4SJunchao Zhang if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU; 2423e2cf4d64SStefano Zampini #endif 24243a40ed3dSBarry Smith PetscFunctionReturn(0); 242517ab2063SBarry Smith } 242617ab2063SBarry Smith 24277dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B) 242817ab2063SBarry Smith { 2429db02288aSLois Curfman McInnes Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*c; 24306849ba73SBarry Smith PetscErrorCode ierr; 2431d0f46423SBarry Smith PetscInt *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens; 243297f1f81fSBarry Smith PetscInt row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi; 24335d0c19d7SBarry Smith const PetscInt *irow,*icol; 24345d0c19d7SBarry Smith PetscInt nrows,ncols; 243597f1f81fSBarry Smith PetscInt *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen; 243654f21887SBarry Smith MatScalar *a_new,*mat_a; 2437416022c9SBarry Smith Mat C; 2438cdc6f3adSToby Isaac PetscBool stride; 243917ab2063SBarry Smith 24403a40ed3dSBarry Smith PetscFunctionBegin; 244199141d43SSatish Balay 244217ab2063SBarry Smith ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr); 2443b9b97703SBarry Smith ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr); 2444b9b97703SBarry Smith ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 244517ab2063SBarry Smith 2446251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&stride);CHKERRQ(ierr); 2447ff718158SBarry Smith if (stride) { 2448ff718158SBarry Smith ierr = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr); 2449ff718158SBarry Smith } else { 
2450ff718158SBarry Smith first = 0; 2451ff718158SBarry Smith step = 0; 2452ff718158SBarry Smith } 2453fee21e36SBarry Smith if (stride && step == 1) { 245402834360SBarry Smith /* special case of contiguous rows */ 2455dcca6d9dSJed Brown ierr = PetscMalloc2(nrows,&lens,nrows,&starts);CHKERRQ(ierr); 245602834360SBarry Smith /* loop over new rows determining lens and starting points */ 245702834360SBarry Smith for (i=0; i<nrows; i++) { 2458bfeeae90SHong Zhang kstart = ai[irow[i]]; 2459a2744918SBarry Smith kend = kstart + ailen[irow[i]]; 2460a91a9bebSLisandro Dalcin starts[i] = kstart; 246102834360SBarry Smith for (k=kstart; k<kend; k++) { 2462bfeeae90SHong Zhang if (aj[k] >= first) { 246302834360SBarry Smith starts[i] = k; 246402834360SBarry Smith break; 246502834360SBarry Smith } 246602834360SBarry Smith } 2467a2744918SBarry Smith sum = 0; 246802834360SBarry Smith while (k < kend) { 2469bfeeae90SHong Zhang if (aj[k++] >= first+ncols) break; 2470a2744918SBarry Smith sum++; 247102834360SBarry Smith } 2472a2744918SBarry Smith lens[i] = sum; 247302834360SBarry Smith } 247402834360SBarry Smith /* create submatrix */ 2475cddf8d76SBarry Smith if (scall == MAT_REUSE_MATRIX) { 247697f1f81fSBarry Smith PetscInt n_cols,n_rows; 247708480c60SBarry Smith ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr); 2478e32f2f54SBarry Smith if (n_rows != nrows || n_cols != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size"); 2479d8ced48eSBarry Smith ierr = MatZeroEntries(*B);CHKERRQ(ierr); 248008480c60SBarry Smith C = *B; 24813a40ed3dSBarry Smith } else { 24823bef6203SJed Brown PetscInt rbs,cbs; 2483ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2484f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 24853bef6203SJed Brown ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr); 24863bef6203SJed Brown ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr); 24873bef6203SJed Brown ierr 
= MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr); 24887adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2489ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 249008480c60SBarry Smith } 2491db02288aSLois Curfman McInnes c = (Mat_SeqAIJ*)C->data; 2492db02288aSLois Curfman McInnes 249302834360SBarry Smith /* loop over rows inserting into submatrix */ 2494db02288aSLois Curfman McInnes a_new = c->a; 2495db02288aSLois Curfman McInnes j_new = c->j; 2496db02288aSLois Curfman McInnes i_new = c->i; 2497bfeeae90SHong Zhang 249802834360SBarry Smith for (i=0; i<nrows; i++) { 2499a2744918SBarry Smith ii = starts[i]; 2500a2744918SBarry Smith lensi = lens[i]; 2501a2744918SBarry Smith for (k=0; k<lensi; k++) { 2502a2744918SBarry Smith *j_new++ = aj[ii+k] - first; 250302834360SBarry Smith } 2504580bdb30SBarry Smith ierr = PetscArraycpy(a_new,a->a + starts[i],lensi);CHKERRQ(ierr); 2505a2744918SBarry Smith a_new += lensi; 2506a2744918SBarry Smith i_new[i+1] = i_new[i] + lensi; 2507a2744918SBarry Smith c->ilen[i] = lensi; 250802834360SBarry Smith } 25090e83c824SBarry Smith ierr = PetscFree2(lens,starts);CHKERRQ(ierr); 25103a40ed3dSBarry Smith } else { 251102834360SBarry Smith ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr); 25121795a4d1SJed Brown ierr = PetscCalloc1(oldcols,&smap);CHKERRQ(ierr); 2513854ce69bSBarry Smith ierr = PetscMalloc1(1+nrows,&lens);CHKERRQ(ierr); 25144dcab191SBarry Smith for (i=0; i<ncols; i++) { 2515d9ef940eSSatish Balay if (PetscUnlikelyDebug(icol[i] >= oldcols)) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%D] %D >= A->cmap->n %D",i,icol[i],oldcols); 25164dcab191SBarry Smith smap[icol[i]] = i+1; 25174dcab191SBarry Smith } 25184dcab191SBarry Smith 251902834360SBarry Smith /* determine lens of each row */ 252002834360SBarry Smith for (i=0; i<nrows; i++) { 2521bfeeae90SHong Zhang kstart = ai[irow[i]]; 252202834360SBarry Smith kend = kstart + 
a->ilen[irow[i]]; 252302834360SBarry Smith lens[i] = 0; 252402834360SBarry Smith for (k=kstart; k<kend; k++) { 2525bfeeae90SHong Zhang if (smap[aj[k]]) { 252602834360SBarry Smith lens[i]++; 252702834360SBarry Smith } 252802834360SBarry Smith } 252902834360SBarry Smith } 253017ab2063SBarry Smith /* Create and fill new matrix */ 2531a2744918SBarry Smith if (scall == MAT_REUSE_MATRIX) { 2532ace3abfcSBarry Smith PetscBool equal; 25330f5bd95cSBarry Smith 253499141d43SSatish Balay c = (Mat_SeqAIJ*)((*B)->data); 2535e32f2f54SBarry Smith if ((*B)->rmap->n != nrows || (*B)->cmap->n != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size"); 2536580bdb30SBarry Smith ierr = PetscArraycmp(c->ilen,lens,(*B)->rmap->n,&equal);CHKERRQ(ierr); 2537f23aa3ddSBarry Smith if (!equal) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros"); 2538580bdb30SBarry Smith ierr = PetscArrayzero(c->ilen,(*B)->rmap->n);CHKERRQ(ierr); 253908480c60SBarry Smith C = *B; 25403a40ed3dSBarry Smith } else { 25413bef6203SJed Brown PetscInt rbs,cbs; 2542ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2543f69a0ea3SMatthew Knepley ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 25443bef6203SJed Brown ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr); 25453bef6203SJed Brown ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr); 25463bef6203SJed Brown ierr = MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr); 25477adad957SLisandro Dalcin ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr); 2548ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr); 254908480c60SBarry Smith } 255099141d43SSatish Balay c = (Mat_SeqAIJ*)(C->data); 255117ab2063SBarry Smith for (i=0; i<nrows; i++) { 255299141d43SSatish Balay row = irow[i]; 2553bfeeae90SHong Zhang kstart = ai[row]; 255499141d43SSatish Balay kend = kstart + a->ilen[row]; 2555bfeeae90SHong Zhang mat_i = c->i[i]; 
255699141d43SSatish Balay mat_j = c->j + mat_i; 255799141d43SSatish Balay mat_a = c->a + mat_i; 255899141d43SSatish Balay mat_ilen = c->ilen + i; 255917ab2063SBarry Smith for (k=kstart; k<kend; k++) { 2560bfeeae90SHong Zhang if ((tcol=smap[a->j[k]])) { 2561ed480e8bSBarry Smith *mat_j++ = tcol - 1; 256299141d43SSatish Balay *mat_a++ = a->a[k]; 256399141d43SSatish Balay (*mat_ilen)++; 256499141d43SSatish Balay 256517ab2063SBarry Smith } 256617ab2063SBarry Smith } 256717ab2063SBarry Smith } 256802834360SBarry Smith /* Free work space */ 256902834360SBarry Smith ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr); 2570606d414cSSatish Balay ierr = PetscFree(smap);CHKERRQ(ierr); 2571606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 2572cdc6f3adSToby Isaac /* sort */ 2573cdc6f3adSToby Isaac for (i = 0; i < nrows; i++) { 2574cdc6f3adSToby Isaac PetscInt ilen; 2575cdc6f3adSToby Isaac 2576cdc6f3adSToby Isaac mat_i = c->i[i]; 2577cdc6f3adSToby Isaac mat_j = c->j + mat_i; 2578cdc6f3adSToby Isaac mat_a = c->a + mat_i; 2579cdc6f3adSToby Isaac ilen = c->ilen[i]; 2580390e1bf2SBarry Smith ierr = PetscSortIntWithScalarArray(ilen,mat_j,mat_a);CHKERRQ(ierr); 2581cdc6f3adSToby Isaac } 258202834360SBarry Smith } 2583305c6ccfSStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2584b470e4b4SRichard Tran Mills ierr = MatBindToCPU(C,A->boundtocpu);CHKERRQ(ierr); 2585305c6ccfSStefano Zampini #endif 25866d4a8577SBarry Smith ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 25876d4a8577SBarry Smith ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 258817ab2063SBarry Smith 258917ab2063SBarry Smith ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr); 2590416022c9SBarry Smith *B = C; 25913a40ed3dSBarry Smith PetscFunctionReturn(0); 259217ab2063SBarry Smith } 259317ab2063SBarry Smith 2594fc08c53fSHong Zhang PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat *subMat) 259582d44351SHong Zhang { 259682d44351SHong 
Zhang PetscErrorCode ierr; 259782d44351SHong Zhang Mat B; 259882d44351SHong Zhang 259982d44351SHong Zhang PetscFunctionBegin; 2600c2d650bdSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 260182d44351SHong Zhang ierr = MatCreate(subComm,&B);CHKERRQ(ierr); 260282d44351SHong Zhang ierr = MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n);CHKERRQ(ierr); 260333d57670SJed Brown ierr = MatSetBlockSizesFromMats(B,mat,mat);CHKERRQ(ierr); 260482d44351SHong Zhang ierr = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr); 260582d44351SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE);CHKERRQ(ierr); 260682d44351SHong Zhang *subMat = B; 2607c2d650bdSHong Zhang } else { 2608c2d650bdSHong Zhang ierr = MatCopy_SeqAIJ(mat,*subMat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 2609c2d650bdSHong Zhang } 261082d44351SHong Zhang PetscFunctionReturn(0); 261182d44351SHong Zhang } 261282d44351SHong Zhang 26139a625307SHong Zhang PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info) 2614a871dcd8SBarry Smith { 261563b91edcSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2616dfbe8321SBarry Smith PetscErrorCode ierr; 261763b91edcSBarry Smith Mat outA; 2618ace3abfcSBarry Smith PetscBool row_identity,col_identity; 261963b91edcSBarry Smith 26203a40ed3dSBarry Smith PetscFunctionBegin; 2621e32f2f54SBarry Smith if (info->levels != 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu"); 26221df811f5SHong Zhang 2623b8a78c4aSBarry Smith ierr = ISIdentity(row,&row_identity);CHKERRQ(ierr); 2624b8a78c4aSBarry Smith ierr = ISIdentity(col,&col_identity);CHKERRQ(ierr); 2625a871dcd8SBarry Smith 262663b91edcSBarry Smith outA = inA; 2627d5f3da31SBarry Smith outA->factortype = MAT_FACTOR_LU; 2628f6224b95SHong Zhang ierr = PetscFree(inA->solvertype);CHKERRQ(ierr); 2629f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype);CHKERRQ(ierr); 26302205254eSKarl Rupp 2631c38d4ed2SBarry Smith ierr = 
PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 26326bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 26332205254eSKarl Rupp 2634c3122656SLisandro Dalcin a->row = row; 26352205254eSKarl Rupp 2636c38d4ed2SBarry Smith ierr = PetscObjectReference((PetscObject)col);CHKERRQ(ierr); 26376bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 26382205254eSKarl Rupp 2639c3122656SLisandro Dalcin a->col = col; 264063b91edcSBarry Smith 264136db0b34SBarry Smith /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */ 26426bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 26434c49b128SBarry Smith ierr = ISInvertPermutation(col,PETSC_DECIDE,&a->icol);CHKERRQ(ierr); 26443bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol);CHKERRQ(ierr); 2645f0ec6fceSSatish Balay 264694a9d846SBarry Smith if (!a->solve_work) { /* this matrix may have been factored before */ 2647854ce69bSBarry Smith ierr = PetscMalloc1(inA->rmap->n+1,&a->solve_work);CHKERRQ(ierr); 26483bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)inA, (inA->rmap->n+1)*sizeof(PetscScalar));CHKERRQ(ierr); 264994a9d846SBarry Smith } 265063b91edcSBarry Smith 2651f1e2ffcdSBarry Smith ierr = MatMarkDiagonal_SeqAIJ(inA);CHKERRQ(ierr); 2652137fb511SHong Zhang if (row_identity && col_identity) { 2653ad04f41aSHong Zhang ierr = MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info);CHKERRQ(ierr); 2654137fb511SHong Zhang } else { 2655719d5645SBarry Smith ierr = MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info);CHKERRQ(ierr); 2656137fb511SHong Zhang } 26573a40ed3dSBarry Smith PetscFunctionReturn(0); 2658a871dcd8SBarry Smith } 2659a871dcd8SBarry Smith 2660f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha) 2661f0b747eeSBarry Smith { 2662f0b747eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)inA->data; 2663f4df32b1SMatthew Knepley PetscScalar oalpha = alpha; 2664efee365bSSatish Balay PetscErrorCode ierr; 
2665c5df96a5SBarry Smith PetscBLASInt one = 1,bnz; 26663a40ed3dSBarry Smith 26673a40ed3dSBarry Smith PetscFunctionBegin; 2668c5df96a5SBarry Smith ierr = PetscBLASIntCast(a->nz,&bnz);CHKERRQ(ierr); 26698b83055fSJed Brown PetscStackCallBLAS("BLASscal",BLASscal_(&bnz,&oalpha,a->a,&one)); 2670efee365bSSatish Balay ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); 2671acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(inA);CHKERRQ(ierr); 2672e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2673c70f7ee4SJunchao Zhang if (inA->offloadmask != PETSC_OFFLOAD_UNALLOCATED) inA->offloadmask = PETSC_OFFLOAD_CPU; 2674e2cf4d64SStefano Zampini #endif 26753a40ed3dSBarry Smith PetscFunctionReturn(0); 2676f0b747eeSBarry Smith } 2677f0b747eeSBarry Smith 2678f68bb481SHong Zhang PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj) 267916b64355SHong Zhang { 268016b64355SHong Zhang PetscErrorCode ierr; 268116b64355SHong Zhang PetscInt i; 268216b64355SHong Zhang 268316b64355SHong Zhang PetscFunctionBegin; 268416b64355SHong Zhang if (!submatj->id) { /* delete data that are linked only to submats[id=0] */ 268516b64355SHong Zhang ierr = PetscFree4(submatj->sbuf1,submatj->ptr,submatj->tmp,submatj->ctr);CHKERRQ(ierr); 268616b64355SHong Zhang 268716b64355SHong Zhang for (i=0; i<submatj->nrqr; ++i) { 268816b64355SHong Zhang ierr = PetscFree(submatj->sbuf2[i]);CHKERRQ(ierr); 268916b64355SHong Zhang } 269016b64355SHong Zhang ierr = PetscFree3(submatj->sbuf2,submatj->req_size,submatj->req_source1);CHKERRQ(ierr); 269116b64355SHong Zhang 269216b64355SHong Zhang if (submatj->rbuf1) { 269316b64355SHong Zhang ierr = PetscFree(submatj->rbuf1[0]);CHKERRQ(ierr); 269416b64355SHong Zhang ierr = PetscFree(submatj->rbuf1);CHKERRQ(ierr); 269516b64355SHong Zhang } 269616b64355SHong Zhang 269716b64355SHong Zhang for (i=0; i<submatj->nrqs; ++i) { 269816b64355SHong Zhang ierr = PetscFree(submatj->rbuf3[i]);CHKERRQ(ierr); 269916b64355SHong Zhang } 270016b64355SHong Zhang 
ierr = PetscFree3(submatj->req_source2,submatj->rbuf2,submatj->rbuf3);CHKERRQ(ierr); 270116b64355SHong Zhang ierr = PetscFree(submatj->pa);CHKERRQ(ierr); 270216b64355SHong Zhang } 270316b64355SHong Zhang 270416b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 270516b64355SHong Zhang ierr = PetscTableDestroy((PetscTable*)&submatj->rmap);CHKERRQ(ierr); 270616b64355SHong Zhang if (submatj->cmap_loc) {ierr = PetscFree(submatj->cmap_loc);CHKERRQ(ierr);} 270716b64355SHong Zhang ierr = PetscFree(submatj->rmap_loc);CHKERRQ(ierr); 270816b64355SHong Zhang #else 270916b64355SHong Zhang ierr = PetscFree(submatj->rmap);CHKERRQ(ierr); 271016b64355SHong Zhang #endif 271116b64355SHong Zhang 271216b64355SHong Zhang if (!submatj->allcolumns) { 271316b64355SHong Zhang #if defined(PETSC_USE_CTABLE) 271416b64355SHong Zhang ierr = PetscTableDestroy((PetscTable*)&submatj->cmap);CHKERRQ(ierr); 271516b64355SHong Zhang #else 271616b64355SHong Zhang ierr = PetscFree(submatj->cmap);CHKERRQ(ierr); 271716b64355SHong Zhang #endif 271816b64355SHong Zhang } 271916b64355SHong Zhang ierr = PetscFree(submatj->row2proc);CHKERRQ(ierr); 272016b64355SHong Zhang 272116b64355SHong Zhang ierr = PetscFree(submatj);CHKERRQ(ierr); 272216b64355SHong Zhang PetscFunctionReturn(0); 272316b64355SHong Zhang } 272416b64355SHong Zhang 27250fb991dcSHong Zhang PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C) 272616b64355SHong Zhang { 272716b64355SHong Zhang PetscErrorCode ierr; 272816b64355SHong Zhang Mat_SeqAIJ *c = (Mat_SeqAIJ*)C->data; 27295c39f6d9SHong Zhang Mat_SubSppt *submatj = c->submatis1; 273016b64355SHong Zhang 273116b64355SHong Zhang PetscFunctionBegin; 273234136279SStefano Zampini ierr = (*submatj->destroy)(C);CHKERRQ(ierr); 2733f68bb481SHong Zhang ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr); 273416b64355SHong Zhang PetscFunctionReturn(0); 273516b64355SHong Zhang } 273616b64355SHong Zhang 27372d033e1fSHong Zhang PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat *mat[]) 27382d033e1fSHong 
Zhang { 27392d033e1fSHong Zhang PetscErrorCode ierr; 27402d033e1fSHong Zhang PetscInt i; 27410fb991dcSHong Zhang Mat C; 27420fb991dcSHong Zhang Mat_SeqAIJ *c; 27430fb991dcSHong Zhang Mat_SubSppt *submatj; 27442d033e1fSHong Zhang 27452d033e1fSHong Zhang PetscFunctionBegin; 27462d033e1fSHong Zhang for (i=0; i<n; i++) { 27470fb991dcSHong Zhang C = (*mat)[i]; 27480fb991dcSHong Zhang c = (Mat_SeqAIJ*)C->data; 27490fb991dcSHong Zhang submatj = c->submatis1; 27502d033e1fSHong Zhang if (submatj) { 2751682e4c99SStefano Zampini if (--((PetscObject)C)->refct <= 0) { 275234136279SStefano Zampini ierr = (*submatj->destroy)(C);CHKERRQ(ierr); 2753f68bb481SHong Zhang ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr); 275434136279SStefano Zampini ierr = PetscFree(C->defaultvectype);CHKERRQ(ierr); 27552d033e1fSHong Zhang ierr = PetscLayoutDestroy(&C->rmap);CHKERRQ(ierr); 27562d033e1fSHong Zhang ierr = PetscLayoutDestroy(&C->cmap);CHKERRQ(ierr); 27572d033e1fSHong Zhang ierr = PetscHeaderDestroy(&C);CHKERRQ(ierr); 2758682e4c99SStefano Zampini } 27592d033e1fSHong Zhang } else { 27602d033e1fSHong Zhang ierr = MatDestroy(&C);CHKERRQ(ierr); 27612d033e1fSHong Zhang } 27622d033e1fSHong Zhang } 276386e85357SHong Zhang 276463a75b2aSHong Zhang /* Destroy Dummy submatrices created for reuse */ 276563a75b2aSHong Zhang ierr = MatDestroySubMatrices_Dummy(n,mat);CHKERRQ(ierr); 276663a75b2aSHong Zhang 27672d033e1fSHong Zhang ierr = PetscFree(*mat);CHKERRQ(ierr); 27682d033e1fSHong Zhang PetscFunctionReturn(0); 27692d033e1fSHong Zhang } 27702d033e1fSHong Zhang 27717dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[]) 2772cddf8d76SBarry Smith { 2773dfbe8321SBarry Smith PetscErrorCode ierr; 277497f1f81fSBarry Smith PetscInt i; 2775cddf8d76SBarry Smith 27763a40ed3dSBarry Smith PetscFunctionBegin; 2777cddf8d76SBarry Smith if (scall == MAT_INITIAL_MATRIX) { 2778df750dc8SHong Zhang ierr = 
PetscCalloc1(n+1,B);CHKERRQ(ierr); 2779cddf8d76SBarry Smith } 2780cddf8d76SBarry Smith 2781cddf8d76SBarry Smith for (i=0; i<n; i++) { 27827dae84e0SHong Zhang ierr = MatCreateSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr); 2783cddf8d76SBarry Smith } 27843a40ed3dSBarry Smith PetscFunctionReturn(0); 2785cddf8d76SBarry Smith } 2786cddf8d76SBarry Smith 278797f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov) 27884dcbc457SBarry Smith { 2789e4d965acSSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 27906849ba73SBarry Smith PetscErrorCode ierr; 27915d0c19d7SBarry Smith PetscInt row,i,j,k,l,m,n,*nidx,isz,val; 27925d0c19d7SBarry Smith const PetscInt *idx; 279397f1f81fSBarry Smith PetscInt start,end,*ai,*aj; 2794f1af5d2fSBarry Smith PetscBT table; 2795bbd702dbSSatish Balay 27963a40ed3dSBarry Smith PetscFunctionBegin; 2797d0f46423SBarry Smith m = A->rmap->n; 2798e4d965acSSatish Balay ai = a->i; 2799bfeeae90SHong Zhang aj = a->j; 28008a047759SSatish Balay 2801e32f2f54SBarry Smith if (ov < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used"); 280206763907SSatish Balay 2803854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&nidx);CHKERRQ(ierr); 280453b8de81SBarry Smith ierr = PetscBTCreate(m,&table);CHKERRQ(ierr); 280506763907SSatish Balay 2806e4d965acSSatish Balay for (i=0; i<is_max; i++) { 2807b97fc60eSLois Curfman McInnes /* Initialize the two local arrays */ 2808e4d965acSSatish Balay isz = 0; 28096831982aSBarry Smith ierr = PetscBTMemzero(m,table);CHKERRQ(ierr); 2810e4d965acSSatish Balay 2811e4d965acSSatish Balay /* Extract the indices, assume there can be duplicate entries */ 28124dcbc457SBarry Smith ierr = ISGetIndices(is[i],&idx);CHKERRQ(ierr); 2813b9b97703SBarry Smith ierr = ISGetLocalSize(is[i],&n);CHKERRQ(ierr); 2814e4d965acSSatish Balay 2815dd097bc3SLois Curfman McInnes /* Enter these into the temp arrays. 
I.e., mark table[row], enter row into new index */ 2816e4d965acSSatish Balay for (j=0; j<n; ++j) { 28172205254eSKarl Rupp if (!PetscBTLookupSet(table,idx[j])) nidx[isz++] = idx[j]; 28184dcbc457SBarry Smith } 281906763907SSatish Balay ierr = ISRestoreIndices(is[i],&idx);CHKERRQ(ierr); 28206bf464f9SBarry Smith ierr = ISDestroy(&is[i]);CHKERRQ(ierr); 2821e4d965acSSatish Balay 282204a348a9SBarry Smith k = 0; 282304a348a9SBarry Smith for (j=0; j<ov; j++) { /* for each overlap */ 282404a348a9SBarry Smith n = isz; 282506763907SSatish Balay for (; k<n; k++) { /* do only those rows in nidx[k], which are not done yet */ 2826e4d965acSSatish Balay row = nidx[k]; 2827e4d965acSSatish Balay start = ai[row]; 2828e4d965acSSatish Balay end = ai[row+1]; 282904a348a9SBarry Smith for (l = start; l<end; l++) { 2830efb16452SHong Zhang val = aj[l]; 28312205254eSKarl Rupp if (!PetscBTLookupSet(table,val)) nidx[isz++] = val; 2832e4d965acSSatish Balay } 2833e4d965acSSatish Balay } 2834e4d965acSSatish Balay } 283570b3c8c7SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i));CHKERRQ(ierr); 2836e4d965acSSatish Balay } 283794bacf5dSBarry Smith ierr = PetscBTDestroy(&table);CHKERRQ(ierr); 2838606d414cSSatish Balay ierr = PetscFree(nidx);CHKERRQ(ierr); 28393a40ed3dSBarry Smith PetscFunctionReturn(0); 28404dcbc457SBarry Smith } 284117ab2063SBarry Smith 28420513a670SBarry Smith /* -------------------------------------------------------------- */ 2843dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B) 28440513a670SBarry Smith { 28450513a670SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 28466849ba73SBarry Smith PetscErrorCode ierr; 28473b98c0a2SBarry Smith PetscInt i,nz = 0,m = A->rmap->n,n = A->cmap->n; 28485d0c19d7SBarry Smith const PetscInt *row,*col; 28495d0c19d7SBarry Smith PetscInt *cnew,j,*lens; 285056cd22aeSBarry Smith IS icolp,irowp; 28510298fd71SBarry Smith PetscInt *cwork = NULL; 28520298fd71SBarry Smith PetscScalar *vwork 
= NULL; 28530513a670SBarry Smith 28543a40ed3dSBarry Smith PetscFunctionBegin; 28554c49b128SBarry Smith ierr = ISInvertPermutation(rowp,PETSC_DECIDE,&irowp);CHKERRQ(ierr); 285656cd22aeSBarry Smith ierr = ISGetIndices(irowp,&row);CHKERRQ(ierr); 28574c49b128SBarry Smith ierr = ISInvertPermutation(colp,PETSC_DECIDE,&icolp);CHKERRQ(ierr); 285856cd22aeSBarry Smith ierr = ISGetIndices(icolp,&col);CHKERRQ(ierr); 28590513a670SBarry Smith 28600513a670SBarry Smith /* determine lengths of permuted rows */ 2861854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&lens);CHKERRQ(ierr); 28622205254eSKarl Rupp for (i=0; i<m; i++) lens[row[i]] = a->i[i+1] - a->i[i]; 2863ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 2864f69a0ea3SMatthew Knepley ierr = MatSetSizes(*B,m,n,m,n);CHKERRQ(ierr); 286533d57670SJed Brown ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr); 28667adad957SLisandro Dalcin ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2867ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens);CHKERRQ(ierr); 2868606d414cSSatish Balay ierr = PetscFree(lens);CHKERRQ(ierr); 28690513a670SBarry Smith 2870785e854fSJed Brown ierr = PetscMalloc1(n,&cnew);CHKERRQ(ierr); 28710513a670SBarry Smith for (i=0; i<m; i++) { 287232ec9ce4SBarry Smith ierr = MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 28732205254eSKarl Rupp for (j=0; j<nz; j++) cnew[j] = col[cwork[j]]; 2874cdc0ba36SBarry Smith ierr = MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES);CHKERRQ(ierr); 287532ec9ce4SBarry Smith ierr = MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr); 28760513a670SBarry Smith } 2877606d414cSSatish Balay ierr = PetscFree(cnew);CHKERRQ(ierr); 28782205254eSKarl Rupp 28793c7d62e4SBarry Smith (*B)->assembled = PETSC_FALSE; 28802205254eSKarl Rupp 28819fe5e383SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2882b470e4b4SRichard Tran Mills ierr = 
MatBindToCPU(*B,A->boundtocpu);CHKERRQ(ierr); 28839fe5e383SStefano Zampini #endif 28840513a670SBarry Smith ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 28850513a670SBarry Smith ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 288656cd22aeSBarry Smith ierr = ISRestoreIndices(irowp,&row);CHKERRQ(ierr); 288756cd22aeSBarry Smith ierr = ISRestoreIndices(icolp,&col);CHKERRQ(ierr); 28886bf464f9SBarry Smith ierr = ISDestroy(&irowp);CHKERRQ(ierr); 28896bf464f9SBarry Smith ierr = ISDestroy(&icolp);CHKERRQ(ierr); 28906768869dSprj- if (rowp == colp) { 28916768869dSprj- if (A->symmetric) { 28926768869dSprj- ierr = MatSetOption(*B,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr); 28936768869dSprj- } 28946768869dSprj- if (A->hermitian) { 28956768869dSprj- ierr = MatSetOption(*B,MAT_HERMITIAN,PETSC_TRUE);CHKERRQ(ierr); 28966768869dSprj- } 28976768869dSprj- } 28983a40ed3dSBarry Smith PetscFunctionReturn(0); 28990513a670SBarry Smith } 29000513a670SBarry Smith 2901dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str) 2902cb5b572fSBarry Smith { 2903dfbe8321SBarry Smith PetscErrorCode ierr; 2904cb5b572fSBarry Smith 2905cb5b572fSBarry Smith PetscFunctionBegin; 290633f4a19fSKris Buschelman /* If the two matrices have the same copy implementation, use fast copy. 
*/ 290733f4a19fSKris Buschelman if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) { 2908be6bf707SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 2909be6bf707SBarry Smith Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data; 2910be6bf707SBarry Smith 29114d805d7cSStefano Zampini if (a->i[A->rmap->n] != b->i[B->rmap->n]) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different %D != %D",a->i[A->rmap->n],b->i[B->rmap->n]); 2912580bdb30SBarry Smith ierr = PetscArraycpy(b->a,a->a,a->i[A->rmap->n]);CHKERRQ(ierr); 2913cdc753b6SBarry Smith ierr = PetscObjectStateIncrease((PetscObject)B);CHKERRQ(ierr); 2914cb5b572fSBarry Smith } else { 2915cb5b572fSBarry Smith ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 2916cb5b572fSBarry Smith } 2917cb5b572fSBarry Smith PetscFunctionReturn(0); 2918cb5b572fSBarry Smith } 2919cb5b572fSBarry Smith 29204994cf47SJed Brown PetscErrorCode MatSetUp_SeqAIJ(Mat A) 2921273d9f13SBarry Smith { 2922dfbe8321SBarry Smith PetscErrorCode ierr; 2923273d9f13SBarry Smith 2924273d9f13SBarry Smith PetscFunctionBegin; 2925ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,0);CHKERRQ(ierr); 2926273d9f13SBarry Smith PetscFunctionReturn(0); 2927273d9f13SBarry Smith } 2928273d9f13SBarry Smith 2929f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar *array[]) 29306c0721eeSBarry Smith { 29316c0721eeSBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 29326e111a19SKarl Rupp 29336c0721eeSBarry Smith PetscFunctionBegin; 29346c0721eeSBarry Smith *array = a->a; 29356c0721eeSBarry Smith PetscFunctionReturn(0); 29366c0721eeSBarry Smith } 29376c0721eeSBarry Smith 2938f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar *array[]) 29396c0721eeSBarry Smith { 29406c0721eeSBarry Smith PetscFunctionBegin; 2941f38c1e66SStefano Zampini *array = NULL; 29426c0721eeSBarry Smith PetscFunctionReturn(0); 29436c0721eeSBarry Smith } 
2944273d9f13SBarry Smith 29458229c054SShri Abhyankar /* 29468229c054SShri Abhyankar Computes the number of nonzeros per row needed for preallocation when X and Y 29478229c054SShri Abhyankar have different nonzero structure. 29488229c054SShri Abhyankar */ 2949b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt *xi,const PetscInt *xj,const PetscInt *yi,const PetscInt *yj,PetscInt *nnz) 2950ec7775f6SShri Abhyankar { 2951b264fe52SHong Zhang PetscInt i,j,k,nzx,nzy; 2952ec7775f6SShri Abhyankar 2953ec7775f6SShri Abhyankar PetscFunctionBegin; 2954ec7775f6SShri Abhyankar /* Set the number of nonzeros in the new matrix */ 2955ec7775f6SShri Abhyankar for (i=0; i<m; i++) { 2956b264fe52SHong Zhang const PetscInt *xjj = xj+xi[i],*yjj = yj+yi[i]; 2957b264fe52SHong Zhang nzx = xi[i+1] - xi[i]; 2958b264fe52SHong Zhang nzy = yi[i+1] - yi[i]; 29598af7cee1SJed Brown nnz[i] = 0; 29608af7cee1SJed Brown for (j=0,k=0; j<nzx; j++) { /* Point in X */ 2961b264fe52SHong Zhang for (; k<nzy && yjj[k]<xjj[j]; k++) nnz[i]++; /* Catch up to X */ 2962b264fe52SHong Zhang if (k<nzy && yjj[k]==xjj[j]) k++; /* Skip duplicate */ 29638af7cee1SJed Brown nnz[i]++; 29648af7cee1SJed Brown } 29658af7cee1SJed Brown for (; k<nzy; k++) nnz[i]++; 2966ec7775f6SShri Abhyankar } 2967ec7775f6SShri Abhyankar PetscFunctionReturn(0); 2968ec7775f6SShri Abhyankar } 2969ec7775f6SShri Abhyankar 2970b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt *nnz) 2971b264fe52SHong Zhang { 2972b264fe52SHong Zhang PetscInt m = Y->rmap->N; 2973b264fe52SHong Zhang Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data; 2974b264fe52SHong Zhang Mat_SeqAIJ *y = (Mat_SeqAIJ*)Y->data; 2975b264fe52SHong Zhang PetscErrorCode ierr; 2976b264fe52SHong Zhang 2977b264fe52SHong Zhang PetscFunctionBegin; 2978b264fe52SHong Zhang /* Set the number of nonzeros in the new matrix */ 2979b264fe52SHong Zhang ierr = MatAXPYGetPreallocation_SeqX_private(m,x->i,x->j,y->i,y->j,nnz);CHKERRQ(ierr); 
2980b264fe52SHong Zhang PetscFunctionReturn(0); 2981b264fe52SHong Zhang } 2982b264fe52SHong Zhang 2983f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 2984ac90fabeSBarry Smith { 2985dfbe8321SBarry Smith PetscErrorCode ierr; 2986ac90fabeSBarry Smith Mat_SeqAIJ *x = (Mat_SeqAIJ*)X->data,*y = (Mat_SeqAIJ*)Y->data; 2987c5df96a5SBarry Smith PetscBLASInt one=1,bnz; 2988ac90fabeSBarry Smith 2989ac90fabeSBarry Smith PetscFunctionBegin; 2990c5df96a5SBarry Smith ierr = PetscBLASIntCast(x->nz,&bnz);CHKERRQ(ierr); 2991ac90fabeSBarry Smith if (str == SAME_NONZERO_PATTERN) { 2992f4df32b1SMatthew Knepley PetscScalar alpha = a; 29938b83055fSJed Brown PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,x->a,&one,y->a,&one)); 2994acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr); 2995a3fa217bSJose E. Roman ierr = PetscObjectStateIncrease((PetscObject)Y);CHKERRQ(ierr); 2996e2cf4d64SStefano Zampini /* the MatAXPY_Basic* subroutines calls MatAssembly, so the matrix on the GPU 2997e2cf4d64SStefano Zampini will be updated */ 2998e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 2999c70f7ee4SJunchao Zhang if (Y->offloadmask != PETSC_OFFLOAD_UNALLOCATED) { 3000c70f7ee4SJunchao Zhang Y->offloadmask = PETSC_OFFLOAD_CPU; 3001e2cf4d64SStefano Zampini } 3002e2cf4d64SStefano Zampini #endif 3003ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 3004ab784542SHong Zhang ierr = MatAXPY_Basic(Y,a,X,str);CHKERRQ(ierr); 3005ac90fabeSBarry Smith } else { 30068229c054SShri Abhyankar Mat B; 30078229c054SShri Abhyankar PetscInt *nnz; 3008785e854fSJed Brown ierr = PetscMalloc1(Y->rmap->N,&nnz);CHKERRQ(ierr); 3009ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)Y),&B);CHKERRQ(ierr); 3010bc5a2726SShri Abhyankar ierr = PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name);CHKERRQ(ierr); 30114aa94f47SShri Abhyankar ierr = 
MatSetSizes(B,Y->rmap->n,Y->cmap->n,Y->rmap->N,Y->cmap->N);CHKERRQ(ierr); 301233d57670SJed Brown ierr = MatSetBlockSizesFromMats(B,Y,Y);CHKERRQ(ierr); 3013176df525SBarry Smith ierr = MatSetType(B,(MatType) ((PetscObject)Y)->type_name);CHKERRQ(ierr); 30148229c054SShri Abhyankar ierr = MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz);CHKERRQ(ierr); 3015ecd8bba6SJed Brown ierr = MatSeqAIJSetPreallocation(B,0,nnz);CHKERRQ(ierr); 3016ec7775f6SShri Abhyankar ierr = MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr); 301728be2f97SBarry Smith ierr = MatHeaderReplace(Y,&B);CHKERRQ(ierr); 30188229c054SShri Abhyankar ierr = PetscFree(nnz);CHKERRQ(ierr); 3019ac90fabeSBarry Smith } 3020ac90fabeSBarry Smith PetscFunctionReturn(0); 3021ac90fabeSBarry Smith } 3022ac90fabeSBarry Smith 30237087cfbeSBarry Smith PetscErrorCode MatConjugate_SeqAIJ(Mat mat) 3024354c94deSBarry Smith { 3025354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX) 3026354c94deSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3027354c94deSBarry Smith PetscInt i,nz; 3028354c94deSBarry Smith PetscScalar *a; 3029354c94deSBarry Smith 3030354c94deSBarry Smith PetscFunctionBegin; 3031354c94deSBarry Smith nz = aij->nz; 3032354c94deSBarry Smith a = aij->a; 30332205254eSKarl Rupp for (i=0; i<nz; i++) a[i] = PetscConj(a[i]); 3034e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA) 3035c70f7ee4SJunchao Zhang if (mat->offloadmask != PETSC_OFFLOAD_UNALLOCATED) mat->offloadmask = PETSC_OFFLOAD_CPU; 3036e2cf4d64SStefano Zampini #endif 3037354c94deSBarry Smith #else 3038354c94deSBarry Smith PetscFunctionBegin; 3039354c94deSBarry Smith #endif 3040354c94deSBarry Smith PetscFunctionReturn(0); 3041354c94deSBarry Smith } 3042354c94deSBarry Smith 3043985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3044e34fafa9SBarry Smith { 3045e34fafa9SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3046e34fafa9SBarry Smith PetscErrorCode ierr; 3047d0f46423SBarry Smith 
PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3048e34fafa9SBarry Smith PetscReal atmp; 3049985db425SBarry Smith PetscScalar *x; 3050e34fafa9SBarry Smith MatScalar *aa; 3051e34fafa9SBarry Smith 3052e34fafa9SBarry Smith PetscFunctionBegin; 3053e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3054e34fafa9SBarry Smith aa = a->a; 3055e34fafa9SBarry Smith ai = a->i; 3056e34fafa9SBarry Smith aj = a->j; 3057e34fafa9SBarry Smith 3058985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3059e34fafa9SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3060e34fafa9SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3061e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3062e34fafa9SBarry Smith for (i=0; i<m; i++) { 3063e34fafa9SBarry Smith ncols = ai[1] - ai[0]; ai++; 30649189402eSHong Zhang x[i] = 0.0; 3065e34fafa9SBarry Smith for (j=0; j<ncols; j++) { 3066985db425SBarry Smith atmp = PetscAbsScalar(*aa); 3067985db425SBarry Smith if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3068985db425SBarry Smith aa++; aj++; 3069985db425SBarry Smith } 3070985db425SBarry Smith } 3071985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3072985db425SBarry Smith PetscFunctionReturn(0); 3073985db425SBarry Smith } 3074985db425SBarry Smith 3075985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3076985db425SBarry Smith { 3077985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3078985db425SBarry Smith PetscErrorCode ierr; 3079d0f46423SBarry Smith PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3080985db425SBarry Smith PetscScalar *x; 3081985db425SBarry Smith MatScalar *aa; 3082985db425SBarry Smith 3083985db425SBarry Smith PetscFunctionBegin; 3084e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3085985db425SBarry Smith 
aa = a->a; 3086985db425SBarry Smith ai = a->i; 3087985db425SBarry Smith aj = a->j; 3088985db425SBarry Smith 3089985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3090985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3091985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3092e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3093985db425SBarry Smith for (i=0; i<m; i++) { 3094985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3095d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3096985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3097985db425SBarry Smith } else { /* row is sparse so already KNOW maximum is 0.0 or higher */ 3098985db425SBarry Smith x[i] = 0.0; 3099985db425SBarry Smith if (idx) { 3100985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 3101985db425SBarry Smith for (j=0;j<ncols;j++) { /* find first implicit 0.0 in the row */ 3102985db425SBarry Smith if (aj[j] > j) { 3103985db425SBarry Smith idx[i] = j; 3104985db425SBarry Smith break; 3105985db425SBarry Smith } 3106985db425SBarry Smith } 3107985db425SBarry Smith } 3108985db425SBarry Smith } 3109985db425SBarry Smith for (j=0; j<ncols; j++) { 3110985db425SBarry Smith if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3111985db425SBarry Smith aa++; aj++; 3112985db425SBarry Smith } 3113985db425SBarry Smith } 3114985db425SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3115985db425SBarry Smith PetscFunctionReturn(0); 3116985db425SBarry Smith } 3117985db425SBarry Smith 3118c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3119c87e5d42SMatthew Knepley { 3120c87e5d42SMatthew Knepley Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3121c87e5d42SMatthew Knepley PetscErrorCode ierr; 3122c87e5d42SMatthew Knepley PetscInt i,j,m = A->rmap->n,*ai,*aj,ncols,n; 3123c87e5d42SMatthew Knepley PetscReal atmp; 
3124c87e5d42SMatthew Knepley PetscScalar *x; 3125c87e5d42SMatthew Knepley MatScalar *aa; 3126c87e5d42SMatthew Knepley 3127c87e5d42SMatthew Knepley PetscFunctionBegin; 3128e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3129c87e5d42SMatthew Knepley aa = a->a; 3130c87e5d42SMatthew Knepley ai = a->i; 3131c87e5d42SMatthew Knepley aj = a->j; 3132c87e5d42SMatthew Knepley 3133c87e5d42SMatthew Knepley ierr = VecSet(v,0.0);CHKERRQ(ierr); 3134c87e5d42SMatthew Knepley ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3135c87e5d42SMatthew Knepley ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 313660e0710aSBarry Smith if (n != A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector, %D vs. %D rows", A->rmap->n, n); 3137c87e5d42SMatthew Knepley for (i=0; i<m; i++) { 3138c87e5d42SMatthew Knepley ncols = ai[1] - ai[0]; ai++; 3139289a08f5SMatthew Knepley if (ncols) { 3140289a08f5SMatthew Knepley /* Get first nonzero */ 3141289a08f5SMatthew Knepley for (j = 0; j < ncols; j++) { 3142289a08f5SMatthew Knepley atmp = PetscAbsScalar(aa[j]); 31432205254eSKarl Rupp if (atmp > 1.0e-12) { 31442205254eSKarl Rupp x[i] = atmp; 31452205254eSKarl Rupp if (idx) idx[i] = aj[j]; 31462205254eSKarl Rupp break; 31472205254eSKarl Rupp } 3148289a08f5SMatthew Knepley } 314912431cb0SMatthew G Knepley if (j == ncols) {x[i] = PetscAbsScalar(*aa); if (idx) idx[i] = *aj;} 3150289a08f5SMatthew Knepley } else { 3151289a08f5SMatthew Knepley x[i] = 0.0; if (idx) idx[i] = 0; 3152289a08f5SMatthew Knepley } 3153c87e5d42SMatthew Knepley for (j = 0; j < ncols; j++) { 3154c87e5d42SMatthew Knepley atmp = PetscAbsScalar(*aa); 3155289a08f5SMatthew Knepley if (atmp > 1.0e-12 && PetscAbsScalar(x[i]) > atmp) {x[i] = atmp; if (idx) idx[i] = *aj;} 3156c87e5d42SMatthew Knepley aa++; aj++; 3157c87e5d42SMatthew Knepley } 3158c87e5d42SMatthew Knepley } 3159c87e5d42SMatthew Knepley ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3160c87e5d42SMatthew 
Knepley PetscFunctionReturn(0); 3161c87e5d42SMatthew Knepley } 3162c87e5d42SMatthew Knepley 3163985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[]) 3164985db425SBarry Smith { 3165985db425SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 3166985db425SBarry Smith PetscErrorCode ierr; 3167d9ca1df4SBarry Smith PetscInt i,j,m = A->rmap->n,ncols,n; 3168d9ca1df4SBarry Smith const PetscInt *ai,*aj; 3169985db425SBarry Smith PetscScalar *x; 3170d9ca1df4SBarry Smith const MatScalar *aa; 3171985db425SBarry Smith 3172985db425SBarry Smith PetscFunctionBegin; 3173e32f2f54SBarry Smith if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 3174985db425SBarry Smith aa = a->a; 3175985db425SBarry Smith ai = a->i; 3176985db425SBarry Smith aj = a->j; 3177985db425SBarry Smith 3178985db425SBarry Smith ierr = VecSet(v,0.0);CHKERRQ(ierr); 3179985db425SBarry Smith ierr = VecGetArray(v,&x);CHKERRQ(ierr); 3180985db425SBarry Smith ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr); 3181e32f2f54SBarry Smith if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector"); 3182985db425SBarry Smith for (i=0; i<m; i++) { 3183985db425SBarry Smith ncols = ai[1] - ai[0]; ai++; 3184d0f46423SBarry Smith if (ncols == A->cmap->n) { /* row is dense */ 3185985db425SBarry Smith x[i] = *aa; if (idx) idx[i] = 0; 3186985db425SBarry Smith } else { /* row is sparse so already KNOW minimum is 0.0 or lower */ 3187985db425SBarry Smith x[i] = 0.0; 3188985db425SBarry Smith if (idx) { /* find first implicit 0.0 in the row */ 3189985db425SBarry Smith idx[i] = 0; /* in case ncols is zero */ 3190985db425SBarry Smith for (j=0; j<ncols; j++) { 3191985db425SBarry Smith if (aj[j] > j) { 3192985db425SBarry Smith idx[i] = j; 3193985db425SBarry Smith break; 3194985db425SBarry Smith } 3195985db425SBarry Smith } 3196985db425SBarry Smith } 3197985db425SBarry Smith } 3198985db425SBarry Smith for (j=0; j<ncols; j++) { 3199985db425SBarry 
Smith if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;} 3200985db425SBarry Smith aa++; aj++; 3201e34fafa9SBarry Smith } 3202e34fafa9SBarry Smith } 3203e34fafa9SBarry Smith ierr = VecRestoreArray(v,&x);CHKERRQ(ierr); 3204e34fafa9SBarry Smith PetscFunctionReturn(0); 3205e34fafa9SBarry Smith } 3206bbead8a2SBarry Smith 3207713ccfa9SJed Brown PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar **values) 3208bbead8a2SBarry Smith { 3209bbead8a2SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*) A->data; 3210bbead8a2SBarry Smith PetscErrorCode ierr; 321133d57670SJed Brown PetscInt i,bs = PetscAbs(A->rmap->bs),mbs = A->rmap->n/bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j; 3212bbead8a2SBarry Smith MatScalar *diag,work[25],*v_work; 32130da83c2eSBarry Smith const PetscReal shift = 0.0; 32141a9391e3SHong Zhang PetscBool allowzeropivot,zeropivotdetected=PETSC_FALSE; 3215bbead8a2SBarry Smith 3216bbead8a2SBarry Smith PetscFunctionBegin; 3217a455e926SHong Zhang allowzeropivot = PetscNot(A->erroriffailure); 32184a0d0026SBarry Smith if (a->ibdiagvalid) { 32194a0d0026SBarry Smith if (values) *values = a->ibdiag; 32204a0d0026SBarry Smith PetscFunctionReturn(0); 32214a0d0026SBarry Smith } 3222bbead8a2SBarry Smith ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr); 3223bbead8a2SBarry Smith if (!a->ibdiag) { 3224785e854fSJed Brown ierr = PetscMalloc1(bs2*mbs,&a->ibdiag);CHKERRQ(ierr); 32253bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,bs2*mbs*sizeof(PetscScalar));CHKERRQ(ierr); 3226bbead8a2SBarry Smith } 3227bbead8a2SBarry Smith diag = a->ibdiag; 3228bbead8a2SBarry Smith if (values) *values = a->ibdiag; 3229bbead8a2SBarry Smith /* factor and invert each block */ 3230bbead8a2SBarry Smith switch (bs) { 3231bbead8a2SBarry Smith case 1: 3232bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3233bbead8a2SBarry Smith ierr = MatGetValues(A,1,&i,1,&i,diag+i);CHKERRQ(ierr); 3234ec1892c8SHong Zhang if (PetscAbsScalar(diag[i] + shift) < 
PETSC_MACHINE_EPSILON) { 3235ec1892c8SHong Zhang if (allowzeropivot) { 32367b6c816cSBarry Smith A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 32377b6c816cSBarry Smith A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]); 32387b6c816cSBarry Smith A->factorerror_zeropivot_row = i; 32397b6c816cSBarry Smith ierr = PetscInfo3(A,"Zero pivot, row %D pivot %g tolerance %g\n",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON);CHKERRQ(ierr); 32407b6c816cSBarry Smith } else SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D pivot %g tolerance %g",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON); 3241ec1892c8SHong Zhang } 3242bbead8a2SBarry Smith diag[i] = (PetscScalar)1.0 / (diag[i] + shift); 3243bbead8a2SBarry Smith } 3244bbead8a2SBarry Smith break; 3245bbead8a2SBarry Smith case 2: 3246bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3247bbead8a2SBarry Smith ij[0] = 2*i; ij[1] = 2*i + 1; 3248bbead8a2SBarry Smith ierr = MatGetValues(A,2,ij,2,ij,diag);CHKERRQ(ierr); 3249a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32507b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 325196b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr); 3252bbead8a2SBarry Smith diag += 4; 3253bbead8a2SBarry Smith } 3254bbead8a2SBarry Smith break; 3255bbead8a2SBarry Smith case 3: 3256bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3257bbead8a2SBarry Smith ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2; 3258bbead8a2SBarry Smith ierr = MatGetValues(A,3,ij,3,ij,diag);CHKERRQ(ierr); 3259a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32607b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 326196b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr); 3262bbead8a2SBarry Smith diag += 9; 
3263bbead8a2SBarry Smith } 3264bbead8a2SBarry Smith break; 3265bbead8a2SBarry Smith case 4: 3266bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3267bbead8a2SBarry Smith ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3; 3268bbead8a2SBarry Smith ierr = MatGetValues(A,4,ij,4,ij,diag);CHKERRQ(ierr); 3269a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32707b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 327196b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr); 3272bbead8a2SBarry Smith diag += 16; 3273bbead8a2SBarry Smith } 3274bbead8a2SBarry Smith break; 3275bbead8a2SBarry Smith case 5: 3276bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3277bbead8a2SBarry Smith ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4; 3278bbead8a2SBarry Smith ierr = MatGetValues(A,5,ij,5,ij,diag);CHKERRQ(ierr); 3279a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32807b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 328196b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr); 3282bbead8a2SBarry Smith diag += 25; 3283bbead8a2SBarry Smith } 3284bbead8a2SBarry Smith break; 3285bbead8a2SBarry Smith case 6: 3286bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3287bbead8a2SBarry Smith ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5; 3288bbead8a2SBarry Smith ierr = MatGetValues(A,6,ij,6,ij,diag);CHKERRQ(ierr); 3289a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 32907b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 329196b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr); 
3292bbead8a2SBarry Smith diag += 36; 3293bbead8a2SBarry Smith } 3294bbead8a2SBarry Smith break; 3295bbead8a2SBarry Smith case 7: 3296bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3297bbead8a2SBarry Smith ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6; 3298bbead8a2SBarry Smith ierr = MatGetValues(A,7,ij,7,ij,diag);CHKERRQ(ierr); 3299a455e926SHong Zhang ierr = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 33007b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 330196b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr); 3302bbead8a2SBarry Smith diag += 49; 3303bbead8a2SBarry Smith } 3304bbead8a2SBarry Smith break; 3305bbead8a2SBarry Smith default: 3306dcca6d9dSJed Brown ierr = PetscMalloc3(bs,&v_work,bs,&v_pivots,bs,&IJ);CHKERRQ(ierr); 3307bbead8a2SBarry Smith for (i=0; i<mbs; i++) { 3308bbead8a2SBarry Smith for (j=0; j<bs; j++) { 3309bbead8a2SBarry Smith IJ[j] = bs*i + j; 3310bbead8a2SBarry Smith } 3311bbead8a2SBarry Smith ierr = MatGetValues(A,bs,IJ,bs,IJ,diag);CHKERRQ(ierr); 33125f8bbccaSHong Zhang ierr = PetscKernel_A_gets_inverse_A(bs,diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr); 33137b6c816cSBarry Smith if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT; 331496b95a6bSBarry Smith ierr = PetscKernel_A_gets_transpose_A_N(diag,bs);CHKERRQ(ierr); 3315bbead8a2SBarry Smith diag += bs2; 3316bbead8a2SBarry Smith } 3317bbead8a2SBarry Smith ierr = PetscFree3(v_work,v_pivots,IJ);CHKERRQ(ierr); 3318bbead8a2SBarry Smith } 3319bbead8a2SBarry Smith a->ibdiagvalid = PETSC_TRUE; 3320bbead8a2SBarry Smith PetscFunctionReturn(0); 3321bbead8a2SBarry Smith } 3322bbead8a2SBarry Smith 332373a71a0fSBarry Smith static PetscErrorCode MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx) 332473a71a0fSBarry Smith { 332573a71a0fSBarry Smith PetscErrorCode ierr; 
332673a71a0fSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 332773a71a0fSBarry Smith PetscScalar a; 332873a71a0fSBarry Smith PetscInt m,n,i,j,col; 332973a71a0fSBarry Smith 333073a71a0fSBarry Smith PetscFunctionBegin; 333173a71a0fSBarry Smith if (!x->assembled) { 333273a71a0fSBarry Smith ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 333373a71a0fSBarry Smith for (i=0; i<m; i++) { 333473a71a0fSBarry Smith for (j=0; j<aij->imax[i]; j++) { 333573a71a0fSBarry Smith ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr); 333673a71a0fSBarry Smith col = (PetscInt)(n*PetscRealPart(a)); 333773a71a0fSBarry Smith ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr); 333873a71a0fSBarry Smith } 333973a71a0fSBarry Smith } 3340e2ce353bSJunchao Zhang } else { 3341e2ce353bSJunchao Zhang for (i=0; i<aij->nz; i++) {ierr = PetscRandomGetValue(rctx,aij->a+i);CHKERRQ(ierr);} 3342e2ce353bSJunchao Zhang } 334373a71a0fSBarry Smith ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 334473a71a0fSBarry Smith ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 334573a71a0fSBarry Smith PetscFunctionReturn(0); 334673a71a0fSBarry Smith } 334773a71a0fSBarry Smith 3348679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */ 3349679944adSJunchao Zhang PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx) 3350679944adSJunchao Zhang { 3351679944adSJunchao Zhang PetscErrorCode ierr; 3352679944adSJunchao Zhang Mat_SeqAIJ *aij = (Mat_SeqAIJ*)x->data; 3353679944adSJunchao Zhang PetscScalar a; 3354679944adSJunchao Zhang PetscInt m,n,i,j,col,nskip; 3355679944adSJunchao Zhang 3356679944adSJunchao Zhang PetscFunctionBegin; 3357679944adSJunchao Zhang nskip = high - low; 3358679944adSJunchao Zhang ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr); 3359679944adSJunchao Zhang n -= nskip; /* shrink number of columns where nonzeros can be set */ 3360679944adSJunchao Zhang for (i=0; i<m; i++) { 
3361679944adSJunchao Zhang for (j=0; j<aij->imax[i]; j++) { 3362679944adSJunchao Zhang ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr); 3363679944adSJunchao Zhang col = (PetscInt)(n*PetscRealPart(a)); 3364679944adSJunchao Zhang if (col >= low) col += nskip; /* shift col rightward to skip the hole */ 3365679944adSJunchao Zhang ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr); 3366679944adSJunchao Zhang } 3367e2ce353bSJunchao Zhang } 3368679944adSJunchao Zhang ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3369679944adSJunchao Zhang ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3370679944adSJunchao Zhang PetscFunctionReturn(0); 3371679944adSJunchao Zhang } 3372679944adSJunchao Zhang 3373679944adSJunchao Zhang 3374682d7d0cSBarry Smith /* -------------------------------------------------------------------*/ 33750a6ffc59SBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqAIJ, 3376cb5b572fSBarry Smith MatGetRow_SeqAIJ, 3377cb5b572fSBarry Smith MatRestoreRow_SeqAIJ, 3378cb5b572fSBarry Smith MatMult_SeqAIJ, 337997304618SKris Buschelman /* 4*/ MatMultAdd_SeqAIJ, 33807c922b88SBarry Smith MatMultTranspose_SeqAIJ, 33817c922b88SBarry Smith MatMultTransposeAdd_SeqAIJ, 3382db4efbfdSBarry Smith 0, 3383db4efbfdSBarry Smith 0, 3384db4efbfdSBarry Smith 0, 3385db4efbfdSBarry Smith /* 10*/ 0, 3386cb5b572fSBarry Smith MatLUFactor_SeqAIJ, 3387cb5b572fSBarry Smith 0, 338841f059aeSBarry Smith MatSOR_SeqAIJ, 338991e9d3e2SHong Zhang MatTranspose_SeqAIJ, 339097304618SKris Buschelman /*1 5*/ MatGetInfo_SeqAIJ, 3391cb5b572fSBarry Smith MatEqual_SeqAIJ, 3392cb5b572fSBarry Smith MatGetDiagonal_SeqAIJ, 3393cb5b572fSBarry Smith MatDiagonalScale_SeqAIJ, 3394cb5b572fSBarry Smith MatNorm_SeqAIJ, 339597304618SKris Buschelman /* 20*/ 0, 3396cb5b572fSBarry Smith MatAssemblyEnd_SeqAIJ, 3397cb5b572fSBarry Smith MatSetOption_SeqAIJ, 3398cb5b572fSBarry Smith MatZeroEntries_SeqAIJ, 3399d519adbfSMatthew Knepley /* 24*/ MatZeroRows_SeqAIJ, 
3400db4efbfdSBarry Smith 0, 3401db4efbfdSBarry Smith 0, 3402db4efbfdSBarry Smith 0, 3403db4efbfdSBarry Smith 0, 34044994cf47SJed Brown /* 29*/ MatSetUp_SeqAIJ, 3405db4efbfdSBarry Smith 0, 3406db4efbfdSBarry Smith 0, 34078c778c55SBarry Smith 0, 34088c778c55SBarry Smith 0, 3409d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqAIJ, 3410cb5b572fSBarry Smith 0, 3411cb5b572fSBarry Smith 0, 3412cb5b572fSBarry Smith MatILUFactor_SeqAIJ, 3413cb5b572fSBarry Smith 0, 3414d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqAIJ, 34157dae84e0SHong Zhang MatCreateSubMatrices_SeqAIJ, 3416cb5b572fSBarry Smith MatIncreaseOverlap_SeqAIJ, 3417cb5b572fSBarry Smith MatGetValues_SeqAIJ, 3418cb5b572fSBarry Smith MatCopy_SeqAIJ, 3419d519adbfSMatthew Knepley /* 44*/ MatGetRowMax_SeqAIJ, 3420cb5b572fSBarry Smith MatScale_SeqAIJ, 34217d68702bSBarry Smith MatShift_SeqAIJ, 342279299369SBarry Smith MatDiagonalSet_SeqAIJ, 34236e169961SBarry Smith MatZeroRowsColumns_SeqAIJ, 342473a71a0fSBarry Smith /* 49*/ MatSetRandom_SeqAIJ, 34253b2fbd54SBarry Smith MatGetRowIJ_SeqAIJ, 34263b2fbd54SBarry Smith MatRestoreRowIJ_SeqAIJ, 34273b2fbd54SBarry Smith MatGetColumnIJ_SeqAIJ, 3428a93ec695SBarry Smith MatRestoreColumnIJ_SeqAIJ, 342993dfae19SHong Zhang /* 54*/ MatFDColoringCreate_SeqXAIJ, 3430b9617806SBarry Smith 0, 34310513a670SBarry Smith 0, 3432cda55fadSBarry Smith MatPermute_SeqAIJ, 3433cda55fadSBarry Smith 0, 3434d519adbfSMatthew Knepley /* 59*/ 0, 3435b9b97703SBarry Smith MatDestroy_SeqAIJ, 3436b9b97703SBarry Smith MatView_SeqAIJ, 3437357abbc8SBarry Smith 0, 34384222ddf1SHong Zhang 0, 34394222ddf1SHong Zhang /* 64*/ 0, 3440321b30b9SSatish Balay MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ, 3441ee4f033dSBarry Smith 0, 3442ee4f033dSBarry Smith 0, 3443ee4f033dSBarry Smith 0, 3444d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqAIJ, 3445c87e5d42SMatthew Knepley MatGetRowMinAbs_SeqAIJ, 3446ee4f033dSBarry Smith 0, 3447dcf5cc72SBarry Smith 0, 34482c93a97aSBarry Smith 0, 34492c93a97aSBarry Smith /* 74*/ 0, 
34503acb8795SBarry Smith MatFDColoringApply_AIJ, 345197304618SKris Buschelman 0, 345297304618SKris Buschelman 0, 345397304618SKris Buschelman 0, 34546ce1633cSBarry Smith /* 79*/ MatFindZeroDiagonals_SeqAIJ, 345597304618SKris Buschelman 0, 345697304618SKris Buschelman 0, 345797304618SKris Buschelman 0, 3458bc011b1eSHong Zhang MatLoad_SeqAIJ, 3459d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqAIJ, 34601cbb95d3SBarry Smith MatIsHermitian_SeqAIJ, 34616284ec50SHong Zhang 0, 34626284ec50SHong Zhang 0, 3463bc011b1eSHong Zhang 0, 34644222ddf1SHong Zhang /* 89*/ 0, 34654222ddf1SHong Zhang 0, 346626be0446SHong Zhang MatMatMultNumeric_SeqAIJ_SeqAIJ, 34674222ddf1SHong Zhang 0, 34684222ddf1SHong Zhang 0, 34698fa4b5a6SHong Zhang /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy, 34704222ddf1SHong Zhang 0, 34714222ddf1SHong Zhang 0, 34726fc122caSHong Zhang MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ, 34732121bac1SHong Zhang 0, 34744222ddf1SHong Zhang /* 99*/ MatProductSetFromOptions_SeqAIJ, 3475609c6c4dSKris Buschelman 0, 3476609c6c4dSKris Buschelman 0, 347787d4246cSBarry Smith MatConjugate_SeqAIJ, 347887d4246cSBarry Smith 0, 3479d519adbfSMatthew Knepley /*104*/ MatSetValuesRow_SeqAIJ, 348099cafbc1SBarry Smith MatRealPart_SeqAIJ, 3481f5edf698SHong Zhang MatImaginaryPart_SeqAIJ, 3482f5edf698SHong Zhang 0, 34832bebee5dSHong Zhang 0, 3484cbd44569SHong Zhang /*109*/ MatMatSolve_SeqAIJ, 3485985db425SBarry Smith 0, 34862af78befSBarry Smith MatGetRowMin_SeqAIJ, 34872af78befSBarry Smith 0, 3488599ef60dSHong Zhang MatMissingDiagonal_SeqAIJ, 3489d519adbfSMatthew Knepley /*114*/ 0, 3490599ef60dSHong Zhang 0, 34913c2a7987SHong Zhang 0, 3492fe97e370SBarry Smith 0, 3493fbdbba38SShri Abhyankar 0, 3494fbdbba38SShri Abhyankar /*119*/ 0, 3495fbdbba38SShri Abhyankar 0, 3496fbdbba38SShri Abhyankar 0, 349782d44351SHong Zhang 0, 3498b3a44c85SBarry Smith MatGetMultiProcBlock_SeqAIJ, 34990716a85fSBarry Smith /*124*/ MatFindNonzeroRows_SeqAIJ, 3500bbead8a2SBarry Smith MatGetColumnNorms_SeqAIJ, 
350137868618SMatthew G Knepley MatInvertBlockDiagonal_SeqAIJ, 35020da83c2eSBarry Smith MatInvertVariableBlockDiagonal_SeqAIJ, 350337868618SMatthew G Knepley 0, 35045df89d91SHong Zhang /*129*/ 0, 35054222ddf1SHong Zhang 0, 35064222ddf1SHong Zhang 0, 350775648e8dSHong Zhang MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ, 3508b9af6bddSHong Zhang MatTransposeColoringCreate_SeqAIJ, 3509b9af6bddSHong Zhang /*134*/ MatTransColoringApplySpToDen_SeqAIJ, 35102b8ad9a3SHong Zhang MatTransColoringApplyDenToSp_SeqAIJ, 35114222ddf1SHong Zhang 0, 35124222ddf1SHong Zhang 0, 35133964eb88SJed Brown MatRARtNumeric_SeqAIJ_SeqAIJ, 35143964eb88SJed Brown /*139*/0, 3515f9426fe0SMark Adams 0, 35161919a2e2SJed Brown 0, 35173a062f41SBarry Smith MatFDColoringSetUp_SeqXAIJ, 35189c8f2541SHong Zhang MatFindOffBlockDiagonalEntries_SeqAIJ, 35194222ddf1SHong Zhang MatCreateMPIMatConcatenateSeqMat_SeqAIJ, 35204222ddf1SHong Zhang /*145*/MatDestroySubMatrices_SeqAIJ, 35214222ddf1SHong Zhang 0, 35224222ddf1SHong Zhang 0 35239e29f15eSvictorle }; 352417ab2063SBarry Smith 35257087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices) 3526bef8e0ddSBarry Smith { 3527bef8e0ddSBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 352897f1f81fSBarry Smith PetscInt i,nz,n; 3529bef8e0ddSBarry Smith 3530bef8e0ddSBarry Smith PetscFunctionBegin; 3531bef8e0ddSBarry Smith nz = aij->maxnz; 3532d0f46423SBarry Smith n = mat->rmap->n; 3533bef8e0ddSBarry Smith for (i=0; i<nz; i++) { 3534bef8e0ddSBarry Smith aij->j[i] = indices[i]; 3535bef8e0ddSBarry Smith } 3536bef8e0ddSBarry Smith aij->nz = nz; 3537bef8e0ddSBarry Smith for (i=0; i<n; i++) { 3538bef8e0ddSBarry Smith aij->ilen[i] = aij->imax[i]; 3539bef8e0ddSBarry Smith } 3540bef8e0ddSBarry Smith PetscFunctionReturn(0); 3541bef8e0ddSBarry Smith } 3542bef8e0ddSBarry Smith 3543a3bb6f32SFande Kong /* 3544e8b528d9SFande Kong * When a sparse matrix has many zero columns, we should compact them out to save the space 3545a3bb6f32SFande Kong * This 
happens in MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable() 3546a3bb6f32SFande Kong * */ 3547a3bb6f32SFande Kong PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping) 3548a3bb6f32SFande Kong { 3549a3bb6f32SFande Kong Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 3550a3bb6f32SFande Kong PetscTable gid1_lid1; 3551a3bb6f32SFande Kong PetscTablePosition tpos; 3552a3bb6f32SFande Kong PetscInt gid,lid,i,j,ncols,ec; 3553a3bb6f32SFande Kong PetscInt *garray; 3554a3bb6f32SFande Kong PetscErrorCode ierr; 3555a3bb6f32SFande Kong 3556a3bb6f32SFande Kong PetscFunctionBegin; 3557a3bb6f32SFande Kong PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3558a3bb6f32SFande Kong PetscValidPointer(mapping,2); 3559a3bb6f32SFande Kong /* use a table */ 3560a3bb6f32SFande Kong ierr = PetscTableCreate(mat->rmap->n,mat->cmap->N+1,&gid1_lid1);CHKERRQ(ierr); 3561a3bb6f32SFande Kong ec = 0; 3562a3bb6f32SFande Kong for (i=0; i<mat->rmap->n; i++) { 3563a3bb6f32SFande Kong ncols = aij->i[i+1] - aij->i[i]; 3564a3bb6f32SFande Kong for (j=0; j<ncols; j++) { 3565a3bb6f32SFande Kong PetscInt data,gid1 = aij->j[aij->i[i] + j] + 1; 3566a3bb6f32SFande Kong ierr = PetscTableFind(gid1_lid1,gid1,&data);CHKERRQ(ierr); 3567a3bb6f32SFande Kong if (!data) { 3568a3bb6f32SFande Kong /* one based table */ 3569a3bb6f32SFande Kong ierr = PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES);CHKERRQ(ierr); 3570a3bb6f32SFande Kong } 3571a3bb6f32SFande Kong } 3572a3bb6f32SFande Kong } 3573a3bb6f32SFande Kong /* form array of columns we need */ 3574a3bb6f32SFande Kong ierr = PetscMalloc1(ec+1,&garray);CHKERRQ(ierr); 3575a3bb6f32SFande Kong ierr = PetscTableGetHeadPosition(gid1_lid1,&tpos);CHKERRQ(ierr); 3576a3bb6f32SFande Kong while (tpos) { 3577a3bb6f32SFande Kong ierr = PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid);CHKERRQ(ierr); 3578a3bb6f32SFande Kong gid--; 3579a3bb6f32SFande Kong lid--; 3580a3bb6f32SFande Kong garray[lid] = gid; 3581a3bb6f32SFande Kong } 3582a3bb6f32SFande Kong ierr = 
PetscSortInt(ec,garray);CHKERRQ(ierr); /* sort, and rebuild */ 3583a3bb6f32SFande Kong ierr = PetscTableRemoveAll(gid1_lid1);CHKERRQ(ierr); 3584a3bb6f32SFande Kong for (i=0; i<ec; i++) { 3585a3bb6f32SFande Kong ierr = PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES);CHKERRQ(ierr); 3586a3bb6f32SFande Kong } 3587a3bb6f32SFande Kong /* compact out the extra columns in B */ 3588a3bb6f32SFande Kong for (i=0; i<mat->rmap->n; i++) { 3589a3bb6f32SFande Kong ncols = aij->i[i+1] - aij->i[i]; 3590a3bb6f32SFande Kong for (j=0; j<ncols; j++) { 3591a3bb6f32SFande Kong PetscInt gid1 = aij->j[aij->i[i] + j] + 1; 3592a3bb6f32SFande Kong ierr = PetscTableFind(gid1_lid1,gid1,&lid);CHKERRQ(ierr); 3593a3bb6f32SFande Kong lid--; 3594a3bb6f32SFande Kong aij->j[aij->i[i] + j] = lid; 3595a3bb6f32SFande Kong } 3596a3bb6f32SFande Kong } 3597ca5434daSLawrence Mitchell ierr = PetscLayoutDestroy(&mat->cmap);CHKERRQ(ierr); 3598ca5434daSLawrence Mitchell ierr = PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat),ec,ec,1,&mat->cmap);CHKERRQ(ierr); 3599a3bb6f32SFande Kong ierr = PetscTableDestroy(&gid1_lid1);CHKERRQ(ierr); 3600a3bb6f32SFande Kong ierr = ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,mat->cmap->bs,mat->cmap->n,garray,PETSC_OWN_POINTER,mapping);CHKERRQ(ierr); 3601a3bb6f32SFande Kong ierr = ISLocalToGlobalMappingSetType(*mapping,ISLOCALTOGLOBALMAPPINGHASH);CHKERRQ(ierr); 3602a3bb6f32SFande Kong PetscFunctionReturn(0); 3603a3bb6f32SFande Kong } 3604a3bb6f32SFande Kong 3605bef8e0ddSBarry Smith /*@ 3606bef8e0ddSBarry Smith MatSeqAIJSetColumnIndices - Set the column indices for all the rows 3607bef8e0ddSBarry Smith in the matrix. 
3608bef8e0ddSBarry Smith 3609bef8e0ddSBarry Smith Input Parameters: 3610bef8e0ddSBarry Smith + mat - the SeqAIJ matrix 3611bef8e0ddSBarry Smith - indices - the column indices 3612bef8e0ddSBarry Smith 361315091d37SBarry Smith Level: advanced 361415091d37SBarry Smith 3615bef8e0ddSBarry Smith Notes: 3616bef8e0ddSBarry Smith This can be called if you have precomputed the nonzero structure of the 3617bef8e0ddSBarry Smith matrix and want to provide it to the matrix object to improve the performance 3618bef8e0ddSBarry Smith of the MatSetValues() operation. 3619bef8e0ddSBarry Smith 3620bef8e0ddSBarry Smith You MUST have set the correct numbers of nonzeros per row in the call to 3621d1be2dadSMatthew Knepley MatCreateSeqAIJ(), and the columns indices MUST be sorted. 3622bef8e0ddSBarry Smith 3623bef8e0ddSBarry Smith MUST be called before any calls to MatSetValues(); 3624bef8e0ddSBarry Smith 3625b9617806SBarry Smith The indices should start with zero, not one. 3626b9617806SBarry Smith 3627bef8e0ddSBarry Smith @*/ 36287087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices) 3629bef8e0ddSBarry Smith { 36304ac538c5SBarry Smith PetscErrorCode ierr; 3631bef8e0ddSBarry Smith 3632bef8e0ddSBarry Smith PetscFunctionBegin; 36330700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 36344482741eSBarry Smith PetscValidPointer(indices,2); 36354ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices));CHKERRQ(ierr); 3636bef8e0ddSBarry Smith PetscFunctionReturn(0); 3637bef8e0ddSBarry Smith } 3638bef8e0ddSBarry Smith 3639be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/ 3640be6bf707SBarry Smith 36417087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqAIJ(Mat mat) 3642be6bf707SBarry Smith { 3643be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 36446849ba73SBarry Smith PetscErrorCode ierr; 3645d0f46423SBarry Smith size_t nz = 
aij->i[mat->rmap->n]; 3646be6bf707SBarry Smith 3647be6bf707SBarry Smith PetscFunctionBegin; 3648169f6850SBarry Smith if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3649be6bf707SBarry Smith 3650be6bf707SBarry Smith /* allocate space for values if not already there */ 3651be6bf707SBarry Smith if (!aij->saved_values) { 3652854ce69bSBarry Smith ierr = PetscMalloc1(nz+1,&aij->saved_values);CHKERRQ(ierr); 36533bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)mat,(nz+1)*sizeof(PetscScalar));CHKERRQ(ierr); 3654be6bf707SBarry Smith } 3655be6bf707SBarry Smith 3656be6bf707SBarry Smith /* copy values over */ 3657580bdb30SBarry Smith ierr = PetscArraycpy(aij->saved_values,aij->a,nz);CHKERRQ(ierr); 3658be6bf707SBarry Smith PetscFunctionReturn(0); 3659be6bf707SBarry Smith } 3660be6bf707SBarry Smith 3661be6bf707SBarry Smith /*@ 3662be6bf707SBarry Smith MatStoreValues - Stashes a copy of the matrix values; this allows, for 3663be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3664be6bf707SBarry Smith nonlinear portion. 3665be6bf707SBarry Smith 3666be6bf707SBarry Smith Collect on Mat 3667be6bf707SBarry Smith 3668be6bf707SBarry Smith Input Parameters: 36690e609b76SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3670be6bf707SBarry Smith 367115091d37SBarry Smith Level: advanced 367215091d37SBarry Smith 3673be6bf707SBarry Smith Common Usage, with SNESSolve(): 3674be6bf707SBarry Smith $ Create Jacobian matrix 3675be6bf707SBarry Smith $ Set linear terms into matrix 3676be6bf707SBarry Smith $ Apply boundary conditions to matrix, at this time matrix must have 3677be6bf707SBarry Smith $ final nonzero structure (i.e. 
setting the nonlinear terms and applying
$      boundary conditions again will not change the nonzero structure)
$    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
$    ierr = MatStoreValues(mat);
$    Call SNESSetJacobian() with matrix
$    In your Jacobian routine
$      ierr = MatRetrieveValues(mat);
$      Set nonlinear terms in matrix

  Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself:
$    // build linear portion of Jacobian
$    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
$    ierr = MatStoreValues(mat);
$    loop over nonlinear iterations
$       ierr = MatRetrieveValues(mat);
$       // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
$       // call MatAssemblyBegin/End() on matrix
$       Solve linear system with Jacobian
$    endloop

  Notes:
    Matrix must already be assembled before calling this routine.
    Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before
    calling this routine.

    When this is called multiple times it overwrites the previous set of stored values
    and does not allocate additional space.
37040c468ba9SBarry Smith 3705be6bf707SBarry Smith .seealso: MatRetrieveValues() 3706be6bf707SBarry Smith 3707be6bf707SBarry Smith @*/ 37087087cfbeSBarry Smith PetscErrorCode MatStoreValues(Mat mat) 3709be6bf707SBarry Smith { 37104ac538c5SBarry Smith PetscErrorCode ierr; 3711be6bf707SBarry Smith 3712be6bf707SBarry Smith PetscFunctionBegin; 37130700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3714e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3715e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 37164ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat));CHKERRQ(ierr); 3717be6bf707SBarry Smith PetscFunctionReturn(0); 3718be6bf707SBarry Smith } 3719be6bf707SBarry Smith 37207087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat) 3721be6bf707SBarry Smith { 3722be6bf707SBarry Smith Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data; 37236849ba73SBarry Smith PetscErrorCode ierr; 3724d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->n]; 3725be6bf707SBarry Smith 3726be6bf707SBarry Smith PetscFunctionBegin; 3727169f6850SBarry Smith if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 3728f23aa3ddSBarry Smith if (!aij->saved_values) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 3729be6bf707SBarry Smith /* copy values over */ 3730580bdb30SBarry Smith ierr = PetscArraycpy(aij->a,aij->saved_values,nz);CHKERRQ(ierr); 3731be6bf707SBarry Smith PetscFunctionReturn(0); 3732be6bf707SBarry Smith } 3733be6bf707SBarry Smith 3734be6bf707SBarry Smith /*@ 3735be6bf707SBarry Smith MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for 3736be6bf707SBarry Smith example, reuse of the linear part of a Jacobian, while recomputing the 3737be6bf707SBarry Smith nonlinear portion. 
3738be6bf707SBarry Smith 3739be6bf707SBarry Smith Collect on Mat 3740be6bf707SBarry Smith 3741be6bf707SBarry Smith Input Parameters: 3742386f7cf9SBarry Smith . mat - the matrix (currently only AIJ matrices support this option) 3743be6bf707SBarry Smith 374415091d37SBarry Smith Level: advanced 374515091d37SBarry Smith 3746be6bf707SBarry Smith .seealso: MatStoreValues() 3747be6bf707SBarry Smith 3748be6bf707SBarry Smith @*/ 37497087cfbeSBarry Smith PetscErrorCode MatRetrieveValues(Mat mat) 3750be6bf707SBarry Smith { 37514ac538c5SBarry Smith PetscErrorCode ierr; 3752be6bf707SBarry Smith 3753be6bf707SBarry Smith PetscFunctionBegin; 37540700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 3755e32f2f54SBarry Smith if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix"); 3756e32f2f54SBarry Smith if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix"); 37574ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat));CHKERRQ(ierr); 3758be6bf707SBarry Smith PetscFunctionReturn(0); 3759be6bf707SBarry Smith } 3760be6bf707SBarry Smith 3761f83d6046SBarry Smith 3762be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/ 376317ab2063SBarry Smith /*@C 3764682d7d0cSBarry Smith MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format 37650d15e28bSLois Curfman McInnes (the default parallel PETSc format). For good matrix assembly performance 37666e62573dSLois Curfman McInnes the user should preallocate the matrix storage by setting the parameter nz 376751c19458SBarry Smith (or the array nnz). By setting these parameters accurately, performance 37682bd5e0b2SLois Curfman McInnes during matrix assembly can be increased by more than a factor of 50. 
376917ab2063SBarry Smith 3770d083f849SBarry Smith Collective 3771db81eaa0SLois Curfman McInnes 377217ab2063SBarry Smith Input Parameters: 3773db81eaa0SLois Curfman McInnes + comm - MPI communicator, set to PETSC_COMM_SELF 377417ab2063SBarry Smith . m - number of rows 377517ab2063SBarry Smith . n - number of columns 377617ab2063SBarry Smith . nz - number of nonzeros per row (same for all rows) 377751c19458SBarry Smith - nnz - array containing the number of nonzeros in the various rows 37780298fd71SBarry Smith (possibly different for each row) or NULL 377917ab2063SBarry Smith 378017ab2063SBarry Smith Output Parameter: 3781416022c9SBarry Smith . A - the matrix 378217ab2063SBarry Smith 3783175b88e8SBarry Smith It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(), 3784f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 3785175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 3786175b88e8SBarry Smith 3787b259b22eSLois Curfman McInnes Notes: 378849a6f317SBarry Smith If nnz is given then nz is ignored 378949a6f317SBarry Smith 379017ab2063SBarry Smith The AIJ format (also called the Yale sparse matrix format or 379117ab2063SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 37920002213bSLois Curfman McInnes storage. That is, the stored row and column indices can begin at 379344cd7ae7SLois Curfman McInnes either one (as in Fortran) or zero. See the users' manual for details. 379417ab2063SBarry Smith 379517ab2063SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 37960298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 37973d323bbdSBarry Smith allocation. For large problems you MUST preallocate memory or you 37986da5968aSLois Curfman McInnes will get TERRIBLE performance, see the users' manual chapter on matrices. 
379917ab2063SBarry Smith 3800682d7d0cSBarry Smith By default, this format uses inodes (identical nodes) when possible, to 38014fca80b9SLois Curfman McInnes improve numerical efficiency of matrix-vector products and solves. We 3802682d7d0cSBarry Smith search for consecutive rows with the same nonzero structure, thereby 38036c7ebb05SLois Curfman McInnes reusing matrix information to achieve increased efficiency. 38046c7ebb05SLois Curfman McInnes 38056c7ebb05SLois Curfman McInnes Options Database Keys: 3806698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 38079db58ca8SBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 380817ab2063SBarry Smith 3809027ccd11SLois Curfman McInnes Level: intermediate 3810027ccd11SLois Curfman McInnes 381169b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays() 381236db0b34SBarry Smith 381317ab2063SBarry Smith @*/ 38147087cfbeSBarry Smith PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 381517ab2063SBarry Smith { 3816dfbe8321SBarry Smith PetscErrorCode ierr; 38176945ee14SBarry Smith 38183a40ed3dSBarry Smith PetscFunctionBegin; 3819f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 3820117016b1SBarry Smith ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 3821c4752a88SBarry Smith ierr = MatSetType(*A,MATSEQAIJ);CHKERRQ(ierr); 3822d28bb7d2SJed Brown ierr = MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz);CHKERRQ(ierr); 3823273d9f13SBarry Smith PetscFunctionReturn(0); 3824273d9f13SBarry Smith } 3825273d9f13SBarry Smith 3826273d9f13SBarry Smith /*@C 3827273d9f13SBarry Smith MatSeqAIJSetPreallocation - For good matrix assembly performance 3828273d9f13SBarry Smith the user should preallocate the matrix storage by setting the parameter nz 3829273d9f13SBarry Smith (or the array nnz). 
By setting these parameters accurately, performance 3830273d9f13SBarry Smith during matrix assembly can be increased by more than a factor of 50. 3831273d9f13SBarry Smith 3832d083f849SBarry Smith Collective 3833273d9f13SBarry Smith 3834273d9f13SBarry Smith Input Parameters: 38351c4f3114SJed Brown + B - The matrix 3836273d9f13SBarry Smith . nz - number of nonzeros per row (same for all rows) 3837273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows 38380298fd71SBarry Smith (possibly different for each row) or NULL 3839273d9f13SBarry Smith 3840273d9f13SBarry Smith Notes: 384149a6f317SBarry Smith If nnz is given then nz is ignored 384249a6f317SBarry Smith 3843273d9f13SBarry Smith The AIJ format (also called the Yale sparse matrix format or 3844273d9f13SBarry Smith compressed row storage), is fully compatible with standard Fortran 77 3845273d9f13SBarry Smith storage. That is, the stored row and column indices can begin at 3846273d9f13SBarry Smith either one (as in Fortran) or zero. See the users' manual for details. 3847273d9f13SBarry Smith 3848273d9f13SBarry Smith Specify the preallocated storage with either nz or nnz (not both). 38490298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 3850273d9f13SBarry Smith allocation. For large problems you MUST preallocate memory or you 3851273d9f13SBarry Smith will get TERRIBLE performance, see the users' manual chapter on matrices. 3852273d9f13SBarry Smith 3853aa95bbe8SBarry Smith You can call MatGetInfo() to get information on how effective the preallocation was; 3854aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 3855aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 3856aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 
3857aa95bbe8SBarry Smith 3858a96a251dSBarry Smith Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix 3859a96a251dSBarry Smith entries or columns indices 3860a96a251dSBarry Smith 3861273d9f13SBarry Smith By default, this format uses inodes (identical nodes) when possible, to 3862273d9f13SBarry Smith improve numerical efficiency of matrix-vector products and solves. We 3863273d9f13SBarry Smith search for consecutive rows with the same nonzero structure, thereby 3864273d9f13SBarry Smith reusing matrix information to achieve increased efficiency. 3865273d9f13SBarry Smith 3866273d9f13SBarry Smith Options Database Keys: 3867698d4c6aSKris Buschelman + -mat_no_inode - Do not use inodes 386847b2e64bSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5) 3869273d9f13SBarry Smith 3870273d9f13SBarry Smith Level: intermediate 3871273d9f13SBarry Smith 387269b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays(), MatGetInfo() 3873273d9f13SBarry Smith 3874273d9f13SBarry Smith @*/ 38757087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[]) 3876273d9f13SBarry Smith { 38774ac538c5SBarry Smith PetscErrorCode ierr; 3878a23d5eceSKris Buschelman 3879a23d5eceSKris Buschelman PetscFunctionBegin; 38806ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 38816ba663aaSJed Brown PetscValidType(B,1); 38824ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz));CHKERRQ(ierr); 3883a23d5eceSKris Buschelman PetscFunctionReturn(0); 3884a23d5eceSKris Buschelman } 3885a23d5eceSKris Buschelman 38867087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz) 3887a23d5eceSKris Buschelman { 3888273d9f13SBarry Smith Mat_SeqAIJ *b; 38892576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE,realalloc = PETSC_FALSE; 
38906849ba73SBarry Smith PetscErrorCode ierr; 389197f1f81fSBarry Smith PetscInt i; 3892273d9f13SBarry Smith 3893273d9f13SBarry Smith PetscFunctionBegin; 38942576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 3895a96a251dSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 3896c461c341SBarry Smith skipallocation = PETSC_TRUE; 3897c461c341SBarry Smith nz = 0; 3898c461c341SBarry Smith } 389926283091SBarry Smith ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 390026283091SBarry Smith ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 3901899cda47SBarry Smith 3902435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 390360e0710aSBarry Smith if (nz < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %D",nz); 3904cf9c20a2SJed Brown if (PetscUnlikelyDebug(nnz)) { 3905d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) { 390660e0710aSBarry Smith if (nnz[i] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %D value %D",i,nnz[i]); 390760e0710aSBarry Smith if (nnz[i] > B->cmap->n) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %D value %d rowlength %D",i,nnz[i],B->cmap->n); 3908b73539f3SBarry Smith } 3909b73539f3SBarry Smith } 3910b73539f3SBarry Smith 3911273d9f13SBarry Smith B->preallocated = PETSC_TRUE; 39122205254eSKarl Rupp 3913273d9f13SBarry Smith b = (Mat_SeqAIJ*)B->data; 3914273d9f13SBarry Smith 3915ab93d7beSBarry Smith if (!skipallocation) { 39162ee49352SLisandro Dalcin if (!b->imax) { 3917071fcb05SBarry Smith ierr = PetscMalloc1(B->rmap->n,&b->imax);CHKERRQ(ierr); 3918071fcb05SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3919071fcb05SBarry Smith } 3920071fcb05SBarry Smith if (!b->ilen) { 3921071fcb05SBarry Smith /* b->ilen will count nonzeros in each row so far. 
*/ 3922071fcb05SBarry Smith ierr = PetscCalloc1(B->rmap->n,&b->ilen);CHKERRQ(ierr); 3923071fcb05SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3924071fcb05SBarry Smith } else { 3925071fcb05SBarry Smith ierr = PetscMemzero(b->ilen,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 39262ee49352SLisandro Dalcin } 3927846b4da1SFande Kong if (!b->ipre) { 3928846b4da1SFande Kong ierr = PetscMalloc1(B->rmap->n,&b->ipre);CHKERRQ(ierr); 3929846b4da1SFande Kong ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr); 3930846b4da1SFande Kong } 3931273d9f13SBarry Smith if (!nnz) { 3932435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10; 3933c62bd62aSJed Brown else if (nz < 0) nz = 1; 39345d2a9ed1SStefano Zampini nz = PetscMin(nz,B->cmap->n); 3935d0f46423SBarry Smith for (i=0; i<B->rmap->n; i++) b->imax[i] = nz; 3936d0f46423SBarry Smith nz = nz*B->rmap->n; 3937273d9f13SBarry Smith } else { 3938c73702f5SBarry Smith PetscInt64 nz64 = 0; 3939c73702f5SBarry Smith for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz64 += nnz[i];} 3940c73702f5SBarry Smith ierr = PetscIntCast(nz64,&nz);CHKERRQ(ierr); 3941273d9f13SBarry Smith } 3942ab93d7beSBarry Smith 3943273d9f13SBarry Smith /* allocate the matrix space */ 394453dd7562SDmitry Karpeev /* FIXME: should B's old memory be unlogged? 
*/ 39452ee49352SLisandro Dalcin ierr = MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i);CHKERRQ(ierr); 3946396832f4SHong Zhang if (B->structure_only) { 39475848002fSHong Zhang ierr = PetscMalloc1(nz,&b->j);CHKERRQ(ierr); 39485848002fSHong Zhang ierr = PetscMalloc1(B->rmap->n+1,&b->i);CHKERRQ(ierr); 3949396832f4SHong Zhang ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*sizeof(PetscInt));CHKERRQ(ierr); 3950396832f4SHong Zhang } else { 3951dcca6d9dSJed Brown ierr = PetscMalloc3(nz,&b->a,nz,&b->j,B->rmap->n+1,&b->i);CHKERRQ(ierr); 39523bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)));CHKERRQ(ierr); 3953396832f4SHong Zhang } 3954bfeeae90SHong Zhang b->i[0] = 0; 3955d0f46423SBarry Smith for (i=1; i<B->rmap->n+1; i++) { 39565da197adSKris Buschelman b->i[i] = b->i[i-1] + b->imax[i-1]; 39575da197adSKris Buschelman } 3958396832f4SHong Zhang if (B->structure_only) { 3959396832f4SHong Zhang b->singlemalloc = PETSC_FALSE; 3960396832f4SHong Zhang b->free_a = PETSC_FALSE; 3961396832f4SHong Zhang } else { 3962273d9f13SBarry Smith b->singlemalloc = PETSC_TRUE; 3963e6b907acSBarry Smith b->free_a = PETSC_TRUE; 3964396832f4SHong Zhang } 3965e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 3966c461c341SBarry Smith } else { 3967e6b907acSBarry Smith b->free_a = PETSC_FALSE; 3968e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 3969c461c341SBarry Smith } 3970273d9f13SBarry Smith 3971846b4da1SFande Kong if (b->ipre && nnz != b->ipre && b->imax) { 3972846b4da1SFande Kong /* reserve user-requested sparsity */ 3973580bdb30SBarry Smith ierr = PetscArraycpy(b->ipre,b->imax,B->rmap->n);CHKERRQ(ierr); 3974846b4da1SFande Kong } 3975846b4da1SFande Kong 3976846b4da1SFande Kong 3977273d9f13SBarry Smith b->nz = 0; 3978273d9f13SBarry Smith b->maxnz = nz; 3979273d9f13SBarry Smith B->info.nz_unneeded = (double)b->maxnz; 39802205254eSKarl Rupp if (realalloc) { 39812205254eSKarl Rupp ierr = 
MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 39822205254eSKarl Rupp } 3983cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 3984cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 3985273d9f13SBarry Smith PetscFunctionReturn(0); 3986273d9f13SBarry Smith } 3987273d9f13SBarry Smith 3988846b4da1SFande Kong 3989846b4da1SFande Kong PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A) 3990846b4da1SFande Kong { 3991846b4da1SFande Kong Mat_SeqAIJ *a; 3992a5bbaf83SFande Kong PetscInt i; 3993846b4da1SFande Kong PetscErrorCode ierr; 3994846b4da1SFande Kong 3995846b4da1SFande Kong PetscFunctionBegin; 3996846b4da1SFande Kong PetscValidHeaderSpecific(A,MAT_CLASSID,1); 399714d0e64fSAlex Lindsay 399814d0e64fSAlex Lindsay /* Check local size. If zero, then return */ 399914d0e64fSAlex Lindsay if (!A->rmap->n) PetscFunctionReturn(0); 400014d0e64fSAlex Lindsay 4001846b4da1SFande Kong a = (Mat_SeqAIJ*)A->data; 40022c814fdeSFande Kong /* if no saved info, we error out */ 4003fb4dc15dSAlex Lindsay if (!a->ipre) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"No saved preallocation info \n"); 40042c814fdeSFande Kong 4005fb4dc15dSAlex Lindsay if (!a->i || !a->j || !a->a || !a->imax || !a->ilen) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Memory info is incomplete, and can not reset preallocation \n"); 40062c814fdeSFande Kong 4007580bdb30SBarry Smith ierr = PetscArraycpy(a->imax,a->ipre,A->rmap->n);CHKERRQ(ierr); 4008580bdb30SBarry Smith ierr = PetscArrayzero(a->ilen,A->rmap->n);CHKERRQ(ierr); 4009846b4da1SFande Kong a->i[0] = 0; 4010846b4da1SFande Kong for (i=1; i<A->rmap->n+1; i++) { 4011846b4da1SFande Kong a->i[i] = a->i[i-1] + a->imax[i-1]; 4012846b4da1SFande Kong } 4013846b4da1SFande Kong A->preallocated = PETSC_TRUE; 4014846b4da1SFande Kong a->nz = 0; 4015846b4da1SFande Kong a->maxnz = a->i[A->rmap->n]; 4016846b4da1SFande Kong A->info.nz_unneeded = (double)a->maxnz; 4017846b4da1SFande Kong A->was_assembled = PETSC_FALSE; 4018846b4da1SFande Kong A->assembled = 
PETSC_FALSE; 4019846b4da1SFande Kong PetscFunctionReturn(0); 4020846b4da1SFande Kong } 4021846b4da1SFande Kong 402258d36128SBarry Smith /*@ 4023a1661176SMatthew Knepley MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format. 4024a1661176SMatthew Knepley 4025a1661176SMatthew Knepley Input Parameters: 4026a1661176SMatthew Knepley + B - the matrix 4027a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero) 4028a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row 4029a1661176SMatthew Knepley - v - optional values in the matrix 4030a1661176SMatthew Knepley 4031a1661176SMatthew Knepley Level: developer 4032a1661176SMatthew Knepley 403358d36128SBarry Smith The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays() 403458d36128SBarry Smith 4035c1c1d628SHong Zhang .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatSeqAIJSetPreallocation(), MatCreateSeqAIJ(), MATSEQAIJ 4036a1661176SMatthew Knepley @*/ 4037a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[]) 4038a1661176SMatthew Knepley { 4039a1661176SMatthew Knepley PetscErrorCode ierr; 4040a1661176SMatthew Knepley 4041a1661176SMatthew Knepley PetscFunctionBegin; 40420700a824SBarry Smith PetscValidHeaderSpecific(B,MAT_CLASSID,1); 40436ba663aaSJed Brown PetscValidType(B,1); 40444ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v));CHKERRQ(ierr); 4045a1661176SMatthew Knepley PetscFunctionReturn(0); 4046a1661176SMatthew Knepley } 4047a1661176SMatthew Knepley 40487087cfbeSBarry Smith PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[]) 4049a1661176SMatthew Knepley { 4050a1661176SMatthew Knepley PetscInt 
i; 4051a1661176SMatthew Knepley PetscInt m,n; 4052a1661176SMatthew Knepley PetscInt nz; 4053a1661176SMatthew Knepley PetscInt *nnz, nz_max = 0; 4054a1661176SMatthew Knepley PetscErrorCode ierr; 4055a1661176SMatthew Knepley 4056a1661176SMatthew Knepley PetscFunctionBegin; 405765e19b50SBarry Smith if (Ii[0]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %D", Ii[0]); 4058779a8d59SSatish Balay 4059779a8d59SSatish Balay ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 4060779a8d59SSatish Balay ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 4061779a8d59SSatish Balay 4062779a8d59SSatish Balay ierr = MatGetSize(B, &m, &n);CHKERRQ(ierr); 4063854ce69bSBarry Smith ierr = PetscMalloc1(m+1, &nnz);CHKERRQ(ierr); 4064a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4065b7940d39SSatish Balay nz = Ii[i+1]- Ii[i]; 4066a1661176SMatthew Knepley nz_max = PetscMax(nz_max, nz); 406765e19b50SBarry Smith if (nz < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %D has a negative number of columns %D", i, nnz); 4068a1661176SMatthew Knepley nnz[i] = nz; 4069a1661176SMatthew Knepley } 4070a1661176SMatthew Knepley ierr = MatSeqAIJSetPreallocation(B, 0, nnz);CHKERRQ(ierr); 4071a1661176SMatthew Knepley ierr = PetscFree(nnz);CHKERRQ(ierr); 4072a1661176SMatthew Knepley 4073a1661176SMatthew Knepley for (i = 0; i < m; i++) { 4074071fcb05SBarry Smith ierr = MatSetValues_SeqAIJ(B, 1, &i, Ii[i+1] - Ii[i], J+Ii[i], v ? 
v + Ii[i] : NULL, INSERT_VALUES);CHKERRQ(ierr); 4075a1661176SMatthew Knepley } 4076a1661176SMatthew Knepley 4077a1661176SMatthew Knepley ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4078a1661176SMatthew Knepley ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4079a1661176SMatthew Knepley 40807827cd58SJed Brown ierr = MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 4081a1661176SMatthew Knepley PetscFunctionReturn(0); 4082a1661176SMatthew Knepley } 4083a1661176SMatthew Knepley 4084c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h> 4085af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h> 4086170fe5c8SBarry Smith 4087170fe5c8SBarry Smith /* 4088170fe5c8SBarry Smith Computes (B'*A')' since computing B*A directly is untenable 4089170fe5c8SBarry Smith 4090170fe5c8SBarry Smith n p p 4091170fe5c8SBarry Smith ( ) ( ) ( ) 4092170fe5c8SBarry Smith m ( A ) * n ( B ) = m ( C ) 4093170fe5c8SBarry Smith ( ) ( ) ( ) 4094170fe5c8SBarry Smith 4095170fe5c8SBarry Smith */ 4096170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C) 4097170fe5c8SBarry Smith { 4098170fe5c8SBarry Smith PetscErrorCode ierr; 4099170fe5c8SBarry Smith Mat_SeqDense *sub_a = (Mat_SeqDense*)A->data; 4100170fe5c8SBarry Smith Mat_SeqAIJ *sub_b = (Mat_SeqAIJ*)B->data; 4101170fe5c8SBarry Smith Mat_SeqDense *sub_c = (Mat_SeqDense*)C->data; 410286214ceeSStefano Zampini PetscInt i,j,n,m,q,p; 4103170fe5c8SBarry Smith const PetscInt *ii,*idx; 4104170fe5c8SBarry Smith const PetscScalar *b,*a,*a_q; 4105170fe5c8SBarry Smith PetscScalar *c,*c_q; 410686214ceeSStefano Zampini PetscInt clda = sub_c->lda; 410786214ceeSStefano Zampini PetscInt alda = sub_a->lda; 4108170fe5c8SBarry Smith 4109170fe5c8SBarry Smith PetscFunctionBegin; 4110d0f46423SBarry Smith m = A->rmap->n; 4111d0f46423SBarry Smith n = A->cmap->n; 4112d0f46423SBarry Smith p = B->cmap->n; 4113170fe5c8SBarry Smith a = sub_a->v; 4114170fe5c8SBarry Smith b = 
sub_b->a; 4115170fe5c8SBarry Smith c = sub_c->v; 411686214ceeSStefano Zampini if (clda == m) { 4117580bdb30SBarry Smith ierr = PetscArrayzero(c,m*p);CHKERRQ(ierr); 411886214ceeSStefano Zampini } else { 411986214ceeSStefano Zampini for (j=0;j<p;j++) 412086214ceeSStefano Zampini for (i=0;i<m;i++) 412186214ceeSStefano Zampini c[j*clda + i] = 0.0; 412286214ceeSStefano Zampini } 4123170fe5c8SBarry Smith ii = sub_b->i; 4124170fe5c8SBarry Smith idx = sub_b->j; 4125170fe5c8SBarry Smith for (i=0; i<n; i++) { 4126170fe5c8SBarry Smith q = ii[i+1] - ii[i]; 4127170fe5c8SBarry Smith while (q-->0) { 412886214ceeSStefano Zampini c_q = c + clda*(*idx); 412986214ceeSStefano Zampini a_q = a + alda*i; 4130854c7f52SBarry Smith PetscKernelAXPY(c_q,*b,a_q,m); 4131170fe5c8SBarry Smith idx++; 4132170fe5c8SBarry Smith b++; 4133170fe5c8SBarry Smith } 4134170fe5c8SBarry Smith } 4135170fe5c8SBarry Smith PetscFunctionReturn(0); 4136170fe5c8SBarry Smith } 4137170fe5c8SBarry Smith 41384222ddf1SHong Zhang PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat C) 4139170fe5c8SBarry Smith { 4140170fe5c8SBarry Smith PetscErrorCode ierr; 4141d0f46423SBarry Smith PetscInt m=A->rmap->n,n=B->cmap->n; 414286214ceeSStefano Zampini PetscBool cisdense; 4143170fe5c8SBarry Smith 4144170fe5c8SBarry Smith PetscFunctionBegin; 414560e0710aSBarry Smith if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %D != B->rmap->n %D\n",A->cmap->n,B->rmap->n); 41464222ddf1SHong Zhang ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr); 41474222ddf1SHong Zhang ierr = MatSetBlockSizesFromMats(C,A,B);CHKERRQ(ierr); 414886214ceeSStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr); 414986214ceeSStefano Zampini if (!cisdense) { 415086214ceeSStefano Zampini ierr = MatSetType(C,MATDENSE);CHKERRQ(ierr); 415186214ceeSStefano Zampini } 415286214ceeSStefano Zampini ierr = MatSetUp(C);CHKERRQ(ierr); 4153d73949e8SHong 
Zhang 41544222ddf1SHong Zhang C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ; 4155170fe5c8SBarry Smith PetscFunctionReturn(0); 4156170fe5c8SBarry Smith } 4157170fe5c8SBarry Smith 4158170fe5c8SBarry Smith /* ----------------------------------------------------------------*/ 41590bad9183SKris Buschelman /*MC 4160fafad747SKris Buschelman MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices, 41610bad9183SKris Buschelman based on compressed sparse row format. 41620bad9183SKris Buschelman 41630bad9183SKris Buschelman Options Database Keys: 41640bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions() 41650bad9183SKris Buschelman 41660bad9183SKris Buschelman Level: beginner 41670bad9183SKris Buschelman 41680cd7f59aSBarry Smith Notes: 41690cd7f59aSBarry Smith MatSetValues() may be called for this matrix type with a NULL argument for the numerical values, 41700cd7f59aSBarry Smith in this case the values associated with the rows and columns one passes in are set to zero 41710cd7f59aSBarry Smith in the matrix 41720cd7f59aSBarry Smith 41730cd7f59aSBarry Smith MatSetOptions(,MAT_STRUCTURE_ONLY,PETSC_TRUE) may be called for this matrix type. In this no 41740cd7f59aSBarry Smith space is allocated for the nonzero entries and any entries passed with MatSetValues() are ignored 41750cd7f59aSBarry Smith 41760cd7f59aSBarry Smith Developer Notes: 41770cd7f59aSBarry Smith It would be nice if all matrix formats supported passing NULL in for the numerical values 41780cd7f59aSBarry Smith 4179f587520bSBarry Smith .seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType 41800bad9183SKris Buschelman M*/ 41810bad9183SKris Buschelman 4182ccd284c7SBarry Smith /*MC 4183ccd284c7SBarry Smith MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices. 

   This matrix type is identical to MATSEQAIJ when constructed with a single process communicator,
   and MATMPIAIJ otherwise.  As a result, for single process communicators,
   MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aij - sets the matrix type to "aij" during a call to MatSetFromOptions()

   Developer Notes:
    Subclasses include MATAIJCUSPARSE, MATAIJPERM, MATAIJSELL, MATAIJMKL, and MATAIJCRL. The type also
    automatically switches over to use inodes when enough exist.

   Level: beginner

.seealso: MatCreateAIJ(), MatCreateSeqAIJ(), MATSEQAIJ, MATMPIAIJ
M*/

/*MC
   MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.

   This matrix type is identical to MATSEQAIJCRL when constructed with a single process communicator,
   and MATMPIAIJCRL otherwise.  As a result, for single process communicators,
   MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to MatSetFromOptions()

   Level: beginner

.seealso: MatCreateMPIAIJCRL(), MATSEQAIJCRL, MATMPIAIJCRL
M*/

/*
   Prototypes for conversion and product-setup routines that MatCreate_SeqAIJ() composes onto
   every new matrix. The ones tied to an optional package are only declared when the matching
   PETSC_HAVE_* macro is defined.
*/
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*);
#if defined(PETSC_HAVE_ELEMENTAL)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat,MatType,MatReuse,Mat*);
#endif
#if defined(PETSC_HAVE_SCALAPACK)
PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat,MatType,MatReuse,Mat*);
#endif
#if defined(PETSC_HAVE_HYPRE)
PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A,MatType,MatReuse,Mat*);
#endif
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqDense(Mat,MatType,MatReuse,Mat*);

PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat,MatType,MatReuse,Mat*);
PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat,MatType,MatReuse,Mat*);
PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);

/*@C
   MatSeqAIJGetArray - gives read/write access to the array where the data for a MATSEQAIJ matrix is stored

   Not Collective

   Input Parameter:
.
A - a MATSEQAIJ matrix

   Output Parameter:
.  array - pointer to the data

   Level: intermediate

   Notes:
   The request is forwarded to whatever implementation is composed on A under the name
   "MatSeqAIJGetArray_C"; this routine does no work of its own.

.seealso: MatSeqAIJRestoreArray(), MatSeqAIJGetArrayRead(), MatSeqAIJGetArrayF90()
@*/
PetscErrorCode MatSeqAIJGetArray(Mat A,PetscScalar **array)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  /* dispatch through the composed-function table so subtypes can supply their own accessor */
  ierr = PetscUseMethod(A,"MatSeqAIJGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*@C
   MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a MATSEQAIJ matrix is stored

   Not Collective

   Input Parameter:
.  A - a MATSEQAIJ matrix

   Output Parameter:
.
array - pointer to the data 42708f1ea47aSStefano Zampini 42718f1ea47aSStefano Zampini Level: intermediate 42728f1ea47aSStefano Zampini 42738f1ea47aSStefano Zampini .seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayRead() 42748f1ea47aSStefano Zampini @*/ 42758f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJGetArrayRead(Mat A,const PetscScalar **array) 42768f1ea47aSStefano Zampini { 42778f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4278c70f7ee4SJunchao Zhang PetscOffloadMask oval; 42798f1ea47aSStefano Zampini #endif 42808f1ea47aSStefano Zampini PetscErrorCode ierr; 42818f1ea47aSStefano Zampini 42828f1ea47aSStefano Zampini PetscFunctionBegin; 42838f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4284c70f7ee4SJunchao Zhang oval = A->offloadmask; 42858f1ea47aSStefano Zampini #endif 42868f1ea47aSStefano Zampini ierr = MatSeqAIJGetArray(A,(PetscScalar**)array);CHKERRQ(ierr); 42878f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4288c70f7ee4SJunchao Zhang if (oval == PETSC_OFFLOAD_GPU || oval == PETSC_OFFLOAD_BOTH) A->offloadmask = PETSC_OFFLOAD_BOTH; 42898f1ea47aSStefano Zampini #endif 42908f1ea47aSStefano Zampini PetscFunctionReturn(0); 42918f1ea47aSStefano Zampini } 42928f1ea47aSStefano Zampini 42938f1ea47aSStefano Zampini /*@C 42948f1ea47aSStefano Zampini MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from MatSeqAIJGetArrayRead 42958f1ea47aSStefano Zampini 42968f1ea47aSStefano Zampini Not Collective 42978f1ea47aSStefano Zampini 42988f1ea47aSStefano Zampini Input Parameter: 42998f1ea47aSStefano Zampini . mat - a MATSEQAIJ matrix 43008f1ea47aSStefano Zampini 43018f1ea47aSStefano Zampini Output Parameter: 43028f1ea47aSStefano Zampini . 
array - pointer to the data 43038f1ea47aSStefano Zampini 43048f1ea47aSStefano Zampini Level: intermediate 43058f1ea47aSStefano Zampini 43068f1ea47aSStefano Zampini .seealso: MatSeqAIJGetArray(), MatSeqAIJGetArrayRead() 43078f1ea47aSStefano Zampini @*/ 43088f1ea47aSStefano Zampini PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A,const PetscScalar **array) 43098f1ea47aSStefano Zampini { 43108f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4311c70f7ee4SJunchao Zhang PetscOffloadMask oval; 43128f1ea47aSStefano Zampini #endif 43138f1ea47aSStefano Zampini PetscErrorCode ierr; 43148f1ea47aSStefano Zampini 43158f1ea47aSStefano Zampini PetscFunctionBegin; 43168f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4317c70f7ee4SJunchao Zhang oval = A->offloadmask; 43188f1ea47aSStefano Zampini #endif 43198f1ea47aSStefano Zampini ierr = MatSeqAIJRestoreArray(A,(PetscScalar**)array);CHKERRQ(ierr); 43208f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL) 4321c70f7ee4SJunchao Zhang A->offloadmask = oval; 43228f1ea47aSStefano Zampini #endif 43238f1ea47aSStefano Zampini PetscFunctionReturn(0); 43248f1ea47aSStefano Zampini } 43258f1ea47aSStefano Zampini 43268f1ea47aSStefano Zampini /*@C 432721e72a00SBarry Smith MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row 432821e72a00SBarry Smith 432921e72a00SBarry Smith Not Collective 433021e72a00SBarry Smith 433121e72a00SBarry Smith Input Parameter: 4332579dbff0SBarry Smith . mat - a MATSEQAIJ matrix 433321e72a00SBarry Smith 433421e72a00SBarry Smith Output Parameter: 433521e72a00SBarry Smith . 
nz - the maximum number of nonzeros in any row

   Level: intermediate

   Notes:
   Returns the rmax value stored in the matrix data structure; nothing is recomputed.
   A->data is cast to Mat_SeqAIJ without a type check.

.seealso: MatSeqAIJSetPreallocation()
@*/
PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A,PetscInt *nz)
{
  Mat_SeqAIJ *aij = (Mat_SeqAIJ*)A->data;

  PetscFunctionBegin;
  *nz = aij->rmax;
  PetscFunctionReturn(0);
}

/*@C
   MatSeqAIJRestoreArray - returns access to the array where the data for a MATSEQAIJ matrix is stored obtained by MatSeqAIJGetArray()

   Not Collective

   Input Parameters:
+  A - a MATSEQAIJ matrix
-  array - pointer to the data

   Level: intermediate

   Notes:
   The request is forwarded to whatever implementation is composed on A under the name
   "MatSeqAIJRestoreArray_C".

.seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayF90()
@*/
PetscErrorCode MatSeqAIJRestoreArray(Mat A,PetscScalar **array)
{
  PetscErrorCode ierr;

  PetscFunctionBegin;
  /* dispatch through the composed-function table, mirroring MatSeqAIJGetArray() */
  ierr = PetscUseMethod(A,"MatSeqAIJRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#if defined(PETSC_HAVE_CUDA)
/* composed onto new matrices by MatCreate_SeqAIJ() in CUDA builds */
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat);
#endif

PETSC_EXTERN PetscErrorCode
MatCreate_SeqAIJ(Mat B) 4377273d9f13SBarry Smith { 4378273d9f13SBarry Smith Mat_SeqAIJ *b; 4379dfbe8321SBarry Smith PetscErrorCode ierr; 438038baddfdSBarry Smith PetscMPIInt size; 4381273d9f13SBarry Smith 4382273d9f13SBarry Smith PetscFunctionBegin; 4383ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr); 4384e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1"); 4385273d9f13SBarry Smith 4386b00a9115SJed Brown ierr = PetscNewLog(B,&b);CHKERRQ(ierr); 43872205254eSKarl Rupp 4388b0a32e0cSBarry Smith B->data = (void*)b; 43892205254eSKarl Rupp 4390549d3d68SSatish Balay ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 4391071fcb05SBarry Smith if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull; 43922205254eSKarl Rupp 4393416022c9SBarry Smith b->row = 0; 4394416022c9SBarry Smith b->col = 0; 439582bf6240SBarry Smith b->icol = 0; 4396b810aeb4SBarry Smith b->reallocs = 0; 439736db0b34SBarry Smith b->ignorezeroentries = PETSC_FALSE; 4398f1e2ffcdSBarry Smith b->roworiented = PETSC_TRUE; 4399416022c9SBarry Smith b->nonew = 0; 4400416022c9SBarry Smith b->diag = 0; 4401416022c9SBarry Smith b->solve_work = 0; 44022a1b7f2aSHong Zhang B->spptr = 0; 4403be6bf707SBarry Smith b->saved_values = 0; 4404d7f994e1SBarry Smith b->idiag = 0; 440571f1c65dSBarry Smith b->mdiag = 0; 440671f1c65dSBarry Smith b->ssor_work = 0; 440771f1c65dSBarry Smith b->omega = 1.0; 440871f1c65dSBarry Smith b->fshift = 0.0; 440971f1c65dSBarry Smith b->idiagvalid = PETSC_FALSE; 4410bbead8a2SBarry Smith b->ibdiagvalid = PETSC_FALSE; 4411a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 441217ab2063SBarry Smith 441335d8aa7fSBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 4414bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJGetArray_C",MatSeqAIJGetArray_SeqAIJ);CHKERRQ(ierr); 4415bdf89e91SBarry 
Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJRestoreArray_C",MatSeqAIJRestoreArray_SeqAIJ);CHKERRQ(ierr); 44168c778c55SBarry Smith 4417b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 4418bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEnginePut_C",MatlabEnginePut_SeqAIJ);CHKERRQ(ierr); 4419bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEngineGet_C",MatlabEngineGet_SeqAIJ);CHKERRQ(ierr); 4420b3866ffcSBarry Smith #endif 442117f1a0eaSHong Zhang 4422bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetColumnIndices_C",MatSeqAIJSetColumnIndices_SeqAIJ);CHKERRQ(ierr); 4423bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqAIJ);CHKERRQ(ierr); 4424bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqAIJ);CHKERRQ(ierr); 4425bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsbaij_C",MatConvert_SeqAIJ_SeqSBAIJ);CHKERRQ(ierr); 4426bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqbaij_C",MatConvert_SeqAIJ_SeqBAIJ);CHKERRQ(ierr); 4427bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijperm_C",MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 44284dfdc2d9SRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijsell_C",MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr); 44299779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 44304a2a386eSRichard Tran Mills ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijmkl_C",MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr); 4431191b95cbSRichard Tran Mills #endif 443234b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA) 443302fe1965SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcusparse_C",MatConvert_SeqAIJ_SeqAIJCUSPARSE);CHKERRQ(ierr); 44344222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",MatProductSetFromOptions_SeqAIJ);CHKERRQ(ierr); 443502fe1965SBarry Smith #endif 4436bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C",MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 4437af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 4438af8000cdSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_elemental_C",MatConvert_SeqAIJ_Elemental);CHKERRQ(ierr); 4439af8000cdSHong Zhang #endif 4440d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 4441d24d4204SJose E. Roman ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_scalapack_C",MatConvert_AIJ_ScaLAPACK);CHKERRQ(ierr); 4442d24d4204SJose E. Roman #endif 444363c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE) 444463c07aadSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_hypre_C",MatConvert_AIJ_HYPRE);CHKERRQ(ierr); 44454222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",MatProductSetFromOptions_Transpose_AIJ_AIJ);CHKERRQ(ierr); 444663c07aadSStefano Zampini #endif 4447b49cda9fSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqdense_C",MatConvert_SeqAIJ_SeqDense);CHKERRQ(ierr); 4448d4002b98SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsell_C",MatConvert_SeqAIJ_SeqSELL);CHKERRQ(ierr); 4449c9225affSStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_is_C",MatConvert_XAIJ_IS);CHKERRQ(ierr); 4450bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatIsTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 4451bdf89e91SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatIsHermitianTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr); 4452bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",MatSeqAIJSetPreallocation_SeqAIJ);CHKERRQ(ierr); 4453846b4da1SFande Kong ierr = PetscObjectComposeFunction((PetscObject)B,"MatResetPreallocation_C",MatResetPreallocation_SeqAIJ);CHKERRQ(ierr); 4454bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C",MatSeqAIJSetPreallocationCSR_SeqAIJ);CHKERRQ(ierr); 4455bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatReorderForNonzeroDiagonal_C",MatReorderForNonzeroDiagonal_SeqAIJ);CHKERRQ(ierr); 44564222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_is_seqaij_C",MatProductSetFromOptions_IS_XAIJ);CHKERRQ(ierr); 44574222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqaij_C",MatProductSetFromOptions_SeqDense_SeqAIJ);CHKERRQ(ierr); 44584222ddf1SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaij_C",MatProductSetFromOptions_SeqAIJ);CHKERRQ(ierr); 44594108e4d5SBarry Smith ierr = MatCreate_SeqAIJ_Inode(B);CHKERRQ(ierr); 446017667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr); 44614099cc6bSBarry Smith ierr = MatSeqAIJSetTypeFromOptions(B);CHKERRQ(ierr); /* this allows changing the matrix subtype to say MATSEQAIJPERM */ 44623a40ed3dSBarry Smith PetscFunctionReturn(0); 446317ab2063SBarry Smith } 446417ab2063SBarry Smith 4465b24902e0SBarry Smith /* 4466b24902e0SBarry Smith Given a matrix generated with MatGetFactor() duplicates all the information in A into B 4467b24902e0SBarry Smith */ 4468ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace) 446917ab2063SBarry Smith { 4470416022c9SBarry Smith 
Mat_SeqAIJ *c,*a = (Mat_SeqAIJ*)A->data; 44716849ba73SBarry Smith PetscErrorCode ierr; 4472071fcb05SBarry Smith PetscInt m = A->rmap->n,i; 447317ab2063SBarry Smith 44743a40ed3dSBarry Smith PetscFunctionBegin; 4475273d9f13SBarry Smith c = (Mat_SeqAIJ*)C->data; 4476273d9f13SBarry Smith 4477d5f3da31SBarry Smith C->factortype = A->factortype; 4478416022c9SBarry Smith c->row = 0; 4479416022c9SBarry Smith c->col = 0; 448082bf6240SBarry Smith c->icol = 0; 44816ad4291fSHong Zhang c->reallocs = 0; 448217ab2063SBarry Smith 44836ad4291fSHong Zhang C->assembled = PETSC_TRUE; 448417ab2063SBarry Smith 4485aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->rmap,&C->rmap);CHKERRQ(ierr); 4486aa5ea44dSBarry Smith ierr = PetscLayoutReference(A->cmap,&C->cmap);CHKERRQ(ierr); 4487eec197d1SBarry Smith 4488071fcb05SBarry Smith ierr = PetscMalloc1(m,&c->imax);CHKERRQ(ierr); 4489071fcb05SBarry Smith ierr = PetscMemcpy(c->imax,a->imax,m*sizeof(PetscInt));CHKERRQ(ierr); 4490071fcb05SBarry Smith ierr = PetscMalloc1(m,&c->ilen);CHKERRQ(ierr); 4491071fcb05SBarry Smith ierr = PetscMemcpy(c->ilen,a->ilen,m*sizeof(PetscInt));CHKERRQ(ierr); 44923bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C, 2*m*sizeof(PetscInt));CHKERRQ(ierr); 449317ab2063SBarry Smith 449417ab2063SBarry Smith /* allocate the matrix space */ 4495f77e22a1SHong Zhang if (mallocmatspace) { 4496dcca6d9dSJed Brown ierr = PetscMalloc3(a->i[m],&c->a,a->i[m],&c->j,m+1,&c->i);CHKERRQ(ierr); 44973bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 44982205254eSKarl Rupp 4499f1e2ffcdSBarry Smith c->singlemalloc = PETSC_TRUE; 45002205254eSKarl Rupp 4501580bdb30SBarry Smith ierr = PetscArraycpy(c->i,a->i,m+1);CHKERRQ(ierr); 450217ab2063SBarry Smith if (m > 0) { 4503580bdb30SBarry Smith ierr = PetscArraycpy(c->j,a->j,a->i[m]);CHKERRQ(ierr); 4504be6bf707SBarry Smith if (cpvalues == MAT_COPY_VALUES) { 4505580bdb30SBarry Smith ierr = 
PetscArraycpy(c->a,a->a,a->i[m]);CHKERRQ(ierr); 4506be6bf707SBarry Smith } else { 4507580bdb30SBarry Smith ierr = PetscArrayzero(c->a,a->i[m]);CHKERRQ(ierr); 450817ab2063SBarry Smith } 450908480c60SBarry Smith } 4510f77e22a1SHong Zhang } 451117ab2063SBarry Smith 45126ad4291fSHong Zhang c->ignorezeroentries = a->ignorezeroentries; 4513416022c9SBarry Smith c->roworiented = a->roworiented; 4514416022c9SBarry Smith c->nonew = a->nonew; 4515416022c9SBarry Smith if (a->diag) { 4516854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&c->diag);CHKERRQ(ierr); 4517071fcb05SBarry Smith ierr = PetscMemcpy(c->diag,a->diag,m*sizeof(PetscInt));CHKERRQ(ierr); 45183bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C,(m+1)*sizeof(PetscInt));CHKERRQ(ierr); 4519071fcb05SBarry Smith } else c->diag = NULL; 45202205254eSKarl Rupp 45216ad4291fSHong Zhang c->solve_work = 0; 45226ad4291fSHong Zhang c->saved_values = 0; 45236ad4291fSHong Zhang c->idiag = 0; 452471f1c65dSBarry Smith c->ssor_work = 0; 4525a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 4526e6b907acSBarry Smith c->free_a = PETSC_TRUE; 4527e6b907acSBarry Smith c->free_ij = PETSC_TRUE; 45286ad4291fSHong Zhang 4529893ad86cSHong Zhang c->rmax = a->rmax; 4530416022c9SBarry Smith c->nz = a->nz; 45318ed568f8SMatthew G Knepley c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 4532273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 4533754ec7b1SSatish Balay 45346ad4291fSHong Zhang c->compressedrow.use = a->compressedrow.use; 45356ad4291fSHong Zhang c->compressedrow.nrows = a->compressedrow.nrows; 4536cd6b891eSBarry Smith if (a->compressedrow.use) { 45376ad4291fSHong Zhang i = a->compressedrow.nrows; 4538dcca6d9dSJed Brown ierr = PetscMalloc2(i+1,&c->compressedrow.i,i,&c->compressedrow.rindex);CHKERRQ(ierr); 4539580bdb30SBarry Smith ierr = PetscArraycpy(c->compressedrow.i,a->compressedrow.i,i+1);CHKERRQ(ierr); 4540580bdb30SBarry Smith ierr = 
PetscArraycpy(c->compressedrow.rindex,a->compressedrow.rindex,i);CHKERRQ(ierr); 454127ea64f8SHong Zhang } else { 454227ea64f8SHong Zhang c->compressedrow.use = PETSC_FALSE; 45430298fd71SBarry Smith c->compressedrow.i = NULL; 45440298fd71SBarry Smith c->compressedrow.rindex = NULL; 45456ad4291fSHong Zhang } 4546ea632784SBarry Smith c->nonzerorowcnt = a->nonzerorowcnt; 4547e56f5c9eSBarry Smith C->nonzerostate = A->nonzerostate; 45484846f1f5SKris Buschelman 45492205254eSKarl Rupp ierr = MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C);CHKERRQ(ierr); 4550140e18c1SBarry Smith ierr = PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist);CHKERRQ(ierr); 45513a40ed3dSBarry Smith PetscFunctionReturn(0); 455217ab2063SBarry Smith } 455317ab2063SBarry Smith 4554b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 4555b24902e0SBarry Smith { 4556b24902e0SBarry Smith PetscErrorCode ierr; 4557b24902e0SBarry Smith 4558b24902e0SBarry Smith PetscFunctionBegin; 4559ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 45604b6263acSBarry Smith ierr = MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr); 4561cfd3f464SBarry Smith if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) { 456233d57670SJed Brown ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr); 4563cfd3f464SBarry Smith } 4564a54f2f98SBarry Smith ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr); 4565f77e22a1SHong Zhang ierr = MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE);CHKERRQ(ierr); 4566b24902e0SBarry Smith PetscFunctionReturn(0); 4567b24902e0SBarry Smith } 4568b24902e0SBarry Smith 4569112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer) 4570fbdbba38SShri Abhyankar { 457152f91c60SVaclav Hapla PetscBool isbinary, ishdf5; 457252f91c60SVaclav Hapla PetscErrorCode ierr; 457352f91c60SVaclav Hapla 457452f91c60SVaclav Hapla PetscFunctionBegin; 
457552f91c60SVaclav Hapla PetscValidHeaderSpecific(newMat,MAT_CLASSID,1); 457652f91c60SVaclav Hapla PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2); 4577c27b3999SVaclav Hapla /* force binary viewer to load .info file if it has not yet done so */ 4578c27b3999SVaclav Hapla ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 457952f91c60SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 458052f91c60SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5, &ishdf5);CHKERRQ(ierr); 458152f91c60SVaclav Hapla if (isbinary) { 458252f91c60SVaclav Hapla ierr = MatLoad_SeqAIJ_Binary(newMat,viewer);CHKERRQ(ierr); 458352f91c60SVaclav Hapla } else if (ishdf5) { 458452f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5) 458552f91c60SVaclav Hapla ierr = MatLoad_AIJ_HDF5(newMat,viewer);CHKERRQ(ierr); 458652f91c60SVaclav Hapla #else 458752f91c60SVaclav Hapla SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5"); 458852f91c60SVaclav Hapla #endif 458952f91c60SVaclav Hapla } else { 459052f91c60SVaclav Hapla SETERRQ2(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name); 459152f91c60SVaclav Hapla } 459252f91c60SVaclav Hapla PetscFunctionReturn(0); 459352f91c60SVaclav Hapla } 459452f91c60SVaclav Hapla 45953ea6fe3dSLisandro Dalcin PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer) 459652f91c60SVaclav Hapla { 45973ea6fe3dSLisandro Dalcin Mat_SeqAIJ *a = (Mat_SeqAIJ*)mat->data; 4598fbdbba38SShri Abhyankar PetscErrorCode ierr; 45993ea6fe3dSLisandro Dalcin PetscInt header[4],*rowlens,M,N,nz,sum,rows,cols,i; 4600fbdbba38SShri Abhyankar 4601fbdbba38SShri Abhyankar PetscFunctionBegin; 46023ea6fe3dSLisandro Dalcin ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr); 4603bbead8a2SBarry Smith 
46043ea6fe3dSLisandro Dalcin /* read in matrix header */ 46053ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT);CHKERRQ(ierr); 46063ea6fe3dSLisandro Dalcin if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file"); 4607fbdbba38SShri Abhyankar M = header[1]; N = header[2]; nz = header[3]; 46083ea6fe3dSLisandro Dalcin if (M < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%D) in file is negative",M); 46093ea6fe3dSLisandro Dalcin if (N < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%D) in file is negative",N); 4610bbead8a2SBarry Smith if (nz < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk, cannot load as SeqAIJ"); 4611fbdbba38SShri Abhyankar 46123ea6fe3dSLisandro Dalcin /* set block sizes from the viewer's .info file */ 46133ea6fe3dSLisandro Dalcin ierr = MatLoad_Binary_BlockSizes(mat,viewer);CHKERRQ(ierr); 46143ea6fe3dSLisandro Dalcin /* set local and global sizes if not set already */ 46153ea6fe3dSLisandro Dalcin if (mat->rmap->n < 0) mat->rmap->n = M; 46163ea6fe3dSLisandro Dalcin if (mat->cmap->n < 0) mat->cmap->n = N; 46173ea6fe3dSLisandro Dalcin if (mat->rmap->N < 0) mat->rmap->N = M; 46183ea6fe3dSLisandro Dalcin if (mat->cmap->N < 0) mat->cmap->N = N; 46193ea6fe3dSLisandro Dalcin ierr = PetscLayoutSetUp(mat->rmap);CHKERRQ(ierr); 46203ea6fe3dSLisandro Dalcin ierr = PetscLayoutSetUp(mat->cmap);CHKERRQ(ierr); 46213ea6fe3dSLisandro Dalcin 46223ea6fe3dSLisandro Dalcin /* check if the matrix sizes are correct */ 46233ea6fe3dSLisandro Dalcin ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr); 46243ea6fe3dSLisandro Dalcin if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%D, %D) than the input matrix (%D, %D)",M,N,rows,cols); 46253ea6fe3dSLisandro Dalcin 4626fbdbba38SShri 
Abhyankar /* read in row lengths */ 46273ea6fe3dSLisandro Dalcin ierr = PetscMalloc1(M,&rowlens);CHKERRQ(ierr); 46283ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,rowlens,M,NULL,PETSC_INT);CHKERRQ(ierr); 46293ea6fe3dSLisandro Dalcin /* check if sum(rowlens) is same as nz */ 46303ea6fe3dSLisandro Dalcin sum = 0; for (i=0; i<M; i++) sum += rowlens[i]; 46313ea6fe3dSLisandro Dalcin if (sum != nz) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Inconsistent matrix data in file: nonzeros = %D, sum-row-lengths = %D\n",nz,sum); 46323ea6fe3dSLisandro Dalcin /* preallocate and check sizes */ 46333ea6fe3dSLisandro Dalcin ierr = MatSeqAIJSetPreallocation_SeqAIJ(mat,0,rowlens);CHKERRQ(ierr); 46343ea6fe3dSLisandro Dalcin ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr); 463560e0710aSBarry Smith if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%D, %D) than the input matrix (%D, %D)",M,N,rows,cols); 46363ea6fe3dSLisandro Dalcin /* store row lengths */ 46373ea6fe3dSLisandro Dalcin ierr = PetscArraycpy(a->ilen,rowlens,M);CHKERRQ(ierr); 46383ea6fe3dSLisandro Dalcin ierr = PetscFree(rowlens);CHKERRQ(ierr); 4639fbdbba38SShri Abhyankar 46403ea6fe3dSLisandro Dalcin /* fill in "i" row pointers */ 46413ea6fe3dSLisandro Dalcin a->i[0] = 0; for (i=0; i<M; i++) a->i[i+1] = a->i[i] + a->ilen[i]; 46423ea6fe3dSLisandro Dalcin /* read in "j" column indices */ 46433ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,a->j,nz,NULL,PETSC_INT);CHKERRQ(ierr); 46443ea6fe3dSLisandro Dalcin /* read in "a" nonzero values */ 46453ea6fe3dSLisandro Dalcin ierr = PetscViewerBinaryRead(viewer,a->a,nz,NULL,PETSC_SCALAR);CHKERRQ(ierr); 4646fbdbba38SShri Abhyankar 46473ea6fe3dSLisandro Dalcin ierr = MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 46483ea6fe3dSLisandro Dalcin ierr = MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4649fbdbba38SShri Abhyankar PetscFunctionReturn(0); 4650fbdbba38SShri Abhyankar 
} 4651fbdbba38SShri Abhyankar 4652ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg) 46537264ac53SSatish Balay { 46547264ac53SSatish Balay Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data,*b = (Mat_SeqAIJ*)B->data; 4655dfbe8321SBarry Smith PetscErrorCode ierr; 4656eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4657eeffb40dSHong Zhang PetscInt k; 4658eeffb40dSHong Zhang #endif 46597264ac53SSatish Balay 46603a40ed3dSBarry Smith PetscFunctionBegin; 4661bfeeae90SHong Zhang /* If the matrix dimensions are not equal,or no of nonzeros */ 4662d0f46423SBarry Smith if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) { 4663ca44d042SBarry Smith *flg = PETSC_FALSE; 4664ca44d042SBarry Smith PetscFunctionReturn(0); 4665bcd2baecSBarry Smith } 46667264ac53SSatish Balay 46677264ac53SSatish Balay /* if the a->i are the same */ 4668580bdb30SBarry Smith ierr = PetscArraycmp(a->i,b->i,A->rmap->n+1,flg);CHKERRQ(ierr); 4669abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 46707264ac53SSatish Balay 46717264ac53SSatish Balay /* if a->j are the same */ 4672580bdb30SBarry Smith ierr = PetscArraycmp(a->j,b->j,a->nz,flg);CHKERRQ(ierr); 4673abc0a331SBarry Smith if (!*flg) PetscFunctionReturn(0); 4674bcd2baecSBarry Smith 4675bcd2baecSBarry Smith /* if a->a are the same */ 4676eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX) 4677eeffb40dSHong Zhang for (k=0; k<a->nz; k++) { 4678eeffb40dSHong Zhang if (PetscRealPart(a->a[k]) != PetscRealPart(b->a[k]) || PetscImaginaryPart(a->a[k]) != PetscImaginaryPart(b->a[k])) { 4679eeffb40dSHong Zhang *flg = PETSC_FALSE; 46803a40ed3dSBarry Smith PetscFunctionReturn(0); 4681eeffb40dSHong Zhang } 4682eeffb40dSHong Zhang } 4683eeffb40dSHong Zhang #else 4684580bdb30SBarry Smith ierr = PetscArraycmp(a->a,b->a,a->nz,flg);CHKERRQ(ierr); 4685eeffb40dSHong Zhang #endif 4686eeffb40dSHong Zhang PetscFunctionReturn(0); 46877264ac53SSatish Balay } 468836db0b34SBarry Smith 468905869f15SSatish Balay /*@ 
469036db0b34SBarry Smith MatCreateSeqAIJWithArrays - Creates an sequential AIJ matrix using matrix elements (in CSR format) 469136db0b34SBarry Smith provided by the user. 469236db0b34SBarry Smith 4693d083f849SBarry Smith Collective 469436db0b34SBarry Smith 469536db0b34SBarry Smith Input Parameters: 469636db0b34SBarry Smith + comm - must be an MPI communicator of size 1 469736db0b34SBarry Smith . m - number of rows 469836db0b34SBarry Smith . n - number of columns 4699483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix 470036db0b34SBarry Smith . j - column indices 470136db0b34SBarry Smith - a - matrix values 470236db0b34SBarry Smith 470336db0b34SBarry Smith Output Parameter: 470436db0b34SBarry Smith . mat - the matrix 470536db0b34SBarry Smith 470636db0b34SBarry Smith Level: intermediate 470736db0b34SBarry Smith 470836db0b34SBarry Smith Notes: 47090551d7c0SBarry Smith The i, j, and a arrays are not copied by this routine, the user must free these arrays 4710292fb18eSBarry Smith once the matrix is destroyed and not before 471136db0b34SBarry Smith 471236db0b34SBarry Smith You cannot set new nonzero locations into this matrix, that will generate an error. 471336db0b34SBarry Smith 4714bfeeae90SHong Zhang The i and j indices are 0 based 471536db0b34SBarry Smith 4716a4552177SSatish Balay The format which is used for the sparse matrix input, is equivalent to a 4717a4552177SSatish Balay row-major ordering.. 
i.e for the following matrix, the input data expected is 47188eef79e4SBarry Smith as shown 4719a4552177SSatish Balay 47208eef79e4SBarry Smith $ 1 0 0 47218eef79e4SBarry Smith $ 2 0 3 47228eef79e4SBarry Smith $ 4 5 6 47238eef79e4SBarry Smith $ 47248eef79e4SBarry Smith $ i = {0,1,3,6} [size = nrow+1 = 3+1] 47258eef79e4SBarry Smith $ j = {0,0,2,0,1,2} [size = 6]; values must be sorted for each row 47268eef79e4SBarry Smith $ v = {1,2,3,4,5,6} [size = 6] 4727a4552177SSatish Balay 47289985e31cSBarry Smith 472969b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateMPIAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 473036db0b34SBarry Smith 473136db0b34SBarry Smith @*/ 4732c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat) 473336db0b34SBarry Smith { 4734dfbe8321SBarry Smith PetscErrorCode ierr; 4735cbcfb4deSHong Zhang PetscInt ii; 473636db0b34SBarry Smith Mat_SeqAIJ *aij; 4737cbcfb4deSHong Zhang PetscInt jj; 473836db0b34SBarry Smith 473936db0b34SBarry Smith PetscFunctionBegin; 474041096f02SStefano Zampini if (m > 0 && i[0]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 4741f69a0ea3SMatthew Knepley ierr = MatCreate(comm,mat);CHKERRQ(ierr); 4742f69a0ea3SMatthew Knepley ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 4743a2f3521dSMark F. 
Adams /* ierr = MatSetBlockSizes(*mat,,);CHKERRQ(ierr); */ 4744ab93d7beSBarry Smith ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 4745ab93d7beSBarry Smith ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,0);CHKERRQ(ierr); 4746ab93d7beSBarry Smith aij = (Mat_SeqAIJ*)(*mat)->data; 4747071fcb05SBarry Smith ierr = PetscMalloc1(m,&aij->imax);CHKERRQ(ierr); 4748071fcb05SBarry Smith ierr = PetscMalloc1(m,&aij->ilen);CHKERRQ(ierr); 4749ab93d7beSBarry Smith 475036db0b34SBarry Smith aij->i = i; 475136db0b34SBarry Smith aij->j = j; 475236db0b34SBarry Smith aij->a = a; 475336db0b34SBarry Smith aij->singlemalloc = PETSC_FALSE; 475436db0b34SBarry Smith aij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 4755e6b907acSBarry Smith aij->free_a = PETSC_FALSE; 4756e6b907acSBarry Smith aij->free_ij = PETSC_FALSE; 475736db0b34SBarry Smith 475836db0b34SBarry Smith for (ii=0; ii<m; ii++) { 475936db0b34SBarry Smith aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii]; 476076bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 476160e0710aSBarry Smith if (i[ii+1] - i[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %D length = %D",ii,i[ii+1] - i[ii]); 47629985e31cSBarry Smith for (jj=i[ii]+1; jj<i[ii+1]; jj++) { 4763a061629eSStefano Zampini if (j[jj] < j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is not sorted",jj-i[ii],j[jj],ii); 4764a061629eSStefano Zampini if (j[jj] == j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is identical to previous entry",jj-i[ii],j[jj],ii); 47659985e31cSBarry Smith } 476636db0b34SBarry Smith } 476776bd3646SJed Brown } 476876bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 476936db0b34SBarry Smith for (ii=0; ii<aij->i[m]; ii++) { 477060e0710aSBarry Smith if (j[ii] < 0) 
SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %D index = %D",ii,j[ii]); 477160e0710aSBarry Smith if (j[ii] > n - 1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %D index = %D",ii,j[ii]); 477236db0b34SBarry Smith } 477376bd3646SJed Brown } 477436db0b34SBarry Smith 4775b65db4caSBarry Smith ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4776b65db4caSBarry Smith ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 477736db0b34SBarry Smith PetscFunctionReturn(0); 477836db0b34SBarry Smith } 477980ef6e79SMatthew G Knepley /*@C 4780d021a1c5SVictor Minden MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format) 47818a0b0e6bSVictor Minden provided by the user. 47828a0b0e6bSVictor Minden 4783d083f849SBarry Smith Collective 47848a0b0e6bSVictor Minden 47858a0b0e6bSVictor Minden Input Parameters: 47868a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1 47878a0b0e6bSVictor Minden . m - number of rows 47888a0b0e6bSVictor Minden . n - number of columns 47898a0b0e6bSVictor Minden . i - row indices 47908a0b0e6bSVictor Minden . j - column indices 47911230e6d1SVictor Minden . a - matrix values 47921230e6d1SVictor Minden . nz - number of nonzeros 47931230e6d1SVictor Minden - idx - 0 or 1 based 47948a0b0e6bSVictor Minden 47958a0b0e6bSVictor Minden Output Parameter: 47968a0b0e6bSVictor Minden . mat - the matrix 47978a0b0e6bSVictor Minden 47988a0b0e6bSVictor Minden Level: intermediate 47998a0b0e6bSVictor Minden 48008a0b0e6bSVictor Minden Notes: 48018a0b0e6bSVictor Minden The i and j indices are 0 based 48028a0b0e6bSVictor Minden 48038a0b0e6bSVictor Minden The format which is used for the sparse matrix input, is equivalent to a 48048a0b0e6bSVictor Minden row-major ordering.. 
i.e for the following matrix, the input data expected is 48058a0b0e6bSVictor Minden as shown: 48068a0b0e6bSVictor Minden 48078a0b0e6bSVictor Minden 1 0 0 48088a0b0e6bSVictor Minden 2 0 3 48098a0b0e6bSVictor Minden 4 5 6 48108a0b0e6bSVictor Minden 48118a0b0e6bSVictor Minden i = {0,1,1,2,2,2} 48128a0b0e6bSVictor Minden j = {0,0,2,0,1,2} 48138a0b0e6bSVictor Minden v = {1,2,3,4,5,6} 48148a0b0e6bSVictor Minden 48158a0b0e6bSVictor Minden 481669b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateSeqAIJWithArrays(), MatMPIAIJSetPreallocationCSR() 48178a0b0e6bSVictor Minden 48188a0b0e6bSVictor Minden @*/ 4819c3c607ccSBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat,PetscInt nz,PetscBool idx) 48208a0b0e6bSVictor Minden { 48218a0b0e6bSVictor Minden PetscErrorCode ierr; 4822d021a1c5SVictor Minden PetscInt ii, *nnz, one = 1,row,col; 48238a0b0e6bSVictor Minden 48248a0b0e6bSVictor Minden 48258a0b0e6bSVictor Minden PetscFunctionBegin; 48261795a4d1SJed Brown ierr = PetscCalloc1(m,&nnz);CHKERRQ(ierr); 48271230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 4828c8d679ebSHong Zhang nnz[i[ii] - !!idx] += 1; 48291230e6d1SVictor Minden } 48308a0b0e6bSVictor Minden ierr = MatCreate(comm,mat);CHKERRQ(ierr); 48318a0b0e6bSVictor Minden ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 48328a0b0e6bSVictor Minden ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr); 48331230e6d1SVictor Minden ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz);CHKERRQ(ierr); 48341230e6d1SVictor Minden for (ii = 0; ii < nz; ii++) { 48351230e6d1SVictor Minden if (idx) { 48361230e6d1SVictor Minden row = i[ii] - 1; 48371230e6d1SVictor Minden col = j[ii] - 1; 48381230e6d1SVictor Minden } else { 48391230e6d1SVictor Minden row = i[ii]; 48401230e6d1SVictor Minden col = j[ii]; 48418a0b0e6bSVictor Minden } 48421230e6d1SVictor Minden ierr = 
MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES);CHKERRQ(ierr); 48438a0b0e6bSVictor Minden } 48448a0b0e6bSVictor Minden ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 48458a0b0e6bSVictor Minden ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4846d021a1c5SVictor Minden ierr = PetscFree(nnz);CHKERRQ(ierr); 48478a0b0e6bSVictor Minden PetscFunctionReturn(0); 48488a0b0e6bSVictor Minden } 484936db0b34SBarry Smith 4850acf2f550SJed Brown PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A) 4851acf2f550SJed Brown { 4852acf2f550SJed Brown Mat_SeqAIJ *a=(Mat_SeqAIJ*)A->data; 4853acf2f550SJed Brown PetscErrorCode ierr; 4854acf2f550SJed Brown 4855acf2f550SJed Brown PetscFunctionBegin; 4856acf2f550SJed Brown a->idiagvalid = PETSC_FALSE; 4857acf2f550SJed Brown a->ibdiagvalid = PETSC_FALSE; 48582205254eSKarl Rupp 4859acf2f550SJed Brown ierr = MatSeqAIJInvalidateDiagonal_Inode(A);CHKERRQ(ierr); 4860acf2f550SJed Brown PetscFunctionReturn(0); 4861acf2f550SJed Brown } 4862acf2f550SJed Brown 48639c8f2541SHong Zhang PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 48649c8f2541SHong Zhang { 48659c8f2541SHong Zhang PetscErrorCode ierr; 48668761c3d6SHong Zhang PetscMPIInt size; 48679c8f2541SHong Zhang 48689c8f2541SHong Zhang PetscFunctionBegin; 48698761c3d6SHong Zhang ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 48707bbdc51dSHong Zhang if (size == 1) { 48717bbdc51dSHong Zhang if (scall == MAT_INITIAL_MATRIX) { 48727bbdc51dSHong Zhang ierr = MatDuplicate(inmat,MAT_COPY_VALUES,outmat);CHKERRQ(ierr); 48737bbdc51dSHong Zhang } else { 48748761c3d6SHong Zhang ierr = MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 48757bbdc51dSHong Zhang } 48768761c3d6SHong Zhang } else { 48779c8f2541SHong Zhang ierr = MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm,inmat,n,scall,outmat);CHKERRQ(ierr); 48788761c3d6SHong Zhang } 48799c8f2541SHong Zhang PetscFunctionReturn(0); 48809c8f2541SHong Zhang } 
48819c8f2541SHong Zhang 488281824310SBarry Smith /* 488353dd7562SDmitry Karpeev Permute A into C's *local* index space using rowemb,colemb. 488453dd7562SDmitry Karpeev The embedding are supposed to be injections and the above implies that the range of rowemb is a subset 488553dd7562SDmitry Karpeev of [0,m), colemb is in [0,n). 488653dd7562SDmitry Karpeev If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A. 488753dd7562SDmitry Karpeev */ 488853dd7562SDmitry Karpeev PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B) 488953dd7562SDmitry Karpeev { 489053dd7562SDmitry Karpeev /* If making this function public, change the error returned in this function away from _PLIB. */ 489153dd7562SDmitry Karpeev PetscErrorCode ierr; 489253dd7562SDmitry Karpeev Mat_SeqAIJ *Baij; 489353dd7562SDmitry Karpeev PetscBool seqaij; 489453dd7562SDmitry Karpeev PetscInt m,n,*nz,i,j,count; 489553dd7562SDmitry Karpeev PetscScalar v; 489653dd7562SDmitry Karpeev const PetscInt *rowindices,*colindices; 489753dd7562SDmitry Karpeev 489853dd7562SDmitry Karpeev PetscFunctionBegin; 489953dd7562SDmitry Karpeev if (!B) PetscFunctionReturn(0); 490053dd7562SDmitry Karpeev /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. 
*/ 49014099cc6bSBarry Smith ierr = PetscObjectBaseTypeCompare((PetscObject)B,MATSEQAIJ,&seqaij);CHKERRQ(ierr); 490253dd7562SDmitry Karpeev if (!seqaij) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is of wrong type"); 490353dd7562SDmitry Karpeev if (rowemb) { 490453dd7562SDmitry Karpeev ierr = ISGetLocalSize(rowemb,&m);CHKERRQ(ierr); 490553dd7562SDmitry Karpeev if (m != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Row IS of size %D is incompatible with matrix row size %D",m,B->rmap->n); 490653dd7562SDmitry Karpeev } else { 49076c4ed002SBarry Smith if (C->rmap->n != B->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is row-incompatible with the target matrix"); 490853dd7562SDmitry Karpeev } 490953dd7562SDmitry Karpeev if (colemb) { 491053dd7562SDmitry Karpeev ierr = ISGetLocalSize(colemb,&n);CHKERRQ(ierr); 491153dd7562SDmitry Karpeev if (n != B->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diag col IS of size %D is incompatible with input matrix col size %D",n,B->cmap->n); 491253dd7562SDmitry Karpeev } else { 491353dd7562SDmitry Karpeev if (C->cmap->n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is col-incompatible with the target matrix"); 491453dd7562SDmitry Karpeev } 491553dd7562SDmitry Karpeev 491653dd7562SDmitry Karpeev Baij = (Mat_SeqAIJ*)(B->data); 491753dd7562SDmitry Karpeev if (pattern == DIFFERENT_NONZERO_PATTERN) { 491853dd7562SDmitry Karpeev ierr = PetscMalloc1(B->rmap->n,&nz);CHKERRQ(ierr); 491953dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 492053dd7562SDmitry Karpeev nz[i] = Baij->i[i+1] - Baij->i[i]; 492153dd7562SDmitry Karpeev } 492253dd7562SDmitry Karpeev ierr = MatSeqAIJSetPreallocation(C,0,nz);CHKERRQ(ierr); 492353dd7562SDmitry Karpeev ierr = PetscFree(nz);CHKERRQ(ierr); 492453dd7562SDmitry Karpeev } 492553dd7562SDmitry Karpeev if (pattern == SUBSET_NONZERO_PATTERN) { 492653dd7562SDmitry Karpeev ierr = MatZeroEntries(C);CHKERRQ(ierr); 492753dd7562SDmitry Karpeev } 492853dd7562SDmitry 
Karpeev count = 0; 492953dd7562SDmitry Karpeev rowindices = NULL; 493053dd7562SDmitry Karpeev colindices = NULL; 493153dd7562SDmitry Karpeev if (rowemb) { 493253dd7562SDmitry Karpeev ierr = ISGetIndices(rowemb,&rowindices);CHKERRQ(ierr); 493353dd7562SDmitry Karpeev } 493453dd7562SDmitry Karpeev if (colemb) { 493553dd7562SDmitry Karpeev ierr = ISGetIndices(colemb,&colindices);CHKERRQ(ierr); 493653dd7562SDmitry Karpeev } 493753dd7562SDmitry Karpeev for (i=0; i<B->rmap->n; i++) { 493853dd7562SDmitry Karpeev PetscInt row; 493953dd7562SDmitry Karpeev row = i; 494053dd7562SDmitry Karpeev if (rowindices) row = rowindices[i]; 494153dd7562SDmitry Karpeev for (j=Baij->i[i]; j<Baij->i[i+1]; j++) { 494253dd7562SDmitry Karpeev PetscInt col; 494353dd7562SDmitry Karpeev col = Baij->j[count]; 494453dd7562SDmitry Karpeev if (colindices) col = colindices[col]; 494553dd7562SDmitry Karpeev v = Baij->a[count]; 494653dd7562SDmitry Karpeev ierr = MatSetValues(C,1,&row,1,&col,&v,INSERT_VALUES);CHKERRQ(ierr); 494753dd7562SDmitry Karpeev ++count; 494853dd7562SDmitry Karpeev } 494953dd7562SDmitry Karpeev } 495053dd7562SDmitry Karpeev /* FIXME: set C's nonzerostate correctly. */ 495153dd7562SDmitry Karpeev /* Assembly for C is necessary. 
*/ 495253dd7562SDmitry Karpeev C->preallocated = PETSC_TRUE; 495353dd7562SDmitry Karpeev C->assembled = PETSC_TRUE; 495453dd7562SDmitry Karpeev C->was_assembled = PETSC_FALSE; 495553dd7562SDmitry Karpeev PetscFunctionReturn(0); 495653dd7562SDmitry Karpeev } 495753dd7562SDmitry Karpeev 49584099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL; 49594099cc6bSBarry Smith 49604099cc6bSBarry Smith /*@C 49614099cc6bSBarry Smith MatSeqAIJSetType - Converts a MATSEQAIJ matrix to a subtype 49624099cc6bSBarry Smith 49634099cc6bSBarry Smith Collective on Mat 49644099cc6bSBarry Smith 49654099cc6bSBarry Smith Input Parameters: 49664099cc6bSBarry Smith + mat - the matrix object 49674099cc6bSBarry Smith - matype - matrix type 49684099cc6bSBarry Smith 49694099cc6bSBarry Smith Options Database Key: 49704099cc6bSBarry Smith . -mat_seqai_type <method> - for example seqaijcrl 49714099cc6bSBarry Smith 49724099cc6bSBarry Smith 49734099cc6bSBarry Smith Level: intermediate 49744099cc6bSBarry Smith 49754099cc6bSBarry Smith .seealso: PCSetType(), VecSetType(), MatCreate(), MatType, Mat 49764099cc6bSBarry Smith @*/ 49774099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype) 49784099cc6bSBarry Smith { 4979fd9d3c67SJed Brown PetscErrorCode ierr,(*r)(Mat,MatType,MatReuse,Mat*); 49804099cc6bSBarry Smith PetscBool sametype; 49814099cc6bSBarry Smith 49824099cc6bSBarry Smith PetscFunctionBegin; 49834099cc6bSBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 49844099cc6bSBarry Smith ierr = PetscObjectTypeCompare((PetscObject)mat,matype,&sametype);CHKERRQ(ierr); 49854099cc6bSBarry Smith if (sametype) PetscFunctionReturn(0); 49864099cc6bSBarry Smith 49874099cc6bSBarry Smith ierr = PetscFunctionListFind(MatSeqAIJList,matype,&r);CHKERRQ(ierr); 49884099cc6bSBarry Smith if (!r) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown Mat type given: %s",matype); 49894099cc6bSBarry Smith ierr = (*r)(mat,matype,MAT_INPLACE_MATRIX,&mat);CHKERRQ(ierr); 49904099cc6bSBarry 
Smith PetscFunctionReturn(0); 49914099cc6bSBarry Smith } 49924099cc6bSBarry Smith 49934099cc6bSBarry Smith 49944099cc6bSBarry Smith /*@C 49954099cc6bSBarry Smith MatSeqAIJRegister - - Adds a new sub-matrix type for sequential AIJ matrices 49964099cc6bSBarry Smith 49974099cc6bSBarry Smith Not Collective 49984099cc6bSBarry Smith 49994099cc6bSBarry Smith Input Parameters: 50004099cc6bSBarry Smith + name - name of a new user-defined matrix type, for example MATSEQAIJCRL 50014099cc6bSBarry Smith - function - routine to convert to subtype 50024099cc6bSBarry Smith 50034099cc6bSBarry Smith Notes: 50044099cc6bSBarry Smith MatSeqAIJRegister() may be called multiple times to add several user-defined solvers. 50054099cc6bSBarry Smith 50064099cc6bSBarry Smith 50074099cc6bSBarry Smith Then, your matrix can be chosen with the procedural interface at runtime via the option 50084099cc6bSBarry Smith $ -mat_seqaij_type my_mat 50094099cc6bSBarry Smith 50104099cc6bSBarry Smith Level: advanced 50114099cc6bSBarry Smith 50124099cc6bSBarry Smith .seealso: MatSeqAIJRegisterAll() 50134099cc6bSBarry Smith 50144099cc6bSBarry Smith 50154099cc6bSBarry Smith Level: advanced 50164099cc6bSBarry Smith @*/ 5017388d47a6SSatish Balay PetscErrorCode MatSeqAIJRegister(const char sname[],PetscErrorCode (*function)(Mat,MatType,MatReuse,Mat *)) 50184099cc6bSBarry Smith { 50194099cc6bSBarry Smith PetscErrorCode ierr; 50204099cc6bSBarry Smith 50214099cc6bSBarry Smith PetscFunctionBegin; 50229cc31a68SJed Brown ierr = MatInitializePackage();CHKERRQ(ierr); 50234099cc6bSBarry Smith ierr = PetscFunctionListAdd(&MatSeqAIJList,sname,function);CHKERRQ(ierr); 50244099cc6bSBarry Smith PetscFunctionReturn(0); 50254099cc6bSBarry Smith } 50264099cc6bSBarry Smith 50274099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE; 50284099cc6bSBarry Smith 50294099cc6bSBarry Smith /*@C 50304099cc6bSBarry Smith MatSeqAIJRegisterAll - Registers all of the matrix subtypes of SeqAIJ 50314099cc6bSBarry Smith 
50324099cc6bSBarry Smith Not Collective 50334099cc6bSBarry Smith 50344099cc6bSBarry Smith Level: advanced 50354099cc6bSBarry Smith 50364099cc6bSBarry Smith Developers Note: CUSP and CUSPARSE do not yet support the MatConvert_SeqAIJ..() paradigm and thus cannot be registered here 50374099cc6bSBarry Smith 50384099cc6bSBarry Smith .seealso: MatRegisterAll(), MatSeqAIJRegister() 50394099cc6bSBarry Smith @*/ 50404099cc6bSBarry Smith PetscErrorCode MatSeqAIJRegisterAll(void) 50414099cc6bSBarry Smith { 50424099cc6bSBarry Smith PetscErrorCode ierr; 50434099cc6bSBarry Smith 50444099cc6bSBarry Smith PetscFunctionBegin; 50454099cc6bSBarry Smith if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0); 50464099cc6bSBarry Smith MatSeqAIJRegisterAllCalled = PETSC_TRUE; 50474099cc6bSBarry Smith 50484099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr); 50494099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr); 50504dfdc2d9SRichard Tran Mills ierr = MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr); 50519779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE) 50526b62b571SRichard Tran Mills ierr = MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr); 5053485f9817SRichard Tran Mills #endif 50544099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA) 50554099cc6bSBarry Smith ierr = MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL);CHKERRQ(ierr); 50564099cc6bSBarry Smith #endif 50574099cc6bSBarry Smith PetscFunctionReturn(0); 50584099cc6bSBarry Smith } 505953dd7562SDmitry Karpeev 506053dd7562SDmitry Karpeev /* 506181824310SBarry Smith Special version for direct calls from Fortran 506281824310SBarry Smith */ 5063af0996ceSBarry Smith #include <petsc/private/fortranimpl.h> 506481824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS) 506581824310SBarry Smith #define matsetvaluesseqaij_ 
MATSETVALUESSEQAIJ 506681824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE) 506781824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij 506881824310SBarry Smith #endif 506981824310SBarry Smith 507081824310SBarry Smith /* Change these macros so can be used in void function */ 507181824310SBarry Smith #undef CHKERRQ 5072ce94432eSBarry Smith #define CHKERRQ(ierr) CHKERRABORT(PetscObjectComm((PetscObject)A),ierr) 507381824310SBarry Smith #undef SETERRQ2 5074e32f2f54SBarry Smith #define SETERRQ2(comm,ierr,b,c,d) CHKERRABORT(comm,ierr) 50754994cf47SJed Brown #undef SETERRQ3 50764994cf47SJed Brown #define SETERRQ3(comm,ierr,b,c,d,e) CHKERRABORT(comm,ierr) 507781824310SBarry Smith 507819caf8f3SSatish Balay PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr) 507981824310SBarry Smith { 508081824310SBarry Smith Mat A = *AA; 508181824310SBarry Smith PetscInt m = *mm, n = *nn; 508281824310SBarry Smith InsertMode is = *isis; 508381824310SBarry Smith Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data; 508481824310SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N; 508581824310SBarry Smith PetscInt *imax,*ai,*ailen; 508681824310SBarry Smith PetscErrorCode ierr; 508781824310SBarry Smith PetscInt *aj,nonew = a->nonew,lastcol = -1; 508854f21887SBarry Smith MatScalar *ap,value,*aa; 5089ace3abfcSBarry Smith PetscBool ignorezeroentries = a->ignorezeroentries; 5090ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 509181824310SBarry Smith 509281824310SBarry Smith PetscFunctionBegin; 50934994cf47SJed Brown MatCheckPreallocated(A,1); 509481824310SBarry Smith imax = a->imax; 509581824310SBarry Smith ai = a->i; 509681824310SBarry Smith ailen = a->ilen; 509781824310SBarry Smith aj = a->j; 509881824310SBarry Smith aa = a->a; 509981824310SBarry Smith 510081824310SBarry Smith for (k=0; k<m; k++) { /* loop over added rows */ 
510181824310SBarry Smith row = im[k]; 510281824310SBarry Smith if (row < 0) continue; 5103cf9c20a2SJed Brown if (PetscUnlikelyDebug(row >= A->rmap->n)) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large"); 510481824310SBarry Smith rp = aj + ai[row]; ap = aa + ai[row]; 510581824310SBarry Smith rmax = imax[row]; nrow = ailen[row]; 510681824310SBarry Smith low = 0; 510781824310SBarry Smith high = nrow; 510881824310SBarry Smith for (l=0; l<n; l++) { /* loop over added columns */ 510981824310SBarry Smith if (in[l] < 0) continue; 5110cf9c20a2SJed Brown if (PetscUnlikelyDebug(in[l] >= A->cmap->n)) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Column too large"); 511181824310SBarry Smith col = in[l]; 51122205254eSKarl Rupp if (roworiented) value = v[l + k*n]; 51132205254eSKarl Rupp else value = v[k + l*m]; 51142205254eSKarl Rupp 511581824310SBarry Smith if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue; 511681824310SBarry Smith 51172205254eSKarl Rupp if (col <= lastcol) low = 0; 51182205254eSKarl Rupp else high = nrow; 511981824310SBarry Smith lastcol = col; 512081824310SBarry Smith while (high-low > 5) { 512181824310SBarry Smith t = (low+high)/2; 512281824310SBarry Smith if (rp[t] > col) high = t; 512381824310SBarry Smith else low = t; 512481824310SBarry Smith } 512581824310SBarry Smith for (i=low; i<high; i++) { 512681824310SBarry Smith if (rp[i] > col) break; 512781824310SBarry Smith if (rp[i] == col) { 512881824310SBarry Smith if (is == ADD_VALUES) ap[i] += value; 512981824310SBarry Smith else ap[i] = value; 513081824310SBarry Smith goto noinsert; 513181824310SBarry Smith } 513281824310SBarry Smith } 513381824310SBarry Smith if (value == 0.0 && ignorezeroentries) goto noinsert; 513481824310SBarry Smith if (nonew == 1) goto noinsert; 5135ce94432eSBarry Smith if (nonew == -1) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix"); 
5136fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 513781824310SBarry Smith N = nrow++ - 1; a->nz++; high++; 513881824310SBarry Smith /* shift up all the later entries in this row */ 513981824310SBarry Smith for (ii=N; ii>=i; ii--) { 514081824310SBarry Smith rp[ii+1] = rp[ii]; 514181824310SBarry Smith ap[ii+1] = ap[ii]; 514281824310SBarry Smith } 514381824310SBarry Smith rp[i] = col; 514481824310SBarry Smith ap[i] = value; 5145e56f5c9eSBarry Smith A->nonzerostate++; 514681824310SBarry Smith noinsert:; 514781824310SBarry Smith low = i + 1; 514881824310SBarry Smith } 514981824310SBarry Smith ailen[row] = nrow; 515081824310SBarry Smith } 515181824310SBarry Smith PetscFunctionReturnVoid(); 515281824310SBarry Smith } 5153