149b5e25fSSatish Balay 249b5e25fSSatish Balay /* 3a1373b80SHong Zhang Defines the basic matrix operations for the SBAIJ (compressed row) 449b5e25fSSatish Balay matrix storage format. 549b5e25fSSatish Balay */ 6c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 8c6db04a5SJed Brown #include <petscblaslapack.h> 949b5e25fSSatish Balay 10c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1170dcbbb9SBarry Smith #define USESHORT 12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1370dcbbb9SBarry Smith 146214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 15cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat,MatType,MatReuse,Mat*); 166214f412SHong Zhang #endif 17d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 18d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat,MatType,MatReuse,Mat*); 19d24d4204SJose E. Roman #endif 2028d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat,MatType,MatReuse,Mat*); 21b5b17502SBarry Smith 2249b5e25fSSatish Balay /* 2349b5e25fSSatish Balay Checks for missing diagonals 2449b5e25fSSatish Balay */ 25ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A,PetscBool *missing,PetscInt *dd) 2649b5e25fSSatish Balay { 27045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 286849ba73SBarry Smith PetscErrorCode ierr; 297734d3b5SMatthew G. Knepley PetscInt *diag,*ii = a->i,i; 3049b5e25fSSatish Balay 3149b5e25fSSatish Balay PetscFunctionBegin; 32045c9aa0SHong Zhang ierr = MatMarkDiagonal_SeqSBAIJ(A);CHKERRQ(ierr); 332af78befSBarry Smith *missing = PETSC_FALSE; 347734d3b5SMatthew G. 
Knepley if (A->rmap->n > 0 && !ii) { 35358d2f5dSShri Abhyankar *missing = PETSC_TRUE; 36358d2f5dSShri Abhyankar if (dd) *dd = 0; 37955c1f14SBarry Smith ierr = PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n");CHKERRQ(ierr); 38358d2f5dSShri Abhyankar } else { 39358d2f5dSShri Abhyankar diag = a->diag; 4049b5e25fSSatish Balay for (i=0; i<a->mbs; i++) { 417734d3b5SMatthew G. Knepley if (diag[i] >= ii[i+1]) { 422af78befSBarry Smith *missing = PETSC_TRUE; 432af78befSBarry Smith if (dd) *dd = i; 442af78befSBarry Smith break; 452af78befSBarry Smith } 4649b5e25fSSatish Balay } 47358d2f5dSShri Abhyankar } 4849b5e25fSSatish Balay PetscFunctionReturn(0); 4949b5e25fSSatish Balay } 5049b5e25fSSatish Balay 51dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A) 5249b5e25fSSatish Balay { 53045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 546849ba73SBarry Smith PetscErrorCode ierr; 5548dd3d27SHong Zhang PetscInt i,j; 5649b5e25fSSatish Balay 5749b5e25fSSatish Balay PetscFunctionBegin; 5809f38230SBarry Smith if (!a->diag) { 59785e854fSJed Brown ierr = PetscMalloc1(a->mbs,&a->diag);CHKERRQ(ierr); 603bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,a->mbs*sizeof(PetscInt));CHKERRQ(ierr); 61c760cd28SBarry Smith a->free_diag = PETSC_TRUE; 6209f38230SBarry Smith } 6348dd3d27SHong Zhang for (i=0; i<a->mbs; i++) { 6448dd3d27SHong Zhang a->diag[i] = a->i[i+1]; 6548dd3d27SHong Zhang for (j=a->i[i]; j<a->i[i+1]; j++) { 6648dd3d27SHong Zhang if (a->j[j] == i) { 6748dd3d27SHong Zhang a->diag[i] = j; 6848dd3d27SHong Zhang break; 6948dd3d27SHong Zhang } 7048dd3d27SHong Zhang } 7148dd3d27SHong Zhang } 7249b5e25fSSatish Balay PetscFunctionReturn(0); 7349b5e25fSSatish Balay } 7449b5e25fSSatish Balay 751a83f524SJed Brown static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool blockcompressed,PetscInt *nn,const PetscInt *inia[],const PetscInt *inja[],PetscBool *done) 7649b5e25fSSatish Balay { 
77a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 788f7157efSSatish Balay PetscErrorCode ierr; 792462f5fdSStefano Zampini PetscInt i,j,n = a->mbs,nz = a->i[n],*tia,*tja,bs = A->rmap->bs,k,l,cnt; 802462f5fdSStefano Zampini PetscInt **ia = (PetscInt**)inia,**ja = (PetscInt**)inja; 8149b5e25fSSatish Balay 8249b5e25fSSatish Balay PetscFunctionBegin; 83d3e5a4abSHong Zhang *nn = n; 84a1373b80SHong Zhang if (!ia) PetscFunctionReturn(0); 852462f5fdSStefano Zampini if (symmetric) { 862462f5fdSStefano Zampini ierr = MatToSymmetricIJ_SeqAIJ(n,a->i,a->j,PETSC_FALSE,0,0,&tia,&tja);CHKERRQ(ierr); 872462f5fdSStefano Zampini nz = tia[n]; 882462f5fdSStefano Zampini } else { 892462f5fdSStefano Zampini tia = a->i; tja = a->j; 902462f5fdSStefano Zampini } 912462f5fdSStefano Zampini 922462f5fdSStefano Zampini if (!blockcompressed && bs > 1) { 932462f5fdSStefano Zampini (*nn) *= bs; 948f7157efSSatish Balay /* malloc & create the natural set of indices */ 952462f5fdSStefano Zampini ierr = PetscMalloc1((n+1)*bs,ia);CHKERRQ(ierr); 962462f5fdSStefano Zampini if (n) { 972462f5fdSStefano Zampini (*ia)[0] = oshift; 982462f5fdSStefano Zampini for (j=1; j<bs; j++) { 992462f5fdSStefano Zampini (*ia)[j] = (tia[1]-tia[0])*bs+(*ia)[j-1]; 1002462f5fdSStefano Zampini } 1012462f5fdSStefano Zampini } 1022462f5fdSStefano Zampini 1032462f5fdSStefano Zampini for (i=1; i<n; i++) { 1042462f5fdSStefano Zampini (*ia)[i*bs] = (tia[i]-tia[i-1])*bs + (*ia)[i*bs-1]; 1052462f5fdSStefano Zampini for (j=1; j<bs; j++) { 1062462f5fdSStefano Zampini (*ia)[i*bs+j] = (tia[i+1]-tia[i])*bs + (*ia)[i*bs+j-1]; 1072462f5fdSStefano Zampini } 1082462f5fdSStefano Zampini } 1092462f5fdSStefano Zampini if (n) { 1102462f5fdSStefano Zampini (*ia)[n*bs] = (tia[n]-tia[n-1])*bs + (*ia)[n*bs-1]; 1112462f5fdSStefano Zampini } 1122462f5fdSStefano Zampini 1132462f5fdSStefano Zampini if (inja) { 1142462f5fdSStefano Zampini ierr = PetscMalloc1(nz*bs*bs,ja);CHKERRQ(ierr); 1152462f5fdSStefano Zampini cnt = 0; 1162462f5fdSStefano 
Zampini for (i=0; i<n; i++) { 1178f7157efSSatish Balay for (j=0; j<bs; j++) { 1182462f5fdSStefano Zampini for (k=tia[i]; k<tia[i+1]; k++) { 1192462f5fdSStefano Zampini for (l=0; l<bs; l++) { 1202462f5fdSStefano Zampini (*ja)[cnt++] = bs*tja[k] + l; 1218f7157efSSatish Balay } 1228f7157efSSatish Balay } 1238f7157efSSatish Balay } 1248f7157efSSatish Balay } 1258f7157efSSatish Balay } 1262462f5fdSStefano Zampini 1272462f5fdSStefano Zampini if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */ 1282462f5fdSStefano Zampini ierr = PetscFree(tia);CHKERRQ(ierr); 1292462f5fdSStefano Zampini ierr = PetscFree(tja);CHKERRQ(ierr); 1302462f5fdSStefano Zampini } 1312462f5fdSStefano Zampini } else if (oshift == 1) { 1322462f5fdSStefano Zampini if (symmetric) { 1332462f5fdSStefano Zampini nz = tia[A->rmap->n/bs]; 1342462f5fdSStefano Zampini /* add 1 to i and j indices */ 1352462f5fdSStefano Zampini for (i=0; i<A->rmap->n/bs+1; i++) tia[i] = tia[i] + 1; 1362462f5fdSStefano Zampini *ia = tia; 1372462f5fdSStefano Zampini if (ja) { 1382462f5fdSStefano Zampini for (i=0; i<nz; i++) tja[i] = tja[i] + 1; 1392462f5fdSStefano Zampini *ja = tja; 1402462f5fdSStefano Zampini } 1412462f5fdSStefano Zampini } else { 1422462f5fdSStefano Zampini nz = a->i[A->rmap->n/bs]; 1432462f5fdSStefano Zampini /* malloc space and add 1 to i and j indices */ 1442462f5fdSStefano Zampini ierr = PetscMalloc1(A->rmap->n/bs+1,ia);CHKERRQ(ierr); 1452462f5fdSStefano Zampini for (i=0; i<A->rmap->n/bs+1; i++) (*ia)[i] = a->i[i] + 1; 1462462f5fdSStefano Zampini if (ja) { 1472462f5fdSStefano Zampini ierr = PetscMalloc1(nz,ja);CHKERRQ(ierr); 1482462f5fdSStefano Zampini for (i=0; i<nz; i++) (*ja)[i] = a->j[i] + 1; 1492462f5fdSStefano Zampini } 1502462f5fdSStefano Zampini } 1512462f5fdSStefano Zampini } else { 1522462f5fdSStefano Zampini *ia = tia; 1532462f5fdSStefano Zampini if (ja) *ja = tja; 154a6ece127SHong Zhang } 15549b5e25fSSatish Balay PetscFunctionReturn(0); 15649b5e25fSSatish Balay } 
15749b5e25fSSatish Balay 1581a83f524SJed Brown static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool blockcompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool *done) 15949b5e25fSSatish Balay { 1608f7157efSSatish Balay PetscErrorCode ierr; 161a6ece127SHong Zhang 16249b5e25fSSatish Balay PetscFunctionBegin; 16349b5e25fSSatish Balay if (!ia) PetscFunctionReturn(0); 1642462f5fdSStefano Zampini if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) { 1652462f5fdSStefano Zampini ierr = PetscFree(*ia);CHKERRQ(ierr); 1662462f5fdSStefano Zampini if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);} 167a6ece127SHong Zhang } 168a6ece127SHong Zhang PetscFunctionReturn(0); 16949b5e25fSSatish Balay } 17049b5e25fSSatish Balay 171dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqSBAIJ(Mat A) 17249b5e25fSSatish Balay { 17349b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 174dfbe8321SBarry Smith PetscErrorCode ierr; 17549b5e25fSSatish Balay 17649b5e25fSSatish Balay PetscFunctionBegin; 177a9f03627SSatish Balay #if defined(PETSC_USE_LOG) 178d0f46423SBarry Smith PetscLogObjectState((PetscObject)A,"Rows=%D, NZ=%D",A->rmap->N,a->nz); 179a9f03627SSatish Balay #endif 180e6b907acSBarry Smith ierr = MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i);CHKERRQ(ierr); 1817f53bb6cSHong Zhang if (a->free_diag) {ierr = PetscFree(a->diag);CHKERRQ(ierr);} 1826bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 1836bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 1846bf464f9SBarry Smith ierr = ISDestroy(&a->icol);CHKERRQ(ierr); 185c31cb41cSBarry Smith ierr = PetscFree(a->idiag);CHKERRQ(ierr); 186c31cb41cSBarry Smith ierr = PetscFree(a->inode.size);CHKERRQ(ierr); 187c760cd28SBarry Smith if (a->free_imax_ilen) {ierr = PetscFree2(a->imax,a->ilen);CHKERRQ(ierr);} 18805b42c5fSBarry Smith ierr = PetscFree(a->solve_work);CHKERRQ(ierr); 18941f059aeSBarry Smith ierr = PetscFree(a->sor_work);CHKERRQ(ierr); 
19005b42c5fSBarry Smith ierr = PetscFree(a->solves_work);CHKERRQ(ierr); 19105b42c5fSBarry Smith ierr = PetscFree(a->mult_work);CHKERRQ(ierr); 19205b42c5fSBarry Smith ierr = PetscFree(a->saved_values);CHKERRQ(ierr); 1934da8f245SBarry Smith if (a->free_jshort) {ierr = PetscFree(a->jshort);CHKERRQ(ierr);} 1941a3463dfSHong Zhang ierr = PetscFree(a->inew);CHKERRQ(ierr); 1956bf464f9SBarry Smith ierr = MatDestroy(&a->parent);CHKERRQ(ierr); 196bf0cc555SLisandro Dalcin ierr = PetscFree(A->data);CHKERRQ(ierr); 197901853e0SKris Buschelman 198*f4259b30SLisandro Dalcin ierr = PetscObjectChangeTypeName((PetscObject)A,NULL);CHKERRQ(ierr); 199bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL);CHKERRQ(ierr); 200bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL);CHKERRQ(ierr); 201bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqSBAIJSetColumnIndices_C",NULL);CHKERRQ(ierr); 202bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqsbaij_seqaij_C",NULL);CHKERRQ(ierr); 203bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqsbaij_seqbaij_C",NULL);CHKERRQ(ierr); 204bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqSBAIJSetPreallocation_C",NULL);CHKERRQ(ierr); 20538f409ebSLisandro Dalcin ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqSBAIJSetPreallocationCSR_C",NULL);CHKERRQ(ierr); 2066214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2076214f412SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqsbaij_elemental_C",NULL);CHKERRQ(ierr); 2086214f412SHong Zhang #endif 209d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 210d24d4204SJose E. Roman ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqsbaij_scalapack_C",NULL);CHKERRQ(ierr); 211d24d4204SJose E. 
Roman #endif 21249b5e25fSSatish Balay PetscFunctionReturn(0); 21349b5e25fSSatish Balay } 21449b5e25fSSatish Balay 215ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqSBAIJ(Mat A,MatOption op,PetscBool flg) 21649b5e25fSSatish Balay { 217045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 218eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 219eb1ec7c1SStefano Zampini PetscInt bs; 220eb1ec7c1SStefano Zampini #endif 22163ba0a88SBarry Smith PetscErrorCode ierr; 22249b5e25fSSatish Balay 22349b5e25fSSatish Balay PetscFunctionBegin; 224eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 225eb1ec7c1SStefano Zampini ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 226eb1ec7c1SStefano Zampini #endif 2274d9d31abSKris Buschelman switch (op) { 2284d9d31abSKris Buschelman case MAT_ROW_ORIENTED: 2294e0d8c25SBarry Smith a->roworiented = flg; 2304d9d31abSKris Buschelman break; 231a9817697SBarry Smith case MAT_KEEP_NONZERO_PATTERN: 232a9817697SBarry Smith a->keepnonzeropattern = flg; 2334d9d31abSKris Buschelman break; 234512a5fc5SBarry Smith case MAT_NEW_NONZERO_LOCATIONS: 235512a5fc5SBarry Smith a->nonew = (flg ? 0 : 1); 2364d9d31abSKris Buschelman break; 2374d9d31abSKris Buschelman case MAT_NEW_NONZERO_LOCATION_ERR: 2384e0d8c25SBarry Smith a->nonew = (flg ? -1 : 0); 2394d9d31abSKris Buschelman break; 2404d9d31abSKris Buschelman case MAT_NEW_NONZERO_ALLOCATION_ERR: 2414e0d8c25SBarry Smith a->nonew = (flg ? -2 : 0); 2424d9d31abSKris Buschelman break; 24328b2fa4aSMatthew Knepley case MAT_UNUSED_NONZERO_LOCATION_ERR: 24428b2fa4aSMatthew Knepley a->nounused = (flg ? 
-1 : 0); 24528b2fa4aSMatthew Knepley break; 2464e0d8c25SBarry Smith case MAT_NEW_DIAGONALS: 2474d9d31abSKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 2484d9d31abSKris Buschelman case MAT_USE_HASH_TABLE: 249071fcb05SBarry Smith case MAT_SORTED_FULL: 250290bbb0aSBarry Smith ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr); 2514d9d31abSKris Buschelman break; 2529a4540c5SBarry Smith case MAT_HERMITIAN: 253eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 254eb1ec7c1SStefano Zampini if (flg) { /* disable transpose ops */ 255eb1ec7c1SStefano Zampini if (bs > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for Hermitian with block size greater than 1"); 256eb1ec7c1SStefano Zampini A->ops->multtranspose = NULL; 257eb1ec7c1SStefano Zampini A->ops->multtransposeadd = NULL; 258eb1ec7c1SStefano Zampini A->symmetric = PETSC_FALSE; 259eb1ec7c1SStefano Zampini } 2600f2140c7SStefano Zampini #endif 261eeffb40dSHong Zhang break; 26277e54ba9SKris Buschelman case MAT_SYMMETRIC: 263eb1ec7c1SStefano Zampini case MAT_SPD: 264eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 265eb1ec7c1SStefano Zampini if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */ 266eb1ec7c1SStefano Zampini A->ops->multtranspose = A->ops->mult; 267eb1ec7c1SStefano Zampini A->ops->multtransposeadd = A->ops->multadd; 268eb1ec7c1SStefano Zampini } 269eb1ec7c1SStefano Zampini #endif 270eb1ec7c1SStefano Zampini break; 271eb1ec7c1SStefano Zampini /* These options are handled directly by MatSetOption() */ 27277e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 2739a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 274672ba085SHong Zhang case MAT_STRUCTURE_ONLY: 2754dcd73b1SHong Zhang /* These options are handled directly by MatSetOption() */ 276290bbb0aSBarry Smith break; 277941593c8SHong Zhang case MAT_IGNORE_LOWER_TRIANGULAR: 2784e0d8c25SBarry Smith a->ignore_ltriangular = flg; 279941593c8SHong Zhang break; 280941593c8SHong 
Zhang case MAT_ERROR_LOWER_TRIANGULAR: 2814e0d8c25SBarry Smith a->ignore_ltriangular = flg; 28277e54ba9SKris Buschelman break; 283f5edf698SHong Zhang case MAT_GETROW_UPPERTRIANGULAR: 2844e0d8c25SBarry Smith a->getrow_utriangular = flg; 285f5edf698SHong Zhang break; 286c10200c1SHong Zhang case MAT_SUBMAT_SINGLEIS: 287c10200c1SHong Zhang break; 2884d9d31abSKris Buschelman default: 289e32f2f54SBarry Smith SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op); 29049b5e25fSSatish Balay } 29149b5e25fSSatish Balay PetscFunctionReturn(0); 29249b5e25fSSatish Balay } 29349b5e25fSSatish Balay 29452768537SHong Zhang PetscErrorCode MatGetRow_SeqSBAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 29549b5e25fSSatish Balay { 29649b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 2976849ba73SBarry Smith PetscErrorCode ierr; 29849b5e25fSSatish Balay 29949b5e25fSSatish Balay PetscFunctionBegin; 300e32f2f54SBarry Smith if (A && !a->getrow_utriangular) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MatGetRow is not supported for SBAIJ matrix format. 
Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()"); 30152768537SHong Zhang 302f5edf698SHong Zhang /* Get the upper triangular part of the row */ 30352768537SHong Zhang ierr = MatGetRow_SeqBAIJ_private(A,row,nz,idx,v,a->i,a->j,a->a);CHKERRQ(ierr); 30449b5e25fSSatish Balay PetscFunctionReturn(0); 30549b5e25fSSatish Balay } 30649b5e25fSSatish Balay 30713f74950SBarry Smith PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v) 30849b5e25fSSatish Balay { 309dfbe8321SBarry Smith PetscErrorCode ierr; 31049b5e25fSSatish Balay 31149b5e25fSSatish Balay PetscFunctionBegin; 31205b42c5fSBarry Smith if (idx) {ierr = PetscFree(*idx);CHKERRQ(ierr);} 31305b42c5fSBarry Smith if (v) {ierr = PetscFree(*v);CHKERRQ(ierr);} 31449b5e25fSSatish Balay PetscFunctionReturn(0); 31549b5e25fSSatish Balay } 31649b5e25fSSatish Balay 317f5edf698SHong Zhang PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A) 318f5edf698SHong Zhang { 319f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 320f5edf698SHong Zhang 321f5edf698SHong Zhang PetscFunctionBegin; 322f5edf698SHong Zhang a->getrow_utriangular = PETSC_TRUE; 323f5edf698SHong Zhang PetscFunctionReturn(0); 324f5edf698SHong Zhang } 325a323099bSStefano Zampini 326f5edf698SHong Zhang PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A) 327f5edf698SHong Zhang { 328f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 329f5edf698SHong Zhang 330f5edf698SHong Zhang PetscFunctionBegin; 331f5edf698SHong Zhang a->getrow_utriangular = PETSC_FALSE; 332f5edf698SHong Zhang PetscFunctionReturn(0); 333f5edf698SHong Zhang } 334f5edf698SHong Zhang 335fc4dec0aSBarry Smith PetscErrorCode MatTranspose_SeqSBAIJ(Mat A,MatReuse reuse,Mat *B) 33649b5e25fSSatish Balay { 337dfbe8321SBarry Smith PetscErrorCode ierr; 3385fd66863SKarl Rupp 33949b5e25fSSatish Balay PetscFunctionBegin; 
340cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 341999d9058SBarry Smith ierr = MatDuplicate(A,MAT_COPY_VALUES,B);CHKERRQ(ierr); 342cf37664fSBarry Smith } else if (reuse == MAT_REUSE_MATRIX) { 343cf37664fSBarry Smith ierr = MatCopy(A,*B,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 344fc4dec0aSBarry Smith } 3458115998fSBarry Smith PetscFunctionReturn(0); 34649b5e25fSSatish Balay } 34749b5e25fSSatish Balay 3487da1fb6eSBarry Smith PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A,PetscViewer viewer) 34949b5e25fSSatish Balay { 35049b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 351dfbe8321SBarry Smith PetscErrorCode ierr; 352d0f46423SBarry Smith PetscInt i,j,bs = A->rmap->bs,k,l,bs2=a->bs2; 353f3ef73ceSBarry Smith PetscViewerFormat format; 354121deb67SSatish Balay PetscInt *diag; 35549b5e25fSSatish Balay 35649b5e25fSSatish Balay PetscFunctionBegin; 357b0a32e0cSBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 358456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 35977431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," block size is %D\n",bs);CHKERRQ(ierr); 360fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_MATLAB) { 361d2507d54SMatthew Knepley Mat aij; 362ade3a672SBarry Smith const char *matname; 363ade3a672SBarry Smith 364d5f3da31SBarry Smith if (A->factortype && bs>1) { 36570d5e725SHong Zhang ierr = PetscPrintf(PETSC_COMM_SELF,"Warning: matrix is factored with bs>1. 
MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n");CHKERRQ(ierr); 36670d5e725SHong Zhang PetscFunctionReturn(0); 36770d5e725SHong Zhang } 368c9f458caSMatthew Knepley ierr = MatConvert(A,MATSEQAIJ,MAT_INITIAL_MATRIX,&aij);CHKERRQ(ierr); 369ade3a672SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&matname);CHKERRQ(ierr); 370ade3a672SBarry Smith ierr = PetscObjectSetName((PetscObject)aij,matname);CHKERRQ(ierr); 371c9f458caSMatthew Knepley ierr = MatView(aij,viewer);CHKERRQ(ierr); 3726bf464f9SBarry Smith ierr = MatDestroy(&aij);CHKERRQ(ierr); 373fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 374d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 37549b5e25fSSatish Balay for (i=0; i<a->mbs; i++) { 37649b5e25fSSatish Balay for (j=0; j<bs; j++) { 37777431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i*bs+j);CHKERRQ(ierr); 37849b5e25fSSatish Balay for (k=a->i[i]; k<a->i[i+1]; k++) { 37949b5e25fSSatish Balay for (l=0; l<bs; l++) { 38049b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 38149b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2*k + l*bs + j]) > 0.0 && PetscRealPart(a->a[bs2*k + l*bs + j]) != 0.0) { 38257622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i) ",bs*a->j[k]+l, 38357622a8eSBarry Smith (double)PetscRealPart(a->a[bs2*k + l*bs + j]),(double)PetscImaginaryPart(a->a[bs2*k + l*bs + j]));CHKERRQ(ierr); 38449b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2*k + l*bs + j]) < 0.0 && PetscRealPart(a->a[bs2*k + l*bs + j]) != 0.0) { 38557622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i) ",bs*a->j[k]+l, 38657622a8eSBarry Smith (double)PetscRealPart(a->a[bs2*k + l*bs + j]),-(double)PetscImaginaryPart(a->a[bs2*k + l*bs + j]));CHKERRQ(ierr); 38749b5e25fSSatish Balay } else if (PetscRealPart(a->a[bs2*k + l*bs + j]) != 0.0) { 38857622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) 
",bs*a->j[k]+l,(double)PetscRealPart(a->a[bs2*k + l*bs + j]));CHKERRQ(ierr); 38949b5e25fSSatish Balay } 39049b5e25fSSatish Balay #else 39149b5e25fSSatish Balay if (a->a[bs2*k + l*bs + j] != 0.0) { 39257622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",bs*a->j[k]+l,(double)a->a[bs2*k + l*bs + j]);CHKERRQ(ierr); 39349b5e25fSSatish Balay } 39449b5e25fSSatish Balay #endif 39549b5e25fSSatish Balay } 39649b5e25fSSatish Balay } 397b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 39849b5e25fSSatish Balay } 39949b5e25fSSatish Balay } 400d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 401c1490034SHong Zhang } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) { 402c1490034SHong Zhang PetscFunctionReturn(0); 40349b5e25fSSatish Balay } else { 404d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr); 4052c990fa1SHong Zhang if (A->factortype) { /* for factored matrix */ 4062c990fa1SHong Zhang if (bs>1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"matrix is factored with bs>1. 
Not implemented yet"); 4072c990fa1SHong Zhang 408121deb67SSatish Balay diag=a->diag; 409121deb67SSatish Balay for (i=0; i<a->mbs; i++) { /* for row block i */ 4102c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr); 4112c990fa1SHong Zhang /* diagonal entry */ 4122c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 4132c990fa1SHong Zhang if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) { 41457622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i) ",a->j[diag[i]],(double)PetscRealPart(1.0/a->a[diag[i]]),(double)PetscImaginaryPart(1.0/a->a[diag[i]]));CHKERRQ(ierr); 4152c990fa1SHong Zhang } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) { 41657622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i) ",a->j[diag[i]],(double)PetscRealPart(1.0/a->a[diag[i]]),-(double)PetscImaginaryPart(1.0/a->a[diag[i]]));CHKERRQ(ierr); 4172c990fa1SHong Zhang } else { 41857622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[diag[i]],(double)PetscRealPart(1.0/a->a[diag[i]]));CHKERRQ(ierr); 4192c990fa1SHong Zhang } 4202c990fa1SHong Zhang #else 4216712e2f1SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[diag[i]],(double)(1.0/a->a[diag[i]]));CHKERRQ(ierr); 4222c990fa1SHong Zhang #endif 4232c990fa1SHong Zhang /* off-diagonal entries */ 4242c990fa1SHong Zhang for (k=a->i[i]; k<a->i[i+1]-1; k++) { 4252c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 426ca0704adSBarry Smith if (PetscImaginaryPart(a->a[k]) > 0.0) { 42757622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i) ",bs*a->j[k],(double)PetscRealPart(a->a[k]),(double)PetscImaginaryPart(a->a[k]));CHKERRQ(ierr); 428ca0704adSBarry Smith } else if (PetscImaginaryPart(a->a[k]) < 0.0) { 42957622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i) ",bs*a->j[k],(double)PetscRealPart(a->a[k]),-(double)PetscImaginaryPart(a->a[k]));CHKERRQ(ierr); 4302c990fa1SHong Zhang } else { 43157622a8eSBarry Smith ierr = 
PetscViewerASCIIPrintf(viewer," (%D, %g) ",bs*a->j[k],(double)PetscRealPart(a->a[k]));CHKERRQ(ierr); 4322c990fa1SHong Zhang } 4332c990fa1SHong Zhang #else 43457622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[k],(double)a->a[k]);CHKERRQ(ierr); 4352c990fa1SHong Zhang #endif 4362c990fa1SHong Zhang } 4372c990fa1SHong Zhang ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 4382c990fa1SHong Zhang } 4392c990fa1SHong Zhang 4402c990fa1SHong Zhang } else { /* for non-factored matrix */ 4410c74a584SJed Brown for (i=0; i<a->mbs; i++) { /* for row block i */ 4420c74a584SJed Brown for (j=0; j<bs; j++) { /* for row bs*i + j */ 44377431f27SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i*bs+j);CHKERRQ(ierr); 4440c74a584SJed Brown for (k=a->i[i]; k<a->i[i+1]; k++) { /* for column block */ 4450c74a584SJed Brown for (l=0; l<bs; l++) { /* for column */ 44649b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 44749b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2*k + l*bs + j]) > 0.0) { 44857622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i) ",bs*a->j[k]+l, 44957622a8eSBarry Smith (double)PetscRealPart(a->a[bs2*k + l*bs + j]),(double)PetscImaginaryPart(a->a[bs2*k + l*bs + j]));CHKERRQ(ierr); 45049b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2*k + l*bs + j]) < 0.0) { 45157622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i) ",bs*a->j[k]+l, 45257622a8eSBarry Smith (double)PetscRealPart(a->a[bs2*k + l*bs + j]),-(double)PetscImaginaryPart(a->a[bs2*k + l*bs + j]));CHKERRQ(ierr); 45349b5e25fSSatish Balay } else { 45457622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",bs*a->j[k]+l,(double)PetscRealPart(a->a[bs2*k + l*bs + j]));CHKERRQ(ierr); 45549b5e25fSSatish Balay } 45649b5e25fSSatish Balay #else 45757622a8eSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",bs*a->j[k]+l,(double)a->a[bs2*k + l*bs + j]);CHKERRQ(ierr); 45849b5e25fSSatish Balay #endif 
45949b5e25fSSatish Balay } 46049b5e25fSSatish Balay } 461b0a32e0cSBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr); 46249b5e25fSSatish Balay } 46349b5e25fSSatish Balay } 4642c990fa1SHong Zhang } 465d00279f6SBarry Smith ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr); 46649b5e25fSSatish Balay } 467b0a32e0cSBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 46849b5e25fSSatish Balay PetscFunctionReturn(0); 46949b5e25fSSatish Balay } 47049b5e25fSSatish Balay 4719804daf3SBarry Smith #include <petscdraw.h> 4726849ba73SBarry Smith static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw,void *Aa) 47349b5e25fSSatish Balay { 47449b5e25fSSatish Balay Mat A = (Mat) Aa; 47549b5e25fSSatish Balay Mat_SeqSBAIJ *a=(Mat_SeqSBAIJ*)A->data; 4766849ba73SBarry Smith PetscErrorCode ierr; 477d0f46423SBarry Smith PetscInt row,i,j,k,l,mbs=a->mbs,color,bs=A->rmap->bs,bs2=a->bs2; 47849b5e25fSSatish Balay PetscReal xl,yl,xr,yr,x_l,x_r,y_l,y_r; 47949b5e25fSSatish Balay MatScalar *aa; 480b0a32e0cSBarry Smith PetscViewer viewer; 48149b5e25fSSatish Balay 48249b5e25fSSatish Balay PetscFunctionBegin; 48349b5e25fSSatish Balay ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr); 484b0a32e0cSBarry Smith ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr); 48549b5e25fSSatish Balay 48649b5e25fSSatish Balay /* loop over matrix elements drawing boxes */ 487383922c3SLisandro Dalcin 488383922c3SLisandro Dalcin ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr); 489383922c3SLisandro Dalcin ierr = PetscDrawString(draw, .3*(xl+xr), .3*(yl+yr), PETSC_DRAW_BLACK, "symmetric");CHKERRQ(ierr); 490383922c3SLisandro Dalcin /* Blue for negative, Cyan for zero and Red for positive */ 491b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 49249b5e25fSSatish Balay for (i=0,row=0; i<mbs; i++,row+=bs) { 49349b5e25fSSatish Balay for (j=a->i[i]; j<a->i[i+1]; j++) { 494d0f46423SBarry Smith y_l = A->rmap->N - row - 1.0; y_r = y_l 
+ 1.0; 49549b5e25fSSatish Balay x_l = a->j[j]*bs; x_r = x_l + 1.0; 49649b5e25fSSatish Balay aa = a->a + j*bs2; 49749b5e25fSSatish Balay for (k=0; k<bs; k++) { 49849b5e25fSSatish Balay for (l=0; l<bs; l++) { 49949b5e25fSSatish Balay if (PetscRealPart(*aa++) >= 0.) continue; 500b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l+k,y_l-l,x_r+k,y_r-l,color,color,color,color);CHKERRQ(ierr); 50149b5e25fSSatish Balay } 50249b5e25fSSatish Balay } 50349b5e25fSSatish Balay } 50449b5e25fSSatish Balay } 505b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 50649b5e25fSSatish Balay for (i=0,row=0; i<mbs; i++,row+=bs) { 50749b5e25fSSatish Balay for (j=a->i[i]; j<a->i[i+1]; j++) { 508d0f46423SBarry Smith y_l = A->rmap->N - row - 1.0; y_r = y_l + 1.0; 50949b5e25fSSatish Balay x_l = a->j[j]*bs; x_r = x_l + 1.0; 51049b5e25fSSatish Balay aa = a->a + j*bs2; 51149b5e25fSSatish Balay for (k=0; k<bs; k++) { 51249b5e25fSSatish Balay for (l=0; l<bs; l++) { 51349b5e25fSSatish Balay if (PetscRealPart(*aa++) != 0.) continue; 514b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l+k,y_l-l,x_r+k,y_r-l,color,color,color,color);CHKERRQ(ierr); 51549b5e25fSSatish Balay } 51649b5e25fSSatish Balay } 51749b5e25fSSatish Balay } 51849b5e25fSSatish Balay } 519b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 52049b5e25fSSatish Balay for (i=0,row=0; i<mbs; i++,row+=bs) { 52149b5e25fSSatish Balay for (j=a->i[i]; j<a->i[i+1]; j++) { 522d0f46423SBarry Smith y_l = A->rmap->N - row - 1.0; y_r = y_l + 1.0; 52349b5e25fSSatish Balay x_l = a->j[j]*bs; x_r = x_l + 1.0; 52449b5e25fSSatish Balay aa = a->a + j*bs2; 52549b5e25fSSatish Balay for (k=0; k<bs; k++) { 52649b5e25fSSatish Balay for (l=0; l<bs; l++) { 52749b5e25fSSatish Balay if (PetscRealPart(*aa++) <= 0.) 
continue; 528b0a32e0cSBarry Smith ierr = PetscDrawRectangle(draw,x_l+k,y_l-l,x_r+k,y_r-l,color,color,color,color);CHKERRQ(ierr); 52949b5e25fSSatish Balay } 53049b5e25fSSatish Balay } 53149b5e25fSSatish Balay } 53249b5e25fSSatish Balay } 533383922c3SLisandro Dalcin ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr); 53449b5e25fSSatish Balay PetscFunctionReturn(0); 53549b5e25fSSatish Balay } 53649b5e25fSSatish Balay 5376849ba73SBarry Smith static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A,PetscViewer viewer) 53849b5e25fSSatish Balay { 539dfbe8321SBarry Smith PetscErrorCode ierr; 54049b5e25fSSatish Balay PetscReal xl,yl,xr,yr,w,h; 541b0a32e0cSBarry Smith PetscDraw draw; 542ace3abfcSBarry Smith PetscBool isnull; 54349b5e25fSSatish Balay 54449b5e25fSSatish Balay PetscFunctionBegin; 545b0a32e0cSBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 546383922c3SLisandro Dalcin ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); 547383922c3SLisandro Dalcin if (isnull) PetscFunctionReturn(0); 54849b5e25fSSatish Balay 549d0f46423SBarry Smith xr = A->rmap->N; yr = A->rmap->N; h = yr/10.0; w = xr/10.0; 55049b5e25fSSatish Balay xr += w; yr += h; xl = -w; yl = -h; 551b0a32e0cSBarry Smith ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr); 552832b7cebSLisandro Dalcin ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr); 553b0a32e0cSBarry Smith ierr = PetscDrawZoom(draw,MatView_SeqSBAIJ_Draw_Zoom,A);CHKERRQ(ierr); 5540298fd71SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr); 555832b7cebSLisandro Dalcin ierr = PetscDrawSave(draw);CHKERRQ(ierr); 55649b5e25fSSatish Balay PetscFunctionReturn(0); 55749b5e25fSSatish Balay } 55849b5e25fSSatish Balay 559618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */ 560618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary 561618cc2edSLisandro Dalcin 562dfbe8321SBarry Smith PetscErrorCode 
MatView_SeqSBAIJ(Mat A,PetscViewer viewer) 56349b5e25fSSatish Balay { 564dfbe8321SBarry Smith PetscErrorCode ierr; 565618cc2edSLisandro Dalcin PetscBool iascii,isbinary,isdraw; 56649b5e25fSSatish Balay 56749b5e25fSSatish Balay PetscFunctionBegin; 568251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 569618cc2edSLisandro Dalcin ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 570251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 57132077d6dSBarry Smith if (iascii) { 57249b5e25fSSatish Balay ierr = MatView_SeqSBAIJ_ASCII(A,viewer);CHKERRQ(ierr); 573618cc2edSLisandro Dalcin } else if (isbinary) { 574618cc2edSLisandro Dalcin ierr = MatView_SeqSBAIJ_Binary(A,viewer);CHKERRQ(ierr); 57549b5e25fSSatish Balay } else if (isdraw) { 57649b5e25fSSatish Balay ierr = MatView_SeqSBAIJ_Draw(A,viewer);CHKERRQ(ierr); 57749b5e25fSSatish Balay } else { 578a5e6ed63SBarry Smith Mat B; 579ade3a672SBarry Smith const char *matname; 580ceb03754SKris Buschelman ierr = MatConvert(A,MATSEQAIJ,MAT_INITIAL_MATRIX,&B);CHKERRQ(ierr); 581ade3a672SBarry Smith ierr = PetscObjectGetName((PetscObject)A,&matname);CHKERRQ(ierr); 582ade3a672SBarry Smith ierr = PetscObjectSetName((PetscObject)B,matname);CHKERRQ(ierr); 583a5e6ed63SBarry Smith ierr = MatView(B,viewer);CHKERRQ(ierr); 5846bf464f9SBarry Smith ierr = MatDestroy(&B);CHKERRQ(ierr); 58549b5e25fSSatish Balay } 58649b5e25fSSatish Balay PetscFunctionReturn(0); 58749b5e25fSSatish Balay } 58849b5e25fSSatish Balay 58949b5e25fSSatish Balay 59013f74950SBarry Smith PetscErrorCode MatGetValues_SeqSBAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[]) 59149b5e25fSSatish Balay { 592045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 59313f74950SBarry Smith PetscInt *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j; 59413f74950SBarry Smith PetscInt *ai 
= a->i,*ailen = a->ilen; 595d0f46423SBarry Smith PetscInt brow,bcol,ridx,cidx,bs=A->rmap->bs,bs2=a->bs2; 59697e567efSBarry Smith MatScalar *ap,*aa = a->a; 59749b5e25fSSatish Balay 59849b5e25fSSatish Balay PetscFunctionBegin; 59949b5e25fSSatish Balay for (k=0; k<m; k++) { /* loop over rows */ 60049b5e25fSSatish Balay row = im[k]; brow = row/bs; 601e32f2f54SBarry Smith if (row < 0) {v += n; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); */ 602e32f2f54SBarry Smith if (row >= A->rmap->N) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->N-1); 60349b5e25fSSatish Balay rp = aj + ai[brow]; ap = aa + bs2*ai[brow]; 60449b5e25fSSatish Balay nrow = ailen[brow]; 60549b5e25fSSatish Balay for (l=0; l<n; l++) { /* loop over columns */ 606e32f2f54SBarry Smith if (in[l] < 0) {v++; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); */ 607e32f2f54SBarry Smith if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1); 60849b5e25fSSatish Balay col = in[l]; 60949b5e25fSSatish Balay bcol = col/bs; 61049b5e25fSSatish Balay cidx = col%bs; 61149b5e25fSSatish Balay ridx = row%bs; 61249b5e25fSSatish Balay high = nrow; 61349b5e25fSSatish Balay low = 0; /* assume unsorted */ 61449b5e25fSSatish Balay while (high-low > 5) { 61549b5e25fSSatish Balay t = (low+high)/2; 61649b5e25fSSatish Balay if (rp[t] > bcol) high = t; 61749b5e25fSSatish Balay else low = t; 61849b5e25fSSatish Balay } 61949b5e25fSSatish Balay for (i=low; i<high; i++) { 62049b5e25fSSatish Balay if (rp[i] > bcol) break; 62149b5e25fSSatish Balay if (rp[i] == bcol) { 62249b5e25fSSatish Balay *v++ = ap[bs2*i+bs*cidx+ridx]; 62349b5e25fSSatish Balay goto finished; 62449b5e25fSSatish Balay } 62549b5e25fSSatish Balay } 62697e567efSBarry Smith *v++ = 0.0; 62749b5e25fSSatish Balay finished:; 62849b5e25fSSatish Balay } 62949b5e25fSSatish Balay } 
63049b5e25fSSatish Balay PetscFunctionReturn(0); 63149b5e25fSSatish Balay } 63249b5e25fSSatish Balay 63349b5e25fSSatish Balay 63413f74950SBarry Smith PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 63549b5e25fSSatish Balay { 6360880e062SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 6376849ba73SBarry Smith PetscErrorCode ierr; 638e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,jj,row,nrow,i,col,l,rmax,N,lastcol = -1; 63913f74950SBarry Smith PetscInt *imax =a->imax,*ai=a->i,*ailen=a->ilen; 640d0f46423SBarry Smith PetscInt *aj =a->j,nonew=a->nonew,bs2=a->bs2,bs=A->rmap->bs,stepval; 641ace3abfcSBarry Smith PetscBool roworiented=a->roworiented; 642dd6ea824SBarry Smith const PetscScalar *value = v; 643f15d580aSBarry Smith MatScalar *ap,*aa = a->a,*bap; 6440880e062SHong Zhang 64549b5e25fSSatish Balay PetscFunctionBegin; 64626fbe8dcSKarl Rupp if (roworiented) stepval = (n-1)*bs; 64726fbe8dcSKarl Rupp else stepval = (m-1)*bs; 64826fbe8dcSKarl Rupp 6490880e062SHong Zhang for (k=0; k<m; k++) { /* loop over added rows */ 6500880e062SHong Zhang row = im[k]; 6510880e062SHong Zhang if (row < 0) continue; 652cf9c20a2SJed Brown if (PetscUnlikelyDebug(row >= a->mbs)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Block index row too large %D max %D",row,a->mbs-1); 6530880e062SHong Zhang rp = aj + ai[row]; 6540880e062SHong Zhang ap = aa + bs2*ai[row]; 6550880e062SHong Zhang rmax = imax[row]; 6560880e062SHong Zhang nrow = ailen[row]; 6570880e062SHong Zhang low = 0; 658818f2c47SBarry Smith high = nrow; 6590880e062SHong Zhang for (l=0; l<n; l++) { /* loop over added columns */ 6600880e062SHong Zhang if (in[l] < 0) continue; 6610880e062SHong Zhang col = in[l]; 662cf9c20a2SJed Brown if (PetscUnlikelyDebug(col >= a->nbs)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Block index column too large %D max %D",col,a->nbs-1); 663b98bf0e1SJed Brown if (col < row) { 
66426fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular block */ 66526fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 666b98bf0e1SJed Brown } 66726fbe8dcSKarl Rupp if (roworiented) value = v + k*(stepval+bs)*bs + l*bs; 66826fbe8dcSKarl Rupp else value = v + l*(stepval+bs)*bs + k*bs; 66926fbe8dcSKarl Rupp 67026fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 67126fbe8dcSKarl Rupp else high = nrow; 67226fbe8dcSKarl Rupp 673e2ee6c50SBarry Smith lastcol = col; 6740880e062SHong Zhang while (high-low > 7) { 6750880e062SHong Zhang t = (low+high)/2; 6760880e062SHong Zhang if (rp[t] > col) high = t; 6770880e062SHong Zhang else low = t; 6780880e062SHong Zhang } 6790880e062SHong Zhang for (i=low; i<high; i++) { 6800880e062SHong Zhang if (rp[i] > col) break; 6810880e062SHong Zhang if (rp[i] == col) { 6820880e062SHong Zhang bap = ap + bs2*i; 6830880e062SHong Zhang if (roworiented) { 6840880e062SHong Zhang if (is == ADD_VALUES) { 6850880e062SHong Zhang for (ii=0; ii<bs; ii++,value+=stepval) { 6860880e062SHong Zhang for (jj=ii; jj<bs2; jj+=bs) { 6870880e062SHong Zhang bap[jj] += *value++; 6880880e062SHong Zhang } 6890880e062SHong Zhang } 6900880e062SHong Zhang } else { 6910880e062SHong Zhang for (ii=0; ii<bs; ii++,value+=stepval) { 6920880e062SHong Zhang for (jj=ii; jj<bs2; jj+=bs) { 6930880e062SHong Zhang bap[jj] = *value++; 6940880e062SHong Zhang } 6950880e062SHong Zhang } 6960880e062SHong Zhang } 6970880e062SHong Zhang } else { 6980880e062SHong Zhang if (is == ADD_VALUES) { 6990880e062SHong Zhang for (ii=0; ii<bs; ii++,value+=stepval) { 7000880e062SHong Zhang for (jj=0; jj<bs; jj++) { 7010880e062SHong Zhang *bap++ += *value++; 7020880e062SHong Zhang } 7030880e062SHong Zhang } 7040880e062SHong Zhang } else { 7050880e062SHong Zhang for (ii=0; ii<bs; 
ii++,value+=stepval) { 7060880e062SHong Zhang for (jj=0; jj<bs; jj++) { 7070880e062SHong Zhang *bap++ = *value++; 7080880e062SHong Zhang } 7090880e062SHong Zhang } 7100880e062SHong Zhang } 7110880e062SHong Zhang } 7120880e062SHong Zhang goto noinsert2; 7130880e062SHong Zhang } 7140880e062SHong Zhang } 7150880e062SHong Zhang if (nonew == 1) goto noinsert2; 7162f7d4af7SBarry Smith if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new block index nonzero block (%D, %D) in the matrix", row, col); 717fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,a->mbs,bs2,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 718c03d1d03SSatish Balay N = nrow++ - 1; high++; 7190880e062SHong Zhang /* shift up all the later entries in this row */ 720580bdb30SBarry Smith ierr = PetscArraymove(rp+i+1,rp+i,N-i+1);CHKERRQ(ierr); 721580bdb30SBarry Smith ierr = PetscArraymove(ap+bs2*(i+1),ap+bs2*i,bs2*(N-i+1));CHKERRQ(ierr); 722580bdb30SBarry Smith ierr = PetscArrayzero(ap+bs2*i,bs2);CHKERRQ(ierr); 7230880e062SHong Zhang rp[i] = col; 7240880e062SHong Zhang bap = ap + bs2*i; 7250880e062SHong Zhang if (roworiented) { 7260880e062SHong Zhang for (ii=0; ii<bs; ii++,value+=stepval) { 7270880e062SHong Zhang for (jj=ii; jj<bs2; jj+=bs) { 7280880e062SHong Zhang bap[jj] = *value++; 7290880e062SHong Zhang } 7300880e062SHong Zhang } 7310880e062SHong Zhang } else { 7320880e062SHong Zhang for (ii=0; ii<bs; ii++,value+=stepval) { 7330880e062SHong Zhang for (jj=0; jj<bs; jj++) { 7340880e062SHong Zhang *bap++ = *value++; 7350880e062SHong Zhang } 7360880e062SHong Zhang } 7370880e062SHong Zhang } 7380880e062SHong Zhang noinsert2:; 7390880e062SHong Zhang low = i; 7400880e062SHong Zhang } 7410880e062SHong Zhang ailen[row] = nrow; 7420880e062SHong Zhang } 7430880e062SHong Zhang PetscFunctionReturn(0); 74449b5e25fSSatish Balay } 74549b5e25fSSatish Balay 74664831d72SBarry Smith /* 74764831d72SBarry Smith This is not yet used 74864831d72SBarry Smith */ 7494108e4d5SBarry Smith 
PetscErrorCode MatAssemblyEnd_SeqSBAIJ_SeqAIJ_Inode(Mat A) 7500def2e27SBarry Smith { 7510def2e27SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 7520def2e27SBarry Smith PetscErrorCode ierr; 7530def2e27SBarry Smith const PetscInt *ai = a->i, *aj = a->j,*cols; 7540def2e27SBarry Smith PetscInt i = 0,j,blk_size,m = A->rmap->n,node_count = 0,nzx,nzy,*ns,row,nz,cnt,cnt2,*counts; 755ace3abfcSBarry Smith PetscBool flag; 7560def2e27SBarry Smith 7570def2e27SBarry Smith PetscFunctionBegin; 758785e854fSJed Brown ierr = PetscMalloc1(m,&ns);CHKERRQ(ierr); 7590def2e27SBarry Smith while (i < m) { 7600def2e27SBarry Smith nzx = ai[i+1] - ai[i]; /* Number of nonzeros */ 7610def2e27SBarry Smith /* Limits the number of elements in a node to 'a->inode.limit' */ 7620def2e27SBarry Smith for (j=i+1,blk_size=1; j<m && blk_size <a->inode.limit; ++j,++blk_size) { 7630def2e27SBarry Smith nzy = ai[j+1] - ai[j]; 7640def2e27SBarry Smith if (nzy != (nzx - j + i)) break; 765580bdb30SBarry Smith ierr = PetscArraycmp(aj + ai[i] + j - i,aj + ai[j],nzy,&flag);CHKERRQ(ierr); 7660def2e27SBarry Smith if (!flag) break; 7670def2e27SBarry Smith } 7680def2e27SBarry Smith ns[node_count++] = blk_size; 76926fbe8dcSKarl Rupp 7700def2e27SBarry Smith i = j; 7710def2e27SBarry Smith } 7720def2e27SBarry Smith if (!a->inode.size && m && node_count > .9*m) { 7730def2e27SBarry Smith ierr = PetscFree(ns);CHKERRQ(ierr); 7740def2e27SBarry Smith ierr = PetscInfo2(A,"Found %D nodes out of %D rows. 
Not using Inode routines\n",node_count,m);CHKERRQ(ierr); 7750def2e27SBarry Smith } else { 7760def2e27SBarry Smith a->inode.node_count = node_count; 77726fbe8dcSKarl Rupp 778785e854fSJed Brown ierr = PetscMalloc1(node_count,&a->inode.size);CHKERRQ(ierr); 7793bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,node_count*sizeof(PetscInt));CHKERRQ(ierr); 780580bdb30SBarry Smith ierr = PetscArraycpy(a->inode.size,ns,node_count);CHKERRQ(ierr); 7810def2e27SBarry Smith ierr = PetscFree(ns);CHKERRQ(ierr); 7820def2e27SBarry Smith ierr = PetscInfo3(A,"Found %D nodes of %D. Limit used: %D. Using Inode routines\n",node_count,m,a->inode.limit);CHKERRQ(ierr); 7830def2e27SBarry Smith 7840def2e27SBarry Smith /* count collections of adjacent columns in each inode */ 7850def2e27SBarry Smith row = 0; 7860def2e27SBarry Smith cnt = 0; 7870def2e27SBarry Smith for (i=0; i<node_count; i++) { 7880def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7890def2e27SBarry Smith nz = ai[row+1] - ai[row] - a->inode.size[i]; 7900def2e27SBarry Smith for (j=1; j<nz; j++) { 79126fbe8dcSKarl Rupp if (cols[j] != cols[j-1]+1) cnt++; 7920def2e27SBarry Smith } 7930def2e27SBarry Smith cnt++; 7940def2e27SBarry Smith row += a->inode.size[i]; 7950def2e27SBarry Smith } 796785e854fSJed Brown ierr = PetscMalloc1(2*cnt,&counts);CHKERRQ(ierr); 7970def2e27SBarry Smith cnt = 0; 7980def2e27SBarry Smith row = 0; 7990def2e27SBarry Smith for (i=0; i<node_count; i++) { 8000def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 8010def2e27SBarry Smith counts[2*cnt] = cols[0]; 8020def2e27SBarry Smith nz = ai[row+1] - ai[row] - a->inode.size[i]; 8030def2e27SBarry Smith cnt2 = 1; 8040def2e27SBarry Smith for (j=1; j<nz; j++) { 8050def2e27SBarry Smith if (cols[j] != cols[j-1]+1) { 8060def2e27SBarry Smith counts[2*(cnt++)+1] = cnt2; 8070def2e27SBarry Smith counts[2*cnt] = cols[j]; 8080def2e27SBarry Smith cnt2 = 1; 8090def2e27SBarry Smith } else cnt2++; 8100def2e27SBarry Smith } 8110def2e27SBarry Smith 
counts[2*(cnt++)+1] = cnt2; 8120def2e27SBarry Smith row += a->inode.size[i]; 8130def2e27SBarry Smith } 814*f4259b30SLisandro Dalcin ierr = PetscIntView(2*cnt,counts,NULL);CHKERRQ(ierr); 8150def2e27SBarry Smith } 81638702af4SBarry Smith PetscFunctionReturn(0); 81738702af4SBarry Smith } 81838702af4SBarry Smith 819dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A,MatAssemblyType mode) 82049b5e25fSSatish Balay { 82149b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 8226849ba73SBarry Smith PetscErrorCode ierr; 8238f8f2f0dSBarry Smith PetscInt fshift = 0,i,*ai = a->i,*aj = a->j,*imax = a->imax; 824d0f46423SBarry Smith PetscInt m = A->rmap->N,*ip,N,*ailen = a->ilen; 82513f74950SBarry Smith PetscInt mbs = a->mbs,bs2 = a->bs2,rmax = 0; 82649b5e25fSSatish Balay MatScalar *aa = a->a,*ap; 82749b5e25fSSatish Balay 82849b5e25fSSatish Balay PetscFunctionBegin; 82949b5e25fSSatish Balay if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0); 83049b5e25fSSatish Balay 83149b5e25fSSatish Balay if (m) rmax = ailen[0]; 83249b5e25fSSatish Balay for (i=1; i<mbs; i++) { 83349b5e25fSSatish Balay /* move each row back by the amount of empty slots (fshift) before it*/ 83449b5e25fSSatish Balay fshift += imax[i-1] - ailen[i-1]; 83549b5e25fSSatish Balay rmax = PetscMax(rmax,ailen[i]); 83649b5e25fSSatish Balay if (fshift) { 837580bdb30SBarry Smith ip = aj + ai[i]; 838580bdb30SBarry Smith ap = aa + bs2*ai[i]; 83949b5e25fSSatish Balay N = ailen[i]; 840580bdb30SBarry Smith ierr = PetscArraymove(ip-fshift,ip,N);CHKERRQ(ierr); 841580bdb30SBarry Smith ierr = PetscArraymove(ap-bs2*fshift,ap,bs2*N);CHKERRQ(ierr); 84249b5e25fSSatish Balay } 84349b5e25fSSatish Balay ai[i] = ai[i-1] + ailen[i-1]; 84449b5e25fSSatish Balay } 84549b5e25fSSatish Balay if (mbs) { 84649b5e25fSSatish Balay fshift += imax[mbs-1] - ailen[mbs-1]; 84749b5e25fSSatish Balay ai[mbs] = ai[mbs-1] + ailen[mbs-1]; 84849b5e25fSSatish Balay } 84949b5e25fSSatish Balay /* reset ilen and imax for each row */ 
85049b5e25fSSatish Balay for (i=0; i<mbs; i++) { 85149b5e25fSSatish Balay ailen[i] = imax[i] = ai[i+1] - ai[i]; 85249b5e25fSSatish Balay } 8536c6c5352SBarry Smith a->nz = ai[mbs]; 85449b5e25fSSatish Balay 855b424e231SHong Zhang /* diagonals may have moved, reset it */ 856b424e231SHong Zhang if (a->diag) { 857580bdb30SBarry Smith ierr = PetscArraycpy(a->diag,ai,mbs);CHKERRQ(ierr); 85849b5e25fSSatish Balay } 85926fbe8dcSKarl Rupp if (fshift && a->nounused == -1) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %D X %D block size %D, %D unneeded", m, A->cmap->n, A->rmap->bs, fshift*bs2); 86026fbe8dcSKarl Rupp 861d0f46423SBarry Smith ierr = PetscInfo5(A,"Matrix size: %D X %D, block size %D; storage space: %D unneeded, %D used\n",m,A->rmap->N,A->rmap->bs,fshift*bs2,a->nz*bs2);CHKERRQ(ierr); 862ae15b995SBarry Smith ierr = PetscInfo1(A,"Number of mallocs during MatSetValues is %D\n",a->reallocs);CHKERRQ(ierr); 863ae15b995SBarry Smith ierr = PetscInfo1(A,"Most nonzeros blocks in any row is %D\n",rmax);CHKERRQ(ierr); 86426fbe8dcSKarl Rupp 8658e58a170SBarry Smith A->info.mallocs += a->reallocs; 86649b5e25fSSatish Balay a->reallocs = 0; 86749b5e25fSSatish Balay A->info.nz_unneeded = (PetscReal)fshift*bs2; 868061b2667SBarry Smith a->idiagvalid = PETSC_FALSE; 8694dcd73b1SHong Zhang a->rmax = rmax; 87038702af4SBarry Smith 87138702af4SBarry Smith if (A->cmap->n < 65536 && A->cmap->bs == 1) { 87244e1c64aSLisandro Dalcin if (a->jshort && a->free_jshort) { 87317803ae8SHong Zhang /* when matrix data structure is changed, previous jshort must be replaced */ 87417803ae8SHong Zhang ierr = PetscFree(a->jshort);CHKERRQ(ierr); 87517803ae8SHong Zhang } 876785e854fSJed Brown ierr = PetscMalloc1(a->i[A->rmap->n],&a->jshort);CHKERRQ(ierr); 8773bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)A,a->i[A->rmap->n]*sizeof(unsigned short));CHKERRQ(ierr); 87838702af4SBarry Smith for (i=0; i<a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i]; 87938702af4SBarry Smith 
A->ops->mult = MatMult_SeqSBAIJ_1_ushort; 88041f059aeSBarry Smith A->ops->sor = MatSOR_SeqSBAIJ_ushort; 8814da8f245SBarry Smith a->free_jshort = PETSC_TRUE; 88238702af4SBarry Smith } 88349b5e25fSSatish Balay PetscFunctionReturn(0); 88449b5e25fSSatish Balay } 88549b5e25fSSatish Balay 88649b5e25fSSatish Balay /* 88749b5e25fSSatish Balay This function returns an array of flags which indicate the locations of contiguous 88849b5e25fSSatish Balay blocks that should be zeroed. for eg: if bs = 3 and is = [0,1,2,3,5,6,7,8,9] 88949b5e25fSSatish Balay then the resulting sizes = [3,1,1,3,1] correspondig to sets [(0,1,2),(3),(5),(6,7,8),(9)] 89049b5e25fSSatish Balay Assume: sizes should be long enough to hold all the values. 89149b5e25fSSatish Balay */ 89213f74950SBarry Smith PetscErrorCode MatZeroRows_SeqSBAIJ_Check_Blocks(PetscInt idx[],PetscInt n,PetscInt bs,PetscInt sizes[], PetscInt *bs_max) 89349b5e25fSSatish Balay { 89413f74950SBarry Smith PetscInt i,j,k,row; 895ace3abfcSBarry Smith PetscBool flg; 89649b5e25fSSatish Balay 89749b5e25fSSatish Balay PetscFunctionBegin; 89849b5e25fSSatish Balay for (i=0,j=0; i<n; j++) { 89949b5e25fSSatish Balay row = idx[i]; 90049b5e25fSSatish Balay if (row%bs!=0) { /* Not the begining of a block */ 90149b5e25fSSatish Balay sizes[j] = 1; 90249b5e25fSSatish Balay i++; 90349b5e25fSSatish Balay } else if (i+bs > n) { /* Beginning of a block, but complete block doesn't exist (at idx end) */ 90449b5e25fSSatish Balay sizes[j] = 1; /* Also makes sure atleast 'bs' values exist for next else */ 90549b5e25fSSatish Balay i++; 90649b5e25fSSatish Balay } else { /* Begining of the block, so check if the complete block exists */ 90749b5e25fSSatish Balay flg = PETSC_TRUE; 90849b5e25fSSatish Balay for (k=1; k<bs; k++) { 90949b5e25fSSatish Balay if (row+k != idx[i+k]) { /* break in the block */ 91049b5e25fSSatish Balay flg = PETSC_FALSE; 91149b5e25fSSatish Balay break; 91249b5e25fSSatish Balay } 91349b5e25fSSatish Balay } 914abc0a331SBarry Smith if (flg) { /* 
No break in the bs */ 91549b5e25fSSatish Balay sizes[j] = bs; 91649b5e25fSSatish Balay i += bs; 91749b5e25fSSatish Balay } else { 91849b5e25fSSatish Balay sizes[j] = 1; 91949b5e25fSSatish Balay i++; 92049b5e25fSSatish Balay } 92149b5e25fSSatish Balay } 92249b5e25fSSatish Balay } 92349b5e25fSSatish Balay *bs_max = j; 92449b5e25fSSatish Balay PetscFunctionReturn(0); 92549b5e25fSSatish Balay } 92649b5e25fSSatish Balay 92749b5e25fSSatish Balay 92849b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks). 92949b5e25fSSatish Balay Any a(i,j) with i>j input by user is ingored. 93049b5e25fSSatish Balay */ 93149b5e25fSSatish Balay 93213f74950SBarry Smith PetscErrorCode MatSetValues_SeqSBAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is) 93349b5e25fSSatish Balay { 93449b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 9356849ba73SBarry Smith PetscErrorCode ierr; 936e2ee6c50SBarry Smith PetscInt *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N,lastcol = -1; 93713f74950SBarry Smith PetscInt *imax=a->imax,*ai=a->i,*ailen=a->ilen,roworiented=a->roworiented; 938d0f46423SBarry Smith PetscInt *aj =a->j,nonew=a->nonew,bs=A->rmap->bs,brow,bcol; 93913f74950SBarry Smith PetscInt ridx,cidx,bs2=a->bs2; 94049b5e25fSSatish Balay MatScalar *ap,value,*aa=a->a,*bap; 94149b5e25fSSatish Balay 94249b5e25fSSatish Balay PetscFunctionBegin; 94349b5e25fSSatish Balay for (k=0; k<m; k++) { /* loop over added rows */ 94449b5e25fSSatish Balay row = im[k]; /* row number */ 94549b5e25fSSatish Balay brow = row/bs; /* block row number */ 94649b5e25fSSatish Balay if (row < 0) continue; 947cf9c20a2SJed Brown if (PetscUnlikelyDebug(row >= A->rmap->N)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->N-1); 94849b5e25fSSatish Balay rp = aj + ai[brow]; /*ptr to beginning of column value of the row block*/ 94949b5e25fSSatish Balay ap = aa + bs2*ai[brow]; /*ptr to beginning of element value of the 
row block*/ 95049b5e25fSSatish Balay rmax = imax[brow]; /* maximum space allocated for this row */ 95149b5e25fSSatish Balay nrow = ailen[brow]; /* actual length of this row */ 95249b5e25fSSatish Balay low = 0; 9538509e838SStefano Zampini high = nrow; 95449b5e25fSSatish Balay for (l=0; l<n; l++) { /* loop over added columns */ 95549b5e25fSSatish Balay if (in[l] < 0) continue; 956cf9c20a2SJed Brown if (PetscUnlikelyDebug(in[l] >= A->cmap->N)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->N-1); 95749b5e25fSSatish Balay col = in[l]; 95849b5e25fSSatish Balay bcol = col/bs; /* block col number */ 95949b5e25fSSatish Balay 960941593c8SHong Zhang if (brow > bcol) { 96126fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular values */ 96226fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 963941593c8SHong Zhang } 964f4989cb3SHong Zhang 96549b5e25fSSatish Balay ridx = row % bs; cidx = col % bs; /*row and col index inside the block */ 9668549e402SHong Zhang if ((brow==bcol && ridx<=cidx) || (brow<bcol)) { 96749b5e25fSSatish Balay /* element value a(k,l) */ 96826fbe8dcSKarl Rupp if (roworiented) value = v[l + k*n]; 96926fbe8dcSKarl Rupp else value = v[k + l*m]; 97049b5e25fSSatish Balay 97149b5e25fSSatish Balay /* move pointer bap to a(k,l) quickly and add/insert value */ 97226fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 9738509e838SStefano Zampini else high = nrow; 9748509e838SStefano Zampini 975e2ee6c50SBarry Smith lastcol = col; 97649b5e25fSSatish Balay while (high-low > 7) { 97749b5e25fSSatish Balay t = (low+high)/2; 97849b5e25fSSatish Balay if (rp[t] > bcol) high = t; 97949b5e25fSSatish Balay else low = t; 98049b5e25fSSatish Balay } 98149b5e25fSSatish Balay for (i=low; i<high; i++) { 98249b5e25fSSatish 
Balay if (rp[i] > bcol) break; 98349b5e25fSSatish Balay if (rp[i] == bcol) { 98449b5e25fSSatish Balay bap = ap + bs2*i + bs*cidx + ridx; 98549b5e25fSSatish Balay if (is == ADD_VALUES) *bap += value; 98649b5e25fSSatish Balay else *bap = value; 9878549e402SHong Zhang /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 9888549e402SHong Zhang if (brow == bcol && ridx < cidx) { 9898549e402SHong Zhang bap = ap + bs2*i + bs*ridx + cidx; 9908549e402SHong Zhang if (is == ADD_VALUES) *bap += value; 9918549e402SHong Zhang else *bap = value; 9928549e402SHong Zhang } 99349b5e25fSSatish Balay goto noinsert1; 99449b5e25fSSatish Balay } 99549b5e25fSSatish Balay } 99649b5e25fSSatish Balay 99749b5e25fSSatish Balay if (nonew == 1) goto noinsert1; 998e32f2f54SBarry Smith if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero (%D, %D) in the matrix", row, col); 999fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A,a->mbs,bs2,nrow,brow,bcol,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar); 100049b5e25fSSatish Balay 1001c03d1d03SSatish Balay N = nrow++ - 1; high++; 100249b5e25fSSatish Balay /* shift up all the later entries in this row */ 1003580bdb30SBarry Smith ierr = PetscArraymove(rp+i+1,rp+i,N-i+1);CHKERRQ(ierr); 1004580bdb30SBarry Smith ierr = PetscArraymove(ap+bs2*(i+1),ap+bs2*i,bs2*(N-i+1));CHKERRQ(ierr); 1005580bdb30SBarry Smith ierr = PetscArrayzero(ap+bs2*i,bs2);CHKERRQ(ierr); 100649b5e25fSSatish Balay rp[i] = bcol; 100749b5e25fSSatish Balay ap[bs2*i + bs*cidx + ridx] = value; 10088509e838SStefano Zampini /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 10098509e838SStefano Zampini if (brow == bcol && ridx < cidx) { 10108509e838SStefano Zampini ap[bs2*i + bs*ridx + cidx] = value; 10118509e838SStefano Zampini } 1012e56f5c9eSBarry Smith A->nonzerostate++; 101349b5e25fSSatish Balay noinsert1:; 101449b5e25fSSatish Balay low = i; 10158549e402SHong Zhang } 101649b5e25fSSatish Balay } /* end of loop over added columns */ 
101749b5e25fSSatish Balay ailen[brow] = nrow; 101849b5e25fSSatish Balay } /* end of loop over added rows */ 101949b5e25fSSatish Balay PetscFunctionReturn(0); 102049b5e25fSSatish Balay } 102149b5e25fSSatish Balay 10220481f469SBarry Smith PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA,IS row,const MatFactorInfo *info) 102349b5e25fSSatish Balay { 10244ccecd49SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)inA->data; 102549b5e25fSSatish Balay Mat outA; 1026dfbe8321SBarry Smith PetscErrorCode ierr; 1027ace3abfcSBarry Smith PetscBool row_identity; 102849b5e25fSSatish Balay 102949b5e25fSSatish Balay PetscFunctionBegin; 1030e32f2f54SBarry Smith if (info->levels != 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 is supported for in-place icc"); 1031c84f5b01SHong Zhang ierr = ISIdentity(row,&row_identity);CHKERRQ(ierr); 1032e32f2f54SBarry Smith if (!row_identity) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Matrix reordering is not supported"); 1033e32f2f54SBarry Smith if (inA->rmap->bs != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Matrix block size %D is not supported",inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! 
*/ 1034c84f5b01SHong Zhang 103549b5e25fSSatish Balay outA = inA; 1036d5f3da31SBarry Smith inA->factortype = MAT_FACTOR_ICC; 1037f6224b95SHong Zhang ierr = PetscFree(inA->solvertype);CHKERRQ(ierr); 1038f6224b95SHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype);CHKERRQ(ierr); 103949b5e25fSSatish Balay 10401a3463dfSHong Zhang ierr = MatMarkDiagonal_SeqSBAIJ(inA);CHKERRQ(ierr); 1041d595f711SHong Zhang ierr = MatSeqSBAIJSetNumericFactorization_inplace(inA,row_identity);CHKERRQ(ierr); 104249b5e25fSSatish Balay 1043c3122656SLisandro Dalcin ierr = PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 10446bf464f9SBarry Smith ierr = ISDestroy(&a->row);CHKERRQ(ierr); 1045c84f5b01SHong Zhang a->row = row; 1046c3122656SLisandro Dalcin ierr = PetscObjectReference((PetscObject)row);CHKERRQ(ierr); 10476bf464f9SBarry Smith ierr = ISDestroy(&a->col);CHKERRQ(ierr); 1048c84f5b01SHong Zhang a->col = row; 1049c84f5b01SHong Zhang 1050c84f5b01SHong Zhang /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */ 1051c84f5b01SHong Zhang if (a->icol) {ierr = ISInvertPermutation(row,PETSC_DECIDE, &a->icol);CHKERRQ(ierr);} 10523bb1ff40SBarry Smith ierr = PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol);CHKERRQ(ierr); 105349b5e25fSSatish Balay 105449b5e25fSSatish Balay if (!a->solve_work) { 1055854ce69bSBarry Smith ierr = PetscMalloc1(inA->rmap->N+inA->rmap->bs,&a->solve_work);CHKERRQ(ierr); 10563bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)inA,(inA->rmap->N+inA->rmap->bs)*sizeof(PetscScalar));CHKERRQ(ierr); 105749b5e25fSSatish Balay } 105849b5e25fSSatish Balay 1059719d5645SBarry Smith ierr = MatCholeskyFactorNumeric(outA,inA,info);CHKERRQ(ierr); 106049b5e25fSSatish Balay PetscFunctionReturn(0); 106149b5e25fSSatish Balay } 1062950f1e5bSHong Zhang 10637087cfbeSBarry Smith PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat,PetscInt *indices) 106449b5e25fSSatish Balay { 1065045c9aa0SHong Zhang Mat_SeqSBAIJ *baij = 
(Mat_SeqSBAIJ*)mat->data; 106613f74950SBarry Smith PetscInt i,nz,n; 10677827cd58SJed Brown PetscErrorCode ierr; 106849b5e25fSSatish Balay 106949b5e25fSSatish Balay PetscFunctionBegin; 10706c6c5352SBarry Smith nz = baij->maxnz; 1071d0f46423SBarry Smith n = mat->cmap->n; 107226fbe8dcSKarl Rupp for (i=0; i<nz; i++) baij->j[i] = indices[i]; 107326fbe8dcSKarl Rupp 10746c6c5352SBarry Smith baij->nz = nz; 107526fbe8dcSKarl Rupp for (i=0; i<n; i++) baij->ilen[i] = baij->imax[i]; 107626fbe8dcSKarl Rupp 10777827cd58SJed Brown ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 107849b5e25fSSatish Balay PetscFunctionReturn(0); 107949b5e25fSSatish Balay } 108049b5e25fSSatish Balay 108149b5e25fSSatish Balay /*@ 108219585528SSatish Balay MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows 108349b5e25fSSatish Balay in the matrix. 108449b5e25fSSatish Balay 108549b5e25fSSatish Balay Input Parameters: 108619585528SSatish Balay + mat - the SeqSBAIJ matrix 108749b5e25fSSatish Balay - indices - the column indices 108849b5e25fSSatish Balay 108949b5e25fSSatish Balay Level: advanced 109049b5e25fSSatish Balay 109149b5e25fSSatish Balay Notes: 109249b5e25fSSatish Balay This can be called if you have precomputed the nonzero structure of the 109349b5e25fSSatish Balay matrix and want to provide it to the matrix object to improve the performance 109449b5e25fSSatish Balay of the MatSetValues() operation. 109549b5e25fSSatish Balay 109649b5e25fSSatish Balay You MUST have set the correct numbers of nonzeros per row in the call to 1097d1be2dadSMatthew Knepley MatCreateSeqSBAIJ(), and the columns indices MUST be sorted. 
109849b5e25fSSatish Balay 1099ab9f2c04SSatish Balay MUST be called before any calls to MatSetValues() 110049b5e25fSSatish Balay 1101ab9f2c04SSatish Balay .seealso: MatCreateSeqSBAIJ 110249b5e25fSSatish Balay @*/ 11037087cfbeSBarry Smith PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat,PetscInt *indices) 110449b5e25fSSatish Balay { 11054ac538c5SBarry Smith PetscErrorCode ierr; 110649b5e25fSSatish Balay 110749b5e25fSSatish Balay PetscFunctionBegin; 11080700a824SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 11094482741eSBarry Smith PetscValidPointer(indices,2); 11104ac538c5SBarry Smith ierr = PetscUseMethod(mat,"MatSeqSBAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices));CHKERRQ(ierr); 111149b5e25fSSatish Balay PetscFunctionReturn(0); 111249b5e25fSSatish Balay } 111349b5e25fSSatish Balay 11143c896bc6SHong Zhang PetscErrorCode MatCopy_SeqSBAIJ(Mat A,Mat B,MatStructure str) 11153c896bc6SHong Zhang { 11163c896bc6SHong Zhang PetscErrorCode ierr; 11174c7a3774SStefano Zampini PetscBool isbaij; 11183c896bc6SHong Zhang 11193c896bc6SHong Zhang PetscFunctionBegin; 11204c7a3774SStefano Zampini ierr = PetscObjectTypeCompareAny((PetscObject)B,&isbaij,MATSEQSBAIJ,MATMPISBAIJ,"");CHKERRQ(ierr); 11214c7a3774SStefano Zampini if (!isbaij) SETERRQ1(PetscObjectComm((PetscObject)B),PETSC_ERR_SUP,"Not for matrix type %s",((PetscObject)B)->type_name); 11224c7a3774SStefano Zampini /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. 
*/ 11234c7a3774SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 11243c896bc6SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 11253c896bc6SHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ*)B->data; 11263c896bc6SHong Zhang 11274c7a3774SStefano Zampini if (a->i[a->mbs] != b->i[b->mbs]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different"); 11284c7a3774SStefano Zampini if (a->mbs != b->mbs) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of rows in two matrices are different"); 11294c7a3774SStefano Zampini if (a->bs2 != b->bs2) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Different block size"); 1130580bdb30SBarry Smith ierr = PetscArraycpy(b->a,a->a,a->bs2*a->i[a->mbs]);CHKERRQ(ierr); 1131cdc753b6SBarry Smith ierr = PetscObjectStateIncrease((PetscObject)B);CHKERRQ(ierr); 11323c896bc6SHong Zhang } else { 1133f5edf698SHong Zhang ierr = MatGetRowUpperTriangular(A);CHKERRQ(ierr); 11343c896bc6SHong Zhang ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr); 1135f5edf698SHong Zhang ierr = MatRestoreRowUpperTriangular(A);CHKERRQ(ierr); 11363c896bc6SHong Zhang } 11373c896bc6SHong Zhang PetscFunctionReturn(0); 11383c896bc6SHong Zhang } 11393c896bc6SHong Zhang 11404994cf47SJed Brown PetscErrorCode MatSetUp_SeqSBAIJ(Mat A) 1141273d9f13SBarry Smith { 1142dfbe8321SBarry Smith PetscErrorCode ierr; 1143273d9f13SBarry Smith 1144273d9f13SBarry Smith PetscFunctionBegin; 1145*f4259b30SLisandro Dalcin ierr = MatSeqSBAIJSetPreallocation(A,A->rmap->bs,PETSC_DEFAULT,NULL);CHKERRQ(ierr); 1146273d9f13SBarry Smith PetscFunctionReturn(0); 1147273d9f13SBarry Smith } 1148273d9f13SBarry Smith 1149cda14afcSprj- static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A,PetscScalar *array[]) 1150a6ece127SHong Zhang { 1151a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 11525fd66863SKarl Rupp 1153a6ece127SHong Zhang PetscFunctionBegin; 1154a6ece127SHong Zhang *array = a->a; 1155a6ece127SHong Zhang 
PetscFunctionReturn(0); 1156a6ece127SHong Zhang } 1157a6ece127SHong Zhang 1158cda14afcSprj- static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A,PetscScalar *array[]) 1159a6ece127SHong Zhang { 1160a6ece127SHong Zhang PetscFunctionBegin; 1161cda14afcSprj- *array = NULL; 1162a6ece127SHong Zhang PetscFunctionReturn(0); 1163a6ece127SHong Zhang } 1164a6ece127SHong Zhang 116552768537SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y,Mat X,PetscInt *nnz) 116652768537SHong Zhang { 1167b264fe52SHong Zhang PetscInt bs = Y->rmap->bs,mbs = Y->rmap->N/bs; 116852768537SHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ*)X->data; 116952768537SHong Zhang Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ*)Y->data; 1170b264fe52SHong Zhang PetscErrorCode ierr; 117152768537SHong Zhang 117252768537SHong Zhang PetscFunctionBegin; 117352768537SHong Zhang /* Set the number of nonzeros in the new matrix */ 1174b264fe52SHong Zhang ierr = MatAXPYGetPreallocation_SeqX_private(mbs,x->i,x->j,y->i,y->j,nnz);CHKERRQ(ierr); 117552768537SHong Zhang PetscFunctionReturn(0); 117652768537SHong Zhang } 117752768537SHong Zhang 1178f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str) 117942ee4b1aSHong Zhang { 118042ee4b1aSHong Zhang Mat_SeqSBAIJ *x=(Mat_SeqSBAIJ*)X->data, *y=(Mat_SeqSBAIJ*)Y->data; 1181dfbe8321SBarry Smith PetscErrorCode ierr; 118231ce2d13SHong Zhang PetscInt bs=Y->rmap->bs,bs2=bs*bs; 1183e838b9e7SJed Brown PetscBLASInt one = 1; 118442ee4b1aSHong Zhang 118542ee4b1aSHong Zhang PetscFunctionBegin; 118642ee4b1aSHong Zhang if (str == SAME_NONZERO_PATTERN) { 1187f4df32b1SMatthew Knepley PetscScalar alpha = a; 1188c5df96a5SBarry Smith PetscBLASInt bnz; 1189c5df96a5SBarry Smith ierr = PetscBLASIntCast(x->nz*bs2,&bnz);CHKERRQ(ierr); 11908b83055fSJed Brown PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,x->a,&one,y->a,&one)); 1191a3fa217bSJose E. 
Roman ierr = PetscObjectStateIncrease((PetscObject)Y);CHKERRQ(ierr); 1192ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 1193ab784542SHong Zhang ierr = MatSetOption(X,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE);CHKERRQ(ierr); 1194ab784542SHong Zhang ierr = MatAXPY_Basic(Y,a,X,str);CHKERRQ(ierr); 1195ab784542SHong Zhang ierr = MatSetOption(X,MAT_GETROW_UPPERTRIANGULAR,PETSC_FALSE);CHKERRQ(ierr); 119642ee4b1aSHong Zhang } else { 119752768537SHong Zhang Mat B; 119852768537SHong Zhang PetscInt *nnz; 119952768537SHong Zhang if (bs != X->rmap->bs) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Matrices must have same block size"); 1200f5edf698SHong Zhang ierr = MatGetRowUpperTriangular(X);CHKERRQ(ierr); 120152768537SHong Zhang ierr = MatGetRowUpperTriangular(Y);CHKERRQ(ierr); 120252768537SHong Zhang ierr = PetscMalloc1(Y->rmap->N,&nnz);CHKERRQ(ierr); 120352768537SHong Zhang ierr = MatCreate(PetscObjectComm((PetscObject)Y),&B);CHKERRQ(ierr); 120452768537SHong Zhang ierr = PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name);CHKERRQ(ierr); 120552768537SHong Zhang ierr = MatSetSizes(B,Y->rmap->n,Y->cmap->n,Y->rmap->N,Y->cmap->N);CHKERRQ(ierr); 120652768537SHong Zhang ierr = MatSetBlockSizesFromMats(B,Y,Y);CHKERRQ(ierr); 12074c7a3774SStefano Zampini ierr = MatSetType(B,((PetscObject)Y)->type_name);CHKERRQ(ierr); 120852768537SHong Zhang ierr = MatAXPYGetPreallocation_SeqSBAIJ(Y,X,nnz);CHKERRQ(ierr); 120952768537SHong Zhang ierr = MatSeqSBAIJSetPreallocation(B,bs,0,nnz);CHKERRQ(ierr); 121052768537SHong Zhang 121152768537SHong Zhang ierr = MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr); 121252768537SHong Zhang 121328be2f97SBarry Smith ierr = MatHeaderReplace(Y,&B);CHKERRQ(ierr); 121452768537SHong Zhang ierr = PetscFree(nnz);CHKERRQ(ierr); 1215f5edf698SHong Zhang ierr = MatRestoreRowUpperTriangular(X);CHKERRQ(ierr); 121652768537SHong Zhang ierr = MatRestoreRowUpperTriangular(Y);CHKERRQ(ierr); 121742ee4b1aSHong Zhang } 
121842ee4b1aSHong Zhang PetscFunctionReturn(0); 121942ee4b1aSHong Zhang } 122042ee4b1aSHong Zhang 1221ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A,PetscReal tol,PetscBool *flg) 1222efcf0fc3SBarry Smith { 1223efcf0fc3SBarry Smith PetscFunctionBegin; 1224efcf0fc3SBarry Smith *flg = PETSC_TRUE; 1225efcf0fc3SBarry Smith PetscFunctionReturn(0); 1226efcf0fc3SBarry Smith } 1227efcf0fc3SBarry Smith 1228ace3abfcSBarry Smith PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A,PetscBool *flg) 1229efcf0fc3SBarry Smith { 1230efcf0fc3SBarry Smith PetscFunctionBegin; 1231efcf0fc3SBarry Smith *flg = PETSC_TRUE; 1232efcf0fc3SBarry Smith PetscFunctionReturn(0); 1233efcf0fc3SBarry Smith } 1234efcf0fc3SBarry Smith 1235ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A,PetscReal tol,PetscBool *flg) 1236efcf0fc3SBarry Smith { 1237efcf0fc3SBarry Smith PetscFunctionBegin; 1238efcf0fc3SBarry Smith *flg = PETSC_FALSE; 1239efcf0fc3SBarry Smith PetscFunctionReturn(0); 1240efcf0fc3SBarry Smith } 1241efcf0fc3SBarry Smith 124299cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqSBAIJ(Mat A) 124399cafbc1SBarry Smith { 124499cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 124599cafbc1SBarry Smith PetscInt i,nz = a->bs2*a->i[a->mbs]; 1246dd6ea824SBarry Smith MatScalar *aa = a->a; 124799cafbc1SBarry Smith 124899cafbc1SBarry Smith PetscFunctionBegin; 124999cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]); 125099cafbc1SBarry Smith PetscFunctionReturn(0); 125199cafbc1SBarry Smith } 125299cafbc1SBarry Smith 125399cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A) 125499cafbc1SBarry Smith { 125599cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ*)A->data; 125699cafbc1SBarry Smith PetscInt i,nz = a->bs2*a->i[a->mbs]; 1257dd6ea824SBarry Smith MatScalar *aa = a->a; 125899cafbc1SBarry Smith 125999cafbc1SBarry Smith PetscFunctionBegin; 126099cafbc1SBarry Smith for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 
126199cafbc1SBarry Smith PetscFunctionReturn(0); 126299cafbc1SBarry Smith } 126399cafbc1SBarry Smith 12643bededecSBarry Smith PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A,PetscInt is_n,const PetscInt is_idx[],PetscScalar diag,Vec x, Vec b) 12653bededecSBarry Smith { 12663bededecSBarry Smith Mat_SeqSBAIJ *baij=(Mat_SeqSBAIJ*)A->data; 12673bededecSBarry Smith PetscErrorCode ierr; 12683bededecSBarry Smith PetscInt i,j,k,count; 12693bededecSBarry Smith PetscInt bs =A->rmap->bs,bs2=baij->bs2,row,col; 12703bededecSBarry Smith PetscScalar zero = 0.0; 12713bededecSBarry Smith MatScalar *aa; 12723bededecSBarry Smith const PetscScalar *xx; 12733bededecSBarry Smith PetscScalar *bb; 127456777dd2SBarry Smith PetscBool *zeroed,vecs = PETSC_FALSE; 12753bededecSBarry Smith 12763bededecSBarry Smith PetscFunctionBegin; 12773bededecSBarry Smith /* fix right hand side if needed */ 12783bededecSBarry Smith if (x && b) { 12793bededecSBarry Smith ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr); 12803bededecSBarry Smith ierr = VecGetArray(b,&bb);CHKERRQ(ierr); 128156777dd2SBarry Smith vecs = PETSC_TRUE; 12823bededecSBarry Smith } 12833bededecSBarry Smith 12843bededecSBarry Smith /* zero the columns */ 12851795a4d1SJed Brown ierr = PetscCalloc1(A->rmap->n,&zeroed);CHKERRQ(ierr); 12863bededecSBarry Smith for (i=0; i<is_n; i++) { 12873bededecSBarry Smith if (is_idx[i] < 0 || is_idx[i] >= A->rmap->N) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range",is_idx[i]); 12883bededecSBarry Smith zeroed[is_idx[i]] = PETSC_TRUE; 12893bededecSBarry Smith } 129056777dd2SBarry Smith if (vecs) { 129156777dd2SBarry Smith for (i=0; i<A->rmap->N; i++) { 129256777dd2SBarry Smith row = i/bs; 129356777dd2SBarry Smith for (j=baij->i[row]; j<baij->i[row+1]; j++) { 129456777dd2SBarry Smith for (k=0; k<bs; k++) { 129556777dd2SBarry Smith col = bs*baij->j[j] + k; 129656777dd2SBarry Smith if (col <= i) continue; 129756777dd2SBarry Smith aa = ((MatScalar*)(baij->a)) + j*bs2 + (i%bs) + bs*k; 
129826fbe8dcSKarl Rupp if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0]*xx[col]; 129926fbe8dcSKarl Rupp if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0]*xx[i]; 130056777dd2SBarry Smith } 130156777dd2SBarry Smith } 130256777dd2SBarry Smith } 130326fbe8dcSKarl Rupp for (i=0; i<is_n; i++) bb[is_idx[i]] = diag*xx[is_idx[i]]; 130456777dd2SBarry Smith } 130556777dd2SBarry Smith 13063bededecSBarry Smith for (i=0; i<A->rmap->N; i++) { 13073bededecSBarry Smith if (!zeroed[i]) { 13083bededecSBarry Smith row = i/bs; 13093bededecSBarry Smith for (j=baij->i[row]; j<baij->i[row+1]; j++) { 13103bededecSBarry Smith for (k=0; k<bs; k++) { 13113bededecSBarry Smith col = bs*baij->j[j] + k; 13123bededecSBarry Smith if (zeroed[col]) { 13133bededecSBarry Smith aa = ((MatScalar*)(baij->a)) + j*bs2 + (i%bs) + bs*k; 13143bededecSBarry Smith aa[0] = 0.0; 13153bededecSBarry Smith } 13163bededecSBarry Smith } 13173bededecSBarry Smith } 13183bededecSBarry Smith } 13193bededecSBarry Smith } 13203bededecSBarry Smith ierr = PetscFree(zeroed);CHKERRQ(ierr); 132156777dd2SBarry Smith if (vecs) { 132256777dd2SBarry Smith ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr); 132356777dd2SBarry Smith ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr); 132456777dd2SBarry Smith } 13253bededecSBarry Smith 13263bededecSBarry Smith /* zero the rows */ 13273bededecSBarry Smith for (i=0; i<is_n; i++) { 13283bededecSBarry Smith row = is_idx[i]; 13293bededecSBarry Smith count = (baij->i[row/bs +1] - baij->i[row/bs])*bs; 13303bededecSBarry Smith aa = ((MatScalar*)(baij->a)) + baij->i[row/bs]*bs2 + (row%bs); 13313bededecSBarry Smith for (k=0; k<count; k++) { 13323bededecSBarry Smith aa[0] = zero; 13333bededecSBarry Smith aa += bs; 13343bededecSBarry Smith } 13353bededecSBarry Smith if (diag != 0.0) { 13363bededecSBarry Smith ierr = (*A->ops->setvalues)(A,1,&row,1,&row,&diag,INSERT_VALUES);CHKERRQ(ierr); 13373bededecSBarry Smith } 13383bededecSBarry Smith } 13393bededecSBarry Smith ierr = 
MatAssemblyEnd_SeqSBAIJ(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 13403bededecSBarry Smith PetscFunctionReturn(0); 13413bededecSBarry Smith } 13423bededecSBarry Smith 13437d68702bSBarry Smith PetscErrorCode MatShift_SeqSBAIJ(Mat Y,PetscScalar a) 13447d68702bSBarry Smith { 13457d68702bSBarry Smith PetscErrorCode ierr; 13467d68702bSBarry Smith Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ*)Y->data; 13477d68702bSBarry Smith 13487d68702bSBarry Smith PetscFunctionBegin; 13496f33a894SBarry Smith if (!Y->preallocated || !aij->nz) { 13507d68702bSBarry Smith ierr = MatSeqSBAIJSetPreallocation(Y,Y->rmap->bs,1,NULL);CHKERRQ(ierr); 13517d68702bSBarry Smith } 13527d68702bSBarry Smith ierr = MatShift_Basic(Y,a);CHKERRQ(ierr); 13537d68702bSBarry Smith PetscFunctionReturn(0); 13547d68702bSBarry Smith } 13557d68702bSBarry Smith 135649b5e25fSSatish Balay /* -------------------------------------------------------------------*/ 13573964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ, 135849b5e25fSSatish Balay MatGetRow_SeqSBAIJ, 135949b5e25fSSatish Balay MatRestoreRow_SeqSBAIJ, 136049b5e25fSSatish Balay MatMult_SeqSBAIJ_N, 136197304618SKris Buschelman /* 4*/ MatMultAdd_SeqSBAIJ_N, 1362431c96f7SBarry Smith MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */ 1363e005ede5SBarry Smith MatMultAdd_SeqSBAIJ_N, 1364*f4259b30SLisandro Dalcin NULL, 1365*f4259b30SLisandro Dalcin NULL, 1366*f4259b30SLisandro Dalcin NULL, 1367*f4259b30SLisandro Dalcin /* 10*/ NULL, 1368*f4259b30SLisandro Dalcin NULL, 1369c078aec8SLisandro Dalcin MatCholeskyFactor_SeqSBAIJ, 137041f059aeSBarry Smith MatSOR_SeqSBAIJ, 137149b5e25fSSatish Balay MatTranspose_SeqSBAIJ, 137297304618SKris Buschelman /* 15*/ MatGetInfo_SeqSBAIJ, 137349b5e25fSSatish Balay MatEqual_SeqSBAIJ, 137449b5e25fSSatish Balay MatGetDiagonal_SeqSBAIJ, 137549b5e25fSSatish Balay MatDiagonalScale_SeqSBAIJ, 137649b5e25fSSatish Balay MatNorm_SeqSBAIJ, 1377*f4259b30SLisandro Dalcin /* 20*/ NULL, 137849b5e25fSSatish 
Balay MatAssemblyEnd_SeqSBAIJ, 137949b5e25fSSatish Balay MatSetOption_SeqSBAIJ, 138049b5e25fSSatish Balay MatZeroEntries_SeqSBAIJ, 1381*f4259b30SLisandro Dalcin /* 24*/ NULL, 1382*f4259b30SLisandro Dalcin NULL, 1383*f4259b30SLisandro Dalcin NULL, 1384*f4259b30SLisandro Dalcin NULL, 1385*f4259b30SLisandro Dalcin NULL, 13864994cf47SJed Brown /* 29*/ MatSetUp_SeqSBAIJ, 1387*f4259b30SLisandro Dalcin NULL, 1388*f4259b30SLisandro Dalcin NULL, 1389*f4259b30SLisandro Dalcin NULL, 1390*f4259b30SLisandro Dalcin NULL, 1391d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqSBAIJ, 1392*f4259b30SLisandro Dalcin NULL, 1393*f4259b30SLisandro Dalcin NULL, 1394*f4259b30SLisandro Dalcin NULL, 1395c84f5b01SHong Zhang MatICCFactor_SeqSBAIJ, 1396d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqSBAIJ, 13977dae84e0SHong Zhang MatCreateSubMatrices_SeqSBAIJ, 139849b5e25fSSatish Balay MatIncreaseOverlap_SeqSBAIJ, 139949b5e25fSSatish Balay MatGetValues_SeqSBAIJ, 14003c896bc6SHong Zhang MatCopy_SeqSBAIJ, 1401*f4259b30SLisandro Dalcin /* 44*/ NULL, 140249b5e25fSSatish Balay MatScale_SeqSBAIJ, 14037d68702bSBarry Smith MatShift_SeqSBAIJ, 1404*f4259b30SLisandro Dalcin NULL, 14053bededecSBarry Smith MatZeroRowsColumns_SeqSBAIJ, 1406*f4259b30SLisandro Dalcin /* 49*/ NULL, 140749b5e25fSSatish Balay MatGetRowIJ_SeqSBAIJ, 140849b5e25fSSatish Balay MatRestoreRowIJ_SeqSBAIJ, 1409*f4259b30SLisandro Dalcin NULL, 1410*f4259b30SLisandro Dalcin NULL, 1411*f4259b30SLisandro Dalcin /* 54*/ NULL, 1412*f4259b30SLisandro Dalcin NULL, 1413*f4259b30SLisandro Dalcin NULL, 1414*f4259b30SLisandro Dalcin NULL, 141549b5e25fSSatish Balay MatSetValuesBlocked_SeqSBAIJ, 14167dae84e0SHong Zhang /* 59*/ MatCreateSubMatrix_SeqSBAIJ, 1417*f4259b30SLisandro Dalcin NULL, 1418*f4259b30SLisandro Dalcin NULL, 1419*f4259b30SLisandro Dalcin NULL, 1420*f4259b30SLisandro Dalcin NULL, 1421*f4259b30SLisandro Dalcin /* 64*/ NULL, 1422*f4259b30SLisandro Dalcin NULL, 1423*f4259b30SLisandro Dalcin NULL, 1424*f4259b30SLisandro Dalcin NULL, 
1425*f4259b30SLisandro Dalcin NULL, 1426d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqSBAIJ, 1427*f4259b30SLisandro Dalcin NULL, 142828d58a37SPierre Jolivet MatConvert_MPISBAIJ_Basic, 1429*f4259b30SLisandro Dalcin NULL, 1430*f4259b30SLisandro Dalcin NULL, 1431*f4259b30SLisandro Dalcin /* 74*/ NULL, 1432*f4259b30SLisandro Dalcin NULL, 1433*f4259b30SLisandro Dalcin NULL, 1434*f4259b30SLisandro Dalcin NULL, 1435*f4259b30SLisandro Dalcin NULL, 1436*f4259b30SLisandro Dalcin /* 79*/ NULL, 1437*f4259b30SLisandro Dalcin NULL, 1438*f4259b30SLisandro Dalcin NULL, 143997304618SKris Buschelman MatGetInertia_SeqSBAIJ, 14405bba2384SShri Abhyankar MatLoad_SeqSBAIJ, 1441d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqSBAIJ, 1442865e5f61SKris Buschelman MatIsHermitian_SeqSBAIJ, 1443efcf0fc3SBarry Smith MatIsStructurallySymmetric_SeqSBAIJ, 1444*f4259b30SLisandro Dalcin NULL, 1445*f4259b30SLisandro Dalcin NULL, 1446*f4259b30SLisandro Dalcin /* 89*/ NULL, 1447*f4259b30SLisandro Dalcin NULL, 1448*f4259b30SLisandro Dalcin NULL, 1449*f4259b30SLisandro Dalcin NULL, 1450*f4259b30SLisandro Dalcin NULL, 1451*f4259b30SLisandro Dalcin /* 94*/ NULL, 1452*f4259b30SLisandro Dalcin NULL, 1453*f4259b30SLisandro Dalcin NULL, 1454*f4259b30SLisandro Dalcin NULL, 1455*f4259b30SLisandro Dalcin NULL, 1456*f4259b30SLisandro Dalcin /* 99*/ NULL, 1457*f4259b30SLisandro Dalcin NULL, 1458*f4259b30SLisandro Dalcin NULL, 1459*f4259b30SLisandro Dalcin NULL, 1460*f4259b30SLisandro Dalcin NULL, 1461*f4259b30SLisandro Dalcin /*104*/ NULL, 146299cafbc1SBarry Smith MatRealPart_SeqSBAIJ, 1463f5edf698SHong Zhang MatImaginaryPart_SeqSBAIJ, 1464f5edf698SHong Zhang MatGetRowUpperTriangular_SeqSBAIJ, 14652af78befSBarry Smith MatRestoreRowUpperTriangular_SeqSBAIJ, 1466*f4259b30SLisandro Dalcin /*109*/ NULL, 1467*f4259b30SLisandro Dalcin NULL, 1468*f4259b30SLisandro Dalcin NULL, 1469*f4259b30SLisandro Dalcin NULL, 1470547795f9SHong Zhang MatMissingDiagonal_SeqSBAIJ, 1471*f4259b30SLisandro Dalcin /*114*/ NULL, 
1472*f4259b30SLisandro Dalcin NULL, 1473*f4259b30SLisandro Dalcin NULL, 1474*f4259b30SLisandro Dalcin NULL, 1475*f4259b30SLisandro Dalcin NULL, 1476*f4259b30SLisandro Dalcin /*119*/ NULL, 1477*f4259b30SLisandro Dalcin NULL, 1478*f4259b30SLisandro Dalcin NULL, 1479*f4259b30SLisandro Dalcin NULL, 1480*f4259b30SLisandro Dalcin NULL, 1481*f4259b30SLisandro Dalcin /*124*/ NULL, 1482*f4259b30SLisandro Dalcin NULL, 1483*f4259b30SLisandro Dalcin NULL, 1484*f4259b30SLisandro Dalcin NULL, 1485*f4259b30SLisandro Dalcin NULL, 1486*f4259b30SLisandro Dalcin /*129*/ NULL, 1487*f4259b30SLisandro Dalcin NULL, 1488*f4259b30SLisandro Dalcin NULL, 1489*f4259b30SLisandro Dalcin NULL, 1490*f4259b30SLisandro Dalcin NULL, 1491*f4259b30SLisandro Dalcin /*134*/ NULL, 1492*f4259b30SLisandro Dalcin NULL, 1493*f4259b30SLisandro Dalcin NULL, 1494*f4259b30SLisandro Dalcin NULL, 1495*f4259b30SLisandro Dalcin NULL, 149646533700Sstefano_zampini /*139*/ MatSetBlockSizes_Default, 1497*f4259b30SLisandro Dalcin NULL, 1498*f4259b30SLisandro Dalcin NULL, 1499*f4259b30SLisandro Dalcin NULL, 1500*f4259b30SLisandro Dalcin NULL, 150159f5e6ceSHong Zhang /*144*/MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ 150299cafbc1SBarry Smith }; 1503be1d678aSKris Buschelman 15047087cfbeSBarry Smith PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat) 150549b5e25fSSatish Balay { 15064afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ*)mat->data; 1507d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N]*mat->rmap->bs*aij->bs2; 1508dfbe8321SBarry Smith PetscErrorCode ierr; 150949b5e25fSSatish Balay 151049b5e25fSSatish Balay PetscFunctionBegin; 1511e7e72b3dSBarry Smith if (aij->nonew != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 151249b5e25fSSatish Balay 151349b5e25fSSatish Balay /* allocate space for values if not already there */ 151449b5e25fSSatish Balay if (!aij->saved_values) { 1515854ce69bSBarry Smith ierr = 
PetscMalloc1(nz+1,&aij->saved_values);CHKERRQ(ierr); 151649b5e25fSSatish Balay } 151749b5e25fSSatish Balay 151849b5e25fSSatish Balay /* copy values over */ 1519580bdb30SBarry Smith ierr = PetscArraycpy(aij->saved_values,aij->a,nz);CHKERRQ(ierr); 152049b5e25fSSatish Balay PetscFunctionReturn(0); 152149b5e25fSSatish Balay } 152249b5e25fSSatish Balay 15237087cfbeSBarry Smith PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat) 152449b5e25fSSatish Balay { 15254afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ*)mat->data; 15266849ba73SBarry Smith PetscErrorCode ierr; 1527d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N]*mat->rmap->bs*aij->bs2; 152849b5e25fSSatish Balay 152949b5e25fSSatish Balay PetscFunctionBegin; 1530e7e72b3dSBarry Smith if (aij->nonew != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 1531e7e72b3dSBarry Smith if (!aij->saved_values) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first"); 153249b5e25fSSatish Balay 153349b5e25fSSatish Balay /* copy values over */ 1534580bdb30SBarry Smith ierr = PetscArraycpy(aij->a,aij->saved_values,nz);CHKERRQ(ierr); 153549b5e25fSSatish Balay PetscFunctionReturn(0); 153649b5e25fSSatish Balay } 153749b5e25fSSatish Balay 1538367daffbSBarry Smith static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B,PetscInt bs,PetscInt nz,PetscInt *nnz) 153949b5e25fSSatish Balay { 1540c464158bSHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ*)B->data; 15416849ba73SBarry Smith PetscErrorCode ierr; 15424dcd73b1SHong Zhang PetscInt i,mbs,nbs,bs2; 15432576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE,flg = PETSC_FALSE,realalloc = PETSC_FALSE; 154449b5e25fSSatish Balay 154549b5e25fSSatish Balay PetscFunctionBegin; 15462576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 1547db4efbfdSBarry Smith 154833d57670SJed Brown ierr = MatSetBlockSize(B,PetscAbs(bs));CHKERRQ(ierr); 154926283091SBarry Smith ierr = 
PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 155026283091SBarry Smith ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 1551476417e5SBarry Smith if (B->rmap->N > B->cmap->N) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"SEQSBAIJ matrix cannot have more rows %D than columns %D",B->rmap->N,B->cmap->N); 1552e02043d6SBarry Smith ierr = PetscLayoutGetBlockSize(B->rmap,&bs);CHKERRQ(ierr); 1553899cda47SBarry Smith 155421940c7eSstefano_zampini B->preallocated = PETSC_TRUE; 155521940c7eSstefano_zampini 1556d0f46423SBarry Smith mbs = B->rmap->N/bs; 15574dcd73b1SHong Zhang nbs = B->cmap->n/bs; 155849b5e25fSSatish Balay bs2 = bs*bs; 155949b5e25fSSatish Balay 15604dcd73b1SHong Zhang if (mbs*bs != B->rmap->N || nbs*bs!=B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Number rows, cols must be divisible by blocksize"); 156149b5e25fSSatish Balay 1562ab93d7beSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 1563ab93d7beSBarry Smith skipallocation = PETSC_TRUE; 1564ab93d7beSBarry Smith nz = 0; 1565ab93d7beSBarry Smith } 1566ab93d7beSBarry Smith 1567435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3; 1568e32f2f54SBarry Smith if (nz < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %D",nz); 156949b5e25fSSatish Balay if (nnz) { 157049b5e25fSSatish Balay for (i=0; i<mbs; i++) { 1571e32f2f54SBarry Smith if (nnz[i] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %D value %D",i,nnz[i]); 1572de64b629SHong Zhang if (nnz[i] > nbs) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than block row length: local row %D value %D block rowlength %D",i,nnz[i],nbs); 157349b5e25fSSatish Balay } 157449b5e25fSSatish Balay } 157549b5e25fSSatish Balay 1576db4efbfdSBarry Smith B->ops->mult = MatMult_SeqSBAIJ_N; 1577db4efbfdSBarry Smith B->ops->multadd = MatMultAdd_SeqSBAIJ_N; 1578db4efbfdSBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_N; 1579db4efbfdSBarry Smith 
B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N; 158026fbe8dcSKarl Rupp 1581c5929fdfSBarry Smith ierr = PetscOptionsGetBool(((PetscObject)B)->options,((PetscObject)B)->prefix,"-mat_no_unroll",&flg,NULL);CHKERRQ(ierr); 158249b5e25fSSatish Balay if (!flg) { 158349b5e25fSSatish Balay switch (bs) { 158449b5e25fSSatish Balay case 1: 158549b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_1; 158649b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_1; 1587431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_1; 1588431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1; 158949b5e25fSSatish Balay break; 159049b5e25fSSatish Balay case 2: 159149b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_2; 159249b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_2; 1593431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_2; 1594431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2; 159549b5e25fSSatish Balay break; 159649b5e25fSSatish Balay case 3: 159749b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_3; 159849b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_3; 1599431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_3; 1600431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3; 160149b5e25fSSatish Balay break; 160249b5e25fSSatish Balay case 4: 160349b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_4; 160449b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_4; 1605431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_4; 1606431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4; 160749b5e25fSSatish Balay break; 160849b5e25fSSatish Balay case 5: 160949b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_5; 161049b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_5; 1611431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_5; 1612431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5; 161349b5e25fSSatish Balay break; 
161449b5e25fSSatish Balay case 6: 161549b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_6; 161649b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_6; 1617431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_6; 1618431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6; 161949b5e25fSSatish Balay break; 162049b5e25fSSatish Balay case 7: 1621de53e5efSHong Zhang B->ops->mult = MatMult_SeqSBAIJ_7; 162249b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_7; 1623431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_7; 1624431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7; 162549b5e25fSSatish Balay break; 162649b5e25fSSatish Balay } 162749b5e25fSSatish Balay } 162849b5e25fSSatish Balay 162949b5e25fSSatish Balay b->mbs = mbs; 16304dcd73b1SHong Zhang b->nbs = nbs; 1631ab93d7beSBarry Smith if (!skipallocation) { 16322ee49352SLisandro Dalcin if (!b->imax) { 1633dcca6d9dSJed Brown ierr = PetscMalloc2(mbs,&b->imax,mbs,&b->ilen);CHKERRQ(ierr); 163426fbe8dcSKarl Rupp 1635c760cd28SBarry Smith b->free_imax_ilen = PETSC_TRUE; 163626fbe8dcSKarl Rupp 16373bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,2*mbs*sizeof(PetscInt));CHKERRQ(ierr); 16382ee49352SLisandro Dalcin } 163949b5e25fSSatish Balay if (!nnz) { 1640435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 164149b5e25fSSatish Balay else if (nz <= 0) nz = 1; 16425d2a9ed1SStefano Zampini nz = PetscMin(nbs,nz); 164326fbe8dcSKarl Rupp for (i=0; i<mbs; i++) b->imax[i] = nz; 1644153ea458SHong Zhang nz = nz*mbs; /* total nz */ 164549b5e25fSSatish Balay } else { 1646c73702f5SBarry Smith PetscInt64 nz64 = 0; 1647c73702f5SBarry Smith for (i=0; i<mbs; i++) {b->imax[i] = nnz[i]; nz64 += nnz[i];} 1648c73702f5SBarry Smith ierr = PetscIntCast(nz64,&nz);CHKERRQ(ierr); 164949b5e25fSSatish Balay } 16502ee49352SLisandro Dalcin /* b->ilen will count nonzeros in each block row so far. 
*/ 165126fbe8dcSKarl Rupp for (i=0; i<mbs; i++) b->ilen[i] = 0; 16526c6c5352SBarry Smith /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */ 165349b5e25fSSatish Balay 165449b5e25fSSatish Balay /* allocate the matrix space */ 16552ee49352SLisandro Dalcin ierr = MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i);CHKERRQ(ierr); 1656dcca6d9dSJed Brown ierr = PetscMalloc3(bs2*nz,&b->a,nz,&b->j,B->rmap->N+1,&b->i);CHKERRQ(ierr); 16573bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->N+1)*sizeof(PetscInt)+nz*(bs2*sizeof(PetscScalar)+sizeof(PetscInt)));CHKERRQ(ierr); 1658580bdb30SBarry Smith ierr = PetscArrayzero(b->a,nz*bs2);CHKERRQ(ierr); 1659580bdb30SBarry Smith ierr = PetscArrayzero(b->j,nz);CHKERRQ(ierr); 166026fbe8dcSKarl Rupp 166149b5e25fSSatish Balay b->singlemalloc = PETSC_TRUE; 166249b5e25fSSatish Balay 166349b5e25fSSatish Balay /* pointer to beginning of each row */ 1664e60cf9a0SBarry Smith b->i[0] = 0; 166526fbe8dcSKarl Rupp for (i=1; i<mbs+1; i++) b->i[i] = b->i[i-1] + b->imax[i-1]; 166626fbe8dcSKarl Rupp 1667e6b907acSBarry Smith b->free_a = PETSC_TRUE; 1668e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 1669e811da20SHong Zhang } else { 1670e6b907acSBarry Smith b->free_a = PETSC_FALSE; 1671e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 1672ab93d7beSBarry Smith } 167349b5e25fSSatish Balay 167449b5e25fSSatish Balay b->bs2 = bs2; 16756c6c5352SBarry Smith b->nz = 0; 1676b32cb4a7SJed Brown b->maxnz = nz; 1677*f4259b30SLisandro Dalcin b->inew = NULL; 1678*f4259b30SLisandro Dalcin b->jnew = NULL; 1679*f4259b30SLisandro Dalcin b->anew = NULL; 1680*f4259b30SLisandro Dalcin b->a2anew = NULL; 16811a3463dfSHong Zhang b->permute = PETSC_FALSE; 1682cb7b82ddSBarry Smith 1683cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 1684cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 16852576faa2SJed Brown if (realalloc) {ierr = MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);} 1686c464158bSHong Zhang PetscFunctionReturn(0); 
1687c464158bSHong Zhang } 1688153ea458SHong Zhang 168938f409ebSLisandro Dalcin PetscErrorCode MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B,PetscInt bs,const PetscInt ii[],const PetscInt jj[], const PetscScalar V[]) 169038f409ebSLisandro Dalcin { 16910cd7f59aSBarry Smith PetscInt i,j,m,nz,anz, nz_max=0,*nnz; 1692*f4259b30SLisandro Dalcin PetscScalar *values=NULL; 169338f409ebSLisandro Dalcin PetscBool roworiented = ((Mat_SeqSBAIJ*)B->data)->roworiented; 169438f409ebSLisandro Dalcin PetscErrorCode ierr; 16950cd7f59aSBarry Smith 169638f409ebSLisandro Dalcin PetscFunctionBegin; 169738f409ebSLisandro Dalcin if (bs < 1) SETERRQ1(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_OUTOFRANGE,"Invalid block size specified, must be positive but it is %D",bs); 169838f409ebSLisandro Dalcin ierr = PetscLayoutSetBlockSize(B->rmap,bs);CHKERRQ(ierr); 169938f409ebSLisandro Dalcin ierr = PetscLayoutSetBlockSize(B->cmap,bs);CHKERRQ(ierr); 170038f409ebSLisandro Dalcin ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr); 170138f409ebSLisandro Dalcin ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr); 170238f409ebSLisandro Dalcin ierr = PetscLayoutGetBlockSize(B->rmap,&bs);CHKERRQ(ierr); 170338f409ebSLisandro Dalcin m = B->rmap->n/bs; 170438f409ebSLisandro Dalcin 170538f409ebSLisandro Dalcin if (ii[0]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"ii[0] must be 0 but it is %D",ii[0]); 1706854ce69bSBarry Smith ierr = PetscMalloc1(m+1,&nnz);CHKERRQ(ierr); 170738f409ebSLisandro Dalcin for (i=0; i<m; i++) { 170838f409ebSLisandro Dalcin nz = ii[i+1] - ii[i]; 170938f409ebSLisandro Dalcin if (nz < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D has a negative number of columns %D",i,nz); 17100cd7f59aSBarry Smith anz = 0; 17110cd7f59aSBarry Smith for (j=0; j<nz; j++) { 17120cd7f59aSBarry Smith /* count only values on the diagonal or above */ 17130cd7f59aSBarry Smith if (jj[ii[i] + j] >= i) { 17140cd7f59aSBarry Smith anz = nz - j; 17150cd7f59aSBarry Smith break; 17160cd7f59aSBarry Smith } 
17170cd7f59aSBarry Smith } 17180cd7f59aSBarry Smith nz_max = PetscMax(nz_max,anz); 17190cd7f59aSBarry Smith nnz[i] = anz; 172038f409ebSLisandro Dalcin } 172138f409ebSLisandro Dalcin ierr = MatSeqSBAIJSetPreallocation(B,bs,0,nnz);CHKERRQ(ierr); 172238f409ebSLisandro Dalcin ierr = PetscFree(nnz);CHKERRQ(ierr); 172338f409ebSLisandro Dalcin 172438f409ebSLisandro Dalcin values = (PetscScalar*)V; 172538f409ebSLisandro Dalcin if (!values) { 17261795a4d1SJed Brown ierr = PetscCalloc1(bs*bs*nz_max,&values);CHKERRQ(ierr); 172738f409ebSLisandro Dalcin } 172838f409ebSLisandro Dalcin for (i=0; i<m; i++) { 172938f409ebSLisandro Dalcin PetscInt ncols = ii[i+1] - ii[i]; 173038f409ebSLisandro Dalcin const PetscInt *icols = jj + ii[i]; 173138f409ebSLisandro Dalcin if (!roworiented || bs == 1) { 173238f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs*bs*ii[i]) : 0); 173338f409ebSLisandro Dalcin ierr = MatSetValuesBlocked_SeqSBAIJ(B,1,&i,ncols,icols,svals,INSERT_VALUES);CHKERRQ(ierr); 173438f409ebSLisandro Dalcin } else { 173538f409ebSLisandro Dalcin for (j=0; j<ncols; j++) { 173638f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? 
(bs*bs*(ii[i]+j)) : 0); 173738f409ebSLisandro Dalcin ierr = MatSetValuesBlocked_SeqSBAIJ(B,1,&i,1,&icols[j],svals,INSERT_VALUES);CHKERRQ(ierr); 173838f409ebSLisandro Dalcin } 173938f409ebSLisandro Dalcin } 174038f409ebSLisandro Dalcin } 174138f409ebSLisandro Dalcin if (!V) { ierr = PetscFree(values);CHKERRQ(ierr); } 174238f409ebSLisandro Dalcin ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 174338f409ebSLisandro Dalcin ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 174438f409ebSLisandro Dalcin ierr = MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 174538f409ebSLisandro Dalcin PetscFunctionReturn(0); 174638f409ebSLisandro Dalcin } 174738f409ebSLisandro Dalcin 1748db4efbfdSBarry Smith /* 1749db4efbfdSBarry Smith This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization 1750db4efbfdSBarry Smith */ 1751ace3abfcSBarry Smith PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B,PetscBool natural) 1752db4efbfdSBarry Smith { 1753db4efbfdSBarry Smith PetscErrorCode ierr; 1754ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 1755db4efbfdSBarry Smith PetscInt bs = B->rmap->bs; 1756db4efbfdSBarry Smith 1757db4efbfdSBarry Smith PetscFunctionBegin; 1758c5929fdfSBarry Smith ierr = PetscOptionsGetBool(((PetscObject)B)->options,((PetscObject)B)->prefix,"-mat_no_unroll",&flg,NULL);CHKERRQ(ierr); 1759db4efbfdSBarry Smith if (flg) bs = 8; 1760db4efbfdSBarry Smith 1761db4efbfdSBarry Smith if (!natural) { 1762db4efbfdSBarry Smith switch (bs) { 1763db4efbfdSBarry Smith case 1: 1764d595f711SHong Zhang B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace; 1765db4efbfdSBarry Smith break; 1766db4efbfdSBarry Smith case 2: 1767db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2; 1768db4efbfdSBarry Smith break; 1769db4efbfdSBarry Smith case 3: 1770db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3; 
1771db4efbfdSBarry Smith break; 1772db4efbfdSBarry Smith case 4: 1773db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4; 1774db4efbfdSBarry Smith break; 1775db4efbfdSBarry Smith case 5: 1776db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5; 1777db4efbfdSBarry Smith break; 1778db4efbfdSBarry Smith case 6: 1779db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6; 1780db4efbfdSBarry Smith break; 1781db4efbfdSBarry Smith case 7: 1782db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7; 1783db4efbfdSBarry Smith break; 1784db4efbfdSBarry Smith default: 1785db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N; 1786db4efbfdSBarry Smith break; 1787db4efbfdSBarry Smith } 1788db4efbfdSBarry Smith } else { 1789db4efbfdSBarry Smith switch (bs) { 1790db4efbfdSBarry Smith case 1: 1791d595f711SHong Zhang B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace; 1792db4efbfdSBarry Smith break; 1793db4efbfdSBarry Smith case 2: 1794db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering; 1795db4efbfdSBarry Smith break; 1796db4efbfdSBarry Smith case 3: 1797db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering; 1798db4efbfdSBarry Smith break; 1799db4efbfdSBarry Smith case 4: 1800db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering; 1801db4efbfdSBarry Smith break; 1802db4efbfdSBarry Smith case 5: 1803db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering; 1804db4efbfdSBarry Smith break; 1805db4efbfdSBarry Smith case 6: 1806db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering; 1807db4efbfdSBarry Smith break; 
1808db4efbfdSBarry Smith case 7: 1809db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering; 1810db4efbfdSBarry Smith break; 1811db4efbfdSBarry Smith default: 1812db4efbfdSBarry Smith B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering; 1813db4efbfdSBarry Smith break; 1814db4efbfdSBarry Smith } 1815db4efbfdSBarry Smith } 1816db4efbfdSBarry Smith PetscFunctionReturn(0); 1817db4efbfdSBarry Smith } 1818db4efbfdSBarry Smith 1819cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType,MatReuse,Mat*); 1820cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType,MatReuse,Mat*); 1821d769727bSBarry Smith 1822cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A,MatFactorType ftype,Mat *B) 18235c9eb25fSBarry Smith { 1824d0f46423SBarry Smith PetscInt n = A->rmap->n; 18255c9eb25fSBarry Smith PetscErrorCode ierr; 18265c9eb25fSBarry Smith 18275c9eb25fSBarry Smith PetscFunctionBegin; 18280e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX) 1829eb1ec7c1SStefano Zampini if (A->hermitian && !A->symmetric && (ftype == MAT_FACTOR_CHOLESKY||ftype == MAT_FACTOR_ICC)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Hermitian CHOLESKY or ICC Factor is not supported"); 18300e92d65fSHong Zhang #endif 1831eb1ec7c1SStefano Zampini 1832ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr); 18335c9eb25fSBarry Smith ierr = MatSetSizes(*B,n,n,n,n);CHKERRQ(ierr); 18345c9eb25fSBarry Smith if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) { 18355c9eb25fSBarry Smith ierr = MatSetType(*B,MATSEQSBAIJ);CHKERRQ(ierr); 18360298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(*B,A->rmap->bs,MAT_SKIP_ALLOCATION,NULL);CHKERRQ(ierr); 183726fbe8dcSKarl Rupp 18387b056e98SHong Zhang (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ; 1839c6d0d4f0SHong Zhang 
(*B)->ops->iccfactorsymbolic = MatICCFactorSymbolic_SeqSBAIJ; 1840e32f2f54SBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Factor type not supported"); 184100c67f3bSHong Zhang 1842d5f3da31SBarry Smith (*B)->factortype = ftype; 18432c7c0729SBarry Smith (*B)->useordering = PETSC_TRUE; 184400c67f3bSHong Zhang ierr = PetscFree((*B)->solvertype);CHKERRQ(ierr); 184500c67f3bSHong Zhang ierr = PetscStrallocpy(MATSOLVERPETSC,&(*B)->solvertype);CHKERRQ(ierr); 18465c9eb25fSBarry Smith PetscFunctionReturn(0); 18475c9eb25fSBarry Smith } 18485c9eb25fSBarry Smith 18498397e458SBarry Smith /*@C 18508397e458SBarry Smith MatSeqSBAIJGetArray - gives access to the array where the data for a MATSEQSBAIJ matrix is stored 18518397e458SBarry Smith 18528397e458SBarry Smith Not Collective 18538397e458SBarry Smith 18548397e458SBarry Smith Input Parameter: 18558397e458SBarry Smith . mat - a MATSEQSBAIJ matrix 18568397e458SBarry Smith 18578397e458SBarry Smith Output Parameter: 18588397e458SBarry Smith . array - pointer to the data 18598397e458SBarry Smith 18608397e458SBarry Smith Level: intermediate 18618397e458SBarry Smith 18628397e458SBarry Smith .seealso: MatSeqSBAIJRestoreArray(), MatSeqAIJGetArray(), MatSeqAIJRestoreArray() 18638397e458SBarry Smith @*/ 18648397e458SBarry Smith PetscErrorCode MatSeqSBAIJGetArray(Mat A,PetscScalar **array) 18658397e458SBarry Smith { 18668397e458SBarry Smith PetscErrorCode ierr; 18678397e458SBarry Smith 18688397e458SBarry Smith PetscFunctionBegin; 18698397e458SBarry Smith ierr = PetscUseMethod(A,"MatSeqSBAIJGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 18708397e458SBarry Smith PetscFunctionReturn(0); 18718397e458SBarry Smith } 18728397e458SBarry Smith 18738397e458SBarry Smith /*@C 18748397e458SBarry Smith MatSeqSBAIJRestoreArray - returns access to the array where the data for a MATSEQSBAIJ matrix is stored obtained by MatSeqSBAIJGetArray() 18758397e458SBarry Smith 18768397e458SBarry Smith Not Collective 18778397e458SBarry Smith 
18788397e458SBarry Smith Input Parameters: 1879a2b725a8SWilliam Gropp + mat - a MATSEQSBAIJ matrix 1880a2b725a8SWilliam Gropp - array - pointer to the data 18818397e458SBarry Smith 18828397e458SBarry Smith Level: intermediate 18838397e458SBarry Smith 18848397e458SBarry Smith .seealso: MatSeqSBAIJGetArray(), MatSeqAIJGetArray(), MatSeqAIJRestoreArray() 18858397e458SBarry Smith @*/ 18868397e458SBarry Smith PetscErrorCode MatSeqSBAIJRestoreArray(Mat A,PetscScalar **array) 18878397e458SBarry Smith { 18888397e458SBarry Smith PetscErrorCode ierr; 18898397e458SBarry Smith 18908397e458SBarry Smith PetscFunctionBegin; 18918397e458SBarry Smith ierr = PetscUseMethod(A,"MatSeqSBAIJRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr); 18928397e458SBarry Smith PetscFunctionReturn(0); 18938397e458SBarry Smith } 18948397e458SBarry Smith 18950bad9183SKris Buschelman /*MC 1896fafad747SKris Buschelman MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices, 18970bad9183SKris Buschelman based on block compressed sparse row format. Only the upper triangular portion of the matrix is stored. 18980bad9183SKris Buschelman 1899828413b8SBarry Smith For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you 1900eb1ec7c1SStefano Zampini can call MatSetOption(Mat, MAT_HERMITIAN). 1901828413b8SBarry Smith 19020bad9183SKris Buschelman Options Database Keys: 19030bad9183SKris Buschelman . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to MatSetFromOptions() 19040bad9183SKris Buschelman 190595452b02SPatrick Sanan Notes: 190695452b02SPatrick Sanan By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not 190771dad5bbSBarry Smith stored and it is assumed they symmetric to the upper triangular). 
If you call MatSetOption(Mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_FALSE) or use 190871dad5bbSBarry Smith the options database -mat_ignore_lower_triangular false it will generate an error if you try to set a value in the lower triangular portion. 190971dad5bbSBarry Smith 1910476417e5SBarry Smith The number of rows in the matrix must be less than or equal to the number of columns 191171dad5bbSBarry Smith 19120bad9183SKris Buschelman Level: beginner 19130bad9183SKris Buschelman 1914476417e5SBarry Smith .seealso: MatCreateSeqSBAIJ(), MatType, MATMPISBAIJ 19150bad9183SKris Buschelman M*/ 19168cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B) 1917a23d5eceSKris Buschelman { 1918a23d5eceSKris Buschelman Mat_SeqSBAIJ *b; 1919dfbe8321SBarry Smith PetscErrorCode ierr; 192013f74950SBarry Smith PetscMPIInt size; 1921ace3abfcSBarry Smith PetscBool no_unroll = PETSC_FALSE,no_inode = PETSC_FALSE; 1922a23d5eceSKris Buschelman 1923a23d5eceSKris Buschelman PetscFunctionBegin; 1924ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr); 1925e32f2f54SBarry Smith if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Comm must be of size 1"); 1926a23d5eceSKris Buschelman 1927b00a9115SJed Brown ierr = PetscNewLog(B,&b);CHKERRQ(ierr); 1928a23d5eceSKris Buschelman B->data = (void*)b; 1929a23d5eceSKris Buschelman ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr); 193026fbe8dcSKarl Rupp 1931a23d5eceSKris Buschelman B->ops->destroy = MatDestroy_SeqSBAIJ; 1932a23d5eceSKris Buschelman B->ops->view = MatView_SeqSBAIJ; 1933*f4259b30SLisandro Dalcin b->row = NULL; 1934*f4259b30SLisandro Dalcin b->icol = NULL; 1935a23d5eceSKris Buschelman b->reallocs = 0; 1936*f4259b30SLisandro Dalcin b->saved_values = NULL; 19370def2e27SBarry Smith b->inode.limit = 5; 19380def2e27SBarry Smith b->inode.max_limit = 5; 1939a23d5eceSKris Buschelman 1940a23d5eceSKris Buschelman b->roworiented = PETSC_TRUE; 1941a23d5eceSKris 
Buschelman b->nonew = 0; 1942*f4259b30SLisandro Dalcin b->diag = NULL; 1943*f4259b30SLisandro Dalcin b->solve_work = NULL; 1944*f4259b30SLisandro Dalcin b->mult_work = NULL; 1945*f4259b30SLisandro Dalcin B->spptr = NULL; 1946f2cbd3d5SJed Brown B->info.nz_unneeded = (PetscReal)b->maxnz*b->bs2; 1947a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 1948a23d5eceSKris Buschelman 1949*f4259b30SLisandro Dalcin b->inew = NULL; 1950*f4259b30SLisandro Dalcin b->jnew = NULL; 1951*f4259b30SLisandro Dalcin b->anew = NULL; 1952*f4259b30SLisandro Dalcin b->a2anew = NULL; 1953a23d5eceSKris Buschelman b->permute = PETSC_FALSE; 1954a23d5eceSKris Buschelman 195571dad5bbSBarry Smith b->ignore_ltriangular = PETSC_TRUE; 195626fbe8dcSKarl Rupp 1957c5929fdfSBarry Smith ierr = PetscOptionsGetBool(((PetscObject)B)->options,((PetscObject)B)->prefix,"-mat_ignore_lower_triangular",&b->ignore_ltriangular,NULL);CHKERRQ(ierr); 1958941593c8SHong Zhang 1959f5edf698SHong Zhang b->getrow_utriangular = PETSC_FALSE; 196026fbe8dcSKarl Rupp 1961c5929fdfSBarry Smith ierr = PetscOptionsGetBool(((PetscObject)B)->options,((PetscObject)B)->prefix,"-mat_getrow_uppertriangular",&b->getrow_utriangular,NULL);CHKERRQ(ierr); 1962f5edf698SHong Zhang 19638397e458SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqSBAIJGetArray_C",MatSeqSBAIJGetArray_SeqSBAIJ);CHKERRQ(ierr); 19648397e458SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqSBAIJRestoreArray_C",MatSeqSBAIJRestoreArray_SeqSBAIJ);CHKERRQ(ierr); 1965bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqSBAIJ);CHKERRQ(ierr); 1966bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqSBAIJ);CHKERRQ(ierr); 1967bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqSBAIJSetColumnIndices_C",MatSeqSBAIJSetColumnIndices_SeqSBAIJ);CHKERRQ(ierr); 1968bdf89e91SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqsbaij_seqaij_C",MatConvert_SeqSBAIJ_SeqAIJ);CHKERRQ(ierr); 1969bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqsbaij_seqbaij_C",MatConvert_SeqSBAIJ_SeqBAIJ);CHKERRQ(ierr); 1970bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqSBAIJSetPreallocation_C",MatSeqSBAIJSetPreallocation_SeqSBAIJ);CHKERRQ(ierr); 197138f409ebSLisandro Dalcin ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqSBAIJSetPreallocationCSR_C",MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ);CHKERRQ(ierr); 19726214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 19736214f412SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqsbaij_elemental_C",MatConvert_SeqSBAIJ_Elemental);CHKERRQ(ierr); 19746214f412SHong Zhang #endif 1975d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 1976d24d4204SJose E. Roman ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqsbaij_scalapack_C",MatConvert_SBAIJ_ScaLAPACK);CHKERRQ(ierr); 1977d24d4204SJose E. 
Roman #endif 197823ce1328SBarry Smith 197923ce1328SBarry Smith B->symmetric = PETSC_TRUE; 198023ce1328SBarry Smith B->structurally_symmetric = PETSC_TRUE; 198123ce1328SBarry Smith B->symmetric_set = PETSC_TRUE; 198223ce1328SBarry Smith B->structurally_symmetric_set = PETSC_TRUE; 19839899f194SHong Zhang B->symmetric_eternal = PETSC_TRUE; 1984eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 198513647f61SHong Zhang B->hermitian = PETSC_FALSE; 198613647f61SHong Zhang B->hermitian_set = PETSC_FALSE; 1987eb1ec7c1SStefano Zampini #else 1988eb1ec7c1SStefano Zampini B->hermitian = PETSC_TRUE; 1989eb1ec7c1SStefano Zampini B->hermitian_set = PETSC_TRUE; 1990eb1ec7c1SStefano Zampini #endif 199113647f61SHong Zhang 199217667f90SBarry Smith ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQSBAIJ);CHKERRQ(ierr); 19930def2e27SBarry Smith 1994ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)B),((PetscObject)B)->prefix,"Options for SEQSBAIJ matrix","Mat");CHKERRQ(ierr); 19950298fd71SBarry Smith ierr = PetscOptionsBool("-mat_no_unroll","Do not optimize for inodes (slower)",NULL,no_unroll,&no_unroll,NULL);CHKERRQ(ierr); 199626fbe8dcSKarl Rupp if (no_unroll) { 199726fbe8dcSKarl Rupp ierr = PetscInfo(B,"Not using Inode routines due to -mat_no_unroll\n");CHKERRQ(ierr); 199826fbe8dcSKarl Rupp } 19990298fd71SBarry Smith ierr = PetscOptionsBool("-mat_no_inode","Do not optimize for inodes (slower)",NULL,no_inode,&no_inode,NULL);CHKERRQ(ierr); 200026fbe8dcSKarl Rupp if (no_inode) { 200126fbe8dcSKarl Rupp ierr = PetscInfo(B,"Not using Inode routines due to -mat_no_inode\n");CHKERRQ(ierr); 200226fbe8dcSKarl Rupp } 20030298fd71SBarry Smith ierr = PetscOptionsInt("-mat_inode_limit","Do not use inodes larger then this value",NULL,b->inode.limit,&b->inode.limit,NULL);CHKERRQ(ierr); 20040def2e27SBarry Smith ierr = PetscOptionsEnd();CHKERRQ(ierr); 2005ace3abfcSBarry Smith b->inode.use = (PetscBool)(!(no_unroll || no_inode)); 20060def2e27SBarry Smith if 
(b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit; 2007a23d5eceSKris Buschelman PetscFunctionReturn(0); 2008a23d5eceSKris Buschelman } 2009a23d5eceSKris Buschelman 2010a23d5eceSKris Buschelman /*@C 2011a23d5eceSKris Buschelman MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block 2012a23d5eceSKris Buschelman compressed row) format. For good matrix assembly performance the 2013a23d5eceSKris Buschelman user should preallocate the matrix storage by setting the parameter nz 2014a23d5eceSKris Buschelman (or the array nnz). By setting these parameters accurately, performance 2015a23d5eceSKris Buschelman during matrix assembly can be increased by more than a factor of 50. 2016a23d5eceSKris Buschelman 2017a23d5eceSKris Buschelman Collective on Mat 2018a23d5eceSKris Buschelman 2019a23d5eceSKris Buschelman Input Parameters: 20201c4f3114SJed Brown + B - the symmetric matrix 2021bb7ae925SBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use MatSetBlockSizes() to set a different row and column blocksize but the row 2022bb7ae925SBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs() 2023a23d5eceSKris Buschelman . 
nz - number of block nonzeros per block row (same for all rows)
-  nnz - array containing the number of block nonzeros in the upper triangular plus
         diagonal portion of each block (possibly different for each block row) or NULL

   Options Database Keys:
+   -mat_no_unroll - uses code that does not unroll the loops in the
                     block calculations (much slower)
-   -mat_block_size - size of the blocks to use (only works if a negative bs is passed in)

   Level: intermediate

   Notes:
   Specify the preallocated storage with either nz or nnz (not both).
   Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory
   allocation.  See Users-Manual: ch_mat for details.

   You can call MatGetInfo() to get information on how effective the preallocation was;
   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded.
   You can also run with the option -info and look for messages with the string
   malloc in them to see if additional memory allocation was needed.
2043aa95bbe8SBarry Smith 204449a6f317SBarry Smith If the nnz parameter is given then the nz parameter is ignored 204549a6f317SBarry Smith 204649a6f317SBarry Smith 204769b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatCreateSBAIJ() 2048a23d5eceSKris Buschelman @*/ 20497087cfbeSBarry Smith PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B,PetscInt bs,PetscInt nz,const PetscInt nnz[]) 205013f74950SBarry Smith { 20514ac538c5SBarry Smith PetscErrorCode ierr; 2052a23d5eceSKris Buschelman 2053a23d5eceSKris Buschelman PetscFunctionBegin; 20546ba663aaSJed Brown PetscValidHeaderSpecific(B,MAT_CLASSID,1); 20556ba663aaSJed Brown PetscValidType(B,1); 20566ba663aaSJed Brown PetscValidLogicalCollectiveInt(B,bs,2); 20574ac538c5SBarry Smith ierr = PetscTryMethod(B,"MatSeqSBAIJSetPreallocation_C",(Mat,PetscInt,PetscInt,const PetscInt[]),(B,bs,nz,nnz));CHKERRQ(ierr); 2058a23d5eceSKris Buschelman PetscFunctionReturn(0); 2059a23d5eceSKris Buschelman } 206049b5e25fSSatish Balay 206138f409ebSLisandro Dalcin /*@C 2062664954b6SBarry Smith MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in SBAIJ format using the given nonzero structure and (optional) numerical values 206338f409ebSLisandro Dalcin 206438f409ebSLisandro Dalcin Input Parameters: 20651c4f3114SJed Brown + B - the matrix 2066eab78319SHong Zhang . bs - size of block, the blocks are ALWAYS square. 206738f409ebSLisandro Dalcin . i - the indices into j for the start of each local row (starts with zero) 206838f409ebSLisandro Dalcin . j - the column indices for each local row (starts with zero) these must be sorted for each row 206938f409ebSLisandro Dalcin - v - optional values in the matrix 207038f409ebSLisandro Dalcin 2071664954b6SBarry Smith Level: advanced 207238f409ebSLisandro Dalcin 207338f409ebSLisandro Dalcin Notes: 207438f409ebSLisandro Dalcin The order of the entries in values is specified by the MatOption MAT_ROW_ORIENTED. 
For example, C programs 207538f409ebSLisandro Dalcin may want to use the default MAT_ROW_ORIENTED=PETSC_TRUE and use an array v[nnz][bs][bs] where the second index is 207638f409ebSLisandro Dalcin over rows within a block and the last index is over columns within a block row. Fortran programs will likely set 207738f409ebSLisandro Dalcin MAT_ROW_ORIENTED=PETSC_FALSE and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a 207838f409ebSLisandro Dalcin block column and the second index is over columns within a block. 207938f409ebSLisandro Dalcin 208050c5228eSBarry Smith Any entries below the diagonal are ignored 20810cd7f59aSBarry Smith 20820cd7f59aSBarry Smith Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries 20830cd7f59aSBarry Smith and usually the numerical values as well 2084664954b6SBarry Smith 208538f409ebSLisandro Dalcin .seealso: MatCreate(), MatCreateSeqSBAIJ(), MatSetValuesBlocked(), MatSeqSBAIJSetPreallocation(), MATSEQSBAIJ 208638f409ebSLisandro Dalcin @*/ 208738f409ebSLisandro Dalcin PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B,PetscInt bs,const PetscInt i[],const PetscInt j[], const PetscScalar v[]) 208838f409ebSLisandro Dalcin { 208938f409ebSLisandro Dalcin PetscErrorCode ierr; 209038f409ebSLisandro Dalcin 209138f409ebSLisandro Dalcin PetscFunctionBegin; 209238f409ebSLisandro Dalcin PetscValidHeaderSpecific(B,MAT_CLASSID,1); 209338f409ebSLisandro Dalcin PetscValidType(B,1); 209438f409ebSLisandro Dalcin PetscValidLogicalCollectiveInt(B,bs,2); 209538f409ebSLisandro Dalcin ierr = PetscTryMethod(B,"MatSeqSBAIJSetPreallocationCSR_C",(Mat,PetscInt,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,bs,i,j,v));CHKERRQ(ierr); 209638f409ebSLisandro Dalcin PetscFunctionReturn(0); 209738f409ebSLisandro Dalcin } 209838f409ebSLisandro Dalcin 2099c464158bSHong Zhang /*@C 2100c464158bSHong Zhang MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in block AIJ 
(block
   compressed row) format.  For good matrix assembly performance the
   user should preallocate the matrix storage by setting the parameter nz
   (or the array nnz).  By setting these parameters accurately, performance
   during matrix assembly can be increased by more than a factor of 50.

   Collective

   Input Parameters:
+  comm - MPI communicator, set to PETSC_COMM_SELF
.  bs - size of block, the blocks are ALWAYS square. One can use MatSetBlockSizes() to set a different row and column blocksize but the row
          blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs()
.  m - number of rows
.  n - number of columns
.  nz - number of block nonzeros per block row (same for all rows)
-  nnz - array containing the number of block nonzeros in the upper triangular plus
         diagonal portion of each block (possibly different for each block row) or NULL

   Output Parameter:
.  A - the symmetric matrix

   Options Database Keys:
+   -mat_no_unroll - uses code that does not unroll the loops in the
                     block calculations (much slower)
-   -mat_block_size - size of the blocks to use

   Level: intermediate

   It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(),
   MatXXXXSetPreallocation() paradigm instead of this routine directly.
2129175b88e8SBarry Smith [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation] 2130175b88e8SBarry Smith 2131c464158bSHong Zhang Notes: 21326d6d819aSHong Zhang The number of rows and columns must be divisible by blocksize. 21336d6d819aSHong Zhang This matrix type does not support complex Hermitian operation. 2134c464158bSHong Zhang 2135c464158bSHong Zhang Specify the preallocated storage with either nz or nnz (not both). 21360298fd71SBarry Smith Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory 2137a7f22e61SSatish Balay allocation. See Users-Manual: ch_mat for details. 2138c464158bSHong Zhang 213949a6f317SBarry Smith If the nnz parameter is given then the nz parameter is ignored 214049a6f317SBarry Smith 214169b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatCreateSBAIJ() 2142c464158bSHong Zhang @*/ 21437087cfbeSBarry Smith PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm,PetscInt bs,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A) 2144c464158bSHong Zhang { 2145dfbe8321SBarry Smith PetscErrorCode ierr; 2146c464158bSHong Zhang 2147c464158bSHong Zhang PetscFunctionBegin; 2148f69a0ea3SMatthew Knepley ierr = MatCreate(comm,A);CHKERRQ(ierr); 2149f69a0ea3SMatthew Knepley ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr); 2150c464158bSHong Zhang ierr = MatSetType(*A,MATSEQSBAIJ);CHKERRQ(ierr); 2151367daffbSBarry Smith ierr = MatSeqSBAIJSetPreallocation(*A,bs,nz,(PetscInt*)nnz);CHKERRQ(ierr); 215249b5e25fSSatish Balay PetscFunctionReturn(0); 215349b5e25fSSatish Balay } 215449b5e25fSSatish Balay 2155dfbe8321SBarry Smith PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B) 215649b5e25fSSatish Balay { 215749b5e25fSSatish Balay Mat C; 215849b5e25fSSatish Balay Mat_SeqSBAIJ *c,*a = (Mat_SeqSBAIJ*)A->data; 21596849ba73SBarry Smith PetscErrorCode ierr; 2160b40805acSSatish Balay PetscInt i,mbs = a->mbs,nz = a->nz,bs2 =a->bs2; 216149b5e25fSSatish Balay 216249b5e25fSSatish Balay 
PetscFunctionBegin; 2163e32f2f54SBarry Smith if (a->i[mbs] != nz) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Corrupt matrix"); 216449b5e25fSSatish Balay 2165*f4259b30SLisandro Dalcin *B = NULL; 2166ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr); 2167d0f46423SBarry Smith ierr = MatSetSizes(C,A->rmap->N,A->cmap->n,A->rmap->N,A->cmap->n);CHKERRQ(ierr); 21684c7a3774SStefano Zampini ierr = MatSetBlockSizesFromMats(C,A,A);CHKERRQ(ierr); 21698e9a0fb8SHong Zhang ierr = MatSetType(C,MATSEQSBAIJ);CHKERRQ(ierr); 2170692f9cbeSHong Zhang c = (Mat_SeqSBAIJ*)C->data; 2171692f9cbeSHong Zhang 2172273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2173d5f3da31SBarry Smith C->factortype = A->factortype; 2174*f4259b30SLisandro Dalcin c->row = NULL; 2175*f4259b30SLisandro Dalcin c->icol = NULL; 2176*f4259b30SLisandro Dalcin c->saved_values = NULL; 2177a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 217849b5e25fSSatish Balay C->assembled = PETSC_TRUE; 217949b5e25fSSatish Balay 21801e1e43feSBarry Smith ierr = PetscLayoutReference(A->rmap,&C->rmap);CHKERRQ(ierr); 21811e1e43feSBarry Smith ierr = PetscLayoutReference(A->cmap,&C->cmap);CHKERRQ(ierr); 218249b5e25fSSatish Balay c->bs2 = a->bs2; 218349b5e25fSSatish Balay c->mbs = a->mbs; 218449b5e25fSSatish Balay c->nbs = a->nbs; 218549b5e25fSSatish Balay 2186c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2187c760cd28SBarry Smith c->imax = a->imax; 2188c760cd28SBarry Smith c->ilen = a->ilen; 2189c760cd28SBarry Smith c->free_imax_ilen = PETSC_FALSE; 2190c760cd28SBarry Smith } else { 2191dcca6d9dSJed Brown ierr = PetscMalloc2((mbs+1),&c->imax,(mbs+1),&c->ilen);CHKERRQ(ierr); 21923bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C,2*(mbs+1)*sizeof(PetscInt));CHKERRQ(ierr); 219349b5e25fSSatish Balay for (i=0; i<mbs; i++) { 219449b5e25fSSatish Balay c->imax[i] = a->imax[i]; 219549b5e25fSSatish Balay c->ilen[i] = a->ilen[i]; 219649b5e25fSSatish Balay } 
2197c760cd28SBarry Smith c->free_imax_ilen = PETSC_TRUE; 2198c760cd28SBarry Smith } 219949b5e25fSSatish Balay 220049b5e25fSSatish Balay /* allocate the matrix space */ 22014da8f245SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2202785e854fSJed Brown ierr = PetscMalloc1(bs2*nz,&c->a);CHKERRQ(ierr); 22033bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C,nz*bs2*sizeof(MatScalar));CHKERRQ(ierr); 220444e1c64aSLisandro Dalcin c->i = a->i; 220544e1c64aSLisandro Dalcin c->j = a->j; 22064da8f245SBarry Smith c->singlemalloc = PETSC_FALSE; 220744e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 22084da8f245SBarry Smith c->free_ij = PETSC_FALSE; 22094da8f245SBarry Smith c->parent = A; 22104da8f245SBarry Smith ierr = PetscObjectReference((PetscObject)A);CHKERRQ(ierr); 22114da8f245SBarry Smith ierr = MatSetOption(A,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 22124da8f245SBarry Smith ierr = MatSetOption(C,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 22134da8f245SBarry Smith } else { 2214dcca6d9dSJed Brown ierr = PetscMalloc3(bs2*nz,&c->a,nz,&c->j,mbs+1,&c->i);CHKERRQ(ierr); 2215580bdb30SBarry Smith ierr = PetscArraycpy(c->i,a->i,mbs+1);CHKERRQ(ierr); 22163bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C,(mbs+1)*sizeof(PetscInt) + nz*(bs2*sizeof(MatScalar) + sizeof(PetscInt)));CHKERRQ(ierr); 22174da8f245SBarry Smith c->singlemalloc = PETSC_TRUE; 221844e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 22194da8f245SBarry Smith c->free_ij = PETSC_TRUE; 22204da8f245SBarry Smith } 222149b5e25fSSatish Balay if (mbs > 0) { 22224da8f245SBarry Smith if (cpvalues != MAT_SHARE_NONZERO_PATTERN) { 2223580bdb30SBarry Smith ierr = PetscArraycpy(c->j,a->j,nz);CHKERRQ(ierr); 22244da8f245SBarry Smith } 222549b5e25fSSatish Balay if (cpvalues == MAT_COPY_VALUES) { 2226580bdb30SBarry Smith ierr = PetscArraycpy(c->a,a->a,bs2*nz);CHKERRQ(ierr); 222749b5e25fSSatish Balay } else { 2228580bdb30SBarry Smith ierr = 
PetscArrayzero(c->a,bs2*nz);CHKERRQ(ierr); 222949b5e25fSSatish Balay } 2230a1c3900fSBarry Smith if (a->jshort) { 223144e1c64aSLisandro Dalcin /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */ 223244e1c64aSLisandro Dalcin /* if the parent matrix is reassembled, this child matrix will never notice */ 2233785e854fSJed Brown ierr = PetscMalloc1(nz,&c->jshort);CHKERRQ(ierr); 22343bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C,nz*sizeof(unsigned short));CHKERRQ(ierr); 2235580bdb30SBarry Smith ierr = PetscArraycpy(c->jshort,a->jshort,nz);CHKERRQ(ierr); 223626fbe8dcSKarl Rupp 22374da8f245SBarry Smith c->free_jshort = PETSC_TRUE; 22384da8f245SBarry Smith } 2239a1c3900fSBarry Smith } 224049b5e25fSSatish Balay 224149b5e25fSSatish Balay c->roworiented = a->roworiented; 224249b5e25fSSatish Balay c->nonew = a->nonew; 224349b5e25fSSatish Balay 224449b5e25fSSatish Balay if (a->diag) { 2245c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2246c760cd28SBarry Smith c->diag = a->diag; 2247c760cd28SBarry Smith c->free_diag = PETSC_FALSE; 2248c760cd28SBarry Smith } else { 2249785e854fSJed Brown ierr = PetscMalloc1(mbs,&c->diag);CHKERRQ(ierr); 22503bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)C,mbs*sizeof(PetscInt));CHKERRQ(ierr); 225126fbe8dcSKarl Rupp for (i=0; i<mbs; i++) c->diag[i] = a->diag[i]; 2252c760cd28SBarry Smith c->free_diag = PETSC_TRUE; 2253c760cd28SBarry Smith } 225444e1c64aSLisandro Dalcin } 22556c6c5352SBarry Smith c->nz = a->nz; 2256f2cbd3d5SJed Brown c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 2257*f4259b30SLisandro Dalcin c->solve_work = NULL; 2258*f4259b30SLisandro Dalcin c->mult_work = NULL; 225926fbe8dcSKarl Rupp 226049b5e25fSSatish Balay *B = C; 2261140e18c1SBarry Smith ierr = PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist);CHKERRQ(ierr); 226249b5e25fSSatish Balay PetscFunctionReturn(0); 226349b5e25fSSatish Balay } 226449b5e25fSSatish Balay 
2265618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */ 2266618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary 2267618cc2edSLisandro Dalcin 2268618cc2edSLisandro Dalcin PetscErrorCode MatLoad_SeqSBAIJ(Mat mat,PetscViewer viewer) 22692f480046SShri Abhyankar { 22702f480046SShri Abhyankar PetscErrorCode ierr; 22717f489da9SVaclav Hapla PetscBool isbinary; 22722f480046SShri Abhyankar 22732f480046SShri Abhyankar PetscFunctionBegin; 22747f489da9SVaclav Hapla ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 2275618cc2edSLisandro Dalcin if (!isbinary) SETERRQ2(PetscObjectComm((PetscObject)viewer),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)mat)->type_name); 2276618cc2edSLisandro Dalcin ierr = MatLoad_SeqSBAIJ_Binary(mat,viewer);CHKERRQ(ierr); 22772f480046SShri Abhyankar PetscFunctionReturn(0); 22782f480046SShri Abhyankar } 22792f480046SShri Abhyankar 2280c75a6043SHong Zhang /*@ 2281c75a6043SHong Zhang MatCreateSeqSBAIJWithArrays - Creates an sequential SBAIJ matrix using matrix elements 2282c75a6043SHong Zhang (upper triangular entries in CSR format) provided by the user. 2283c75a6043SHong Zhang 2284d083f849SBarry Smith Collective 2285c75a6043SHong Zhang 2286c75a6043SHong Zhang Input Parameters: 2287c75a6043SHong Zhang + comm - must be an MPI communicator of size 1 2288c75a6043SHong Zhang . bs - size of block 2289c75a6043SHong Zhang . m - number of rows 2290c75a6043SHong Zhang . n - number of columns 2291483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that row block row of the matrix 2292c75a6043SHong Zhang . j - column indices 2293c75a6043SHong Zhang - a - matrix values 2294c75a6043SHong Zhang 2295c75a6043SHong Zhang Output Parameter: 2296c75a6043SHong Zhang . 
mat - the matrix 2297c75a6043SHong Zhang 2298dfb205c3SBarry Smith Level: advanced 2299c75a6043SHong Zhang 2300c75a6043SHong Zhang Notes: 2301c75a6043SHong Zhang The i, j, and a arrays are not copied by this routine, the user must free these arrays 2302c75a6043SHong Zhang once the matrix is destroyed 2303c75a6043SHong Zhang 2304c75a6043SHong Zhang You cannot set new nonzero locations into this matrix, that will generate an error. 2305c75a6043SHong Zhang 2306c75a6043SHong Zhang The i and j indices are 0 based 2307c75a6043SHong Zhang 2308dfb205c3SBarry Smith When block size is greater than 1 the matrix values must be stored using the SBAIJ storage format (see the SBAIJ code to determine this). For block size of 1 2309dfb205c3SBarry Smith it is the regular CSR format excluding the lower triangular elements. 2310dfb205c3SBarry Smith 231169b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateSBAIJ(), MatCreateSeqSBAIJ() 2312c75a6043SHong Zhang 2313c75a6043SHong Zhang @*/ 2314c3c607ccSBarry Smith PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm,PetscInt bs,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat) 2315c75a6043SHong Zhang { 2316c75a6043SHong Zhang PetscErrorCode ierr; 2317c75a6043SHong Zhang PetscInt ii; 2318c75a6043SHong Zhang Mat_SeqSBAIJ *sbaij; 2319c75a6043SHong Zhang 2320c75a6043SHong Zhang PetscFunctionBegin; 2321e32f2f54SBarry Smith if (bs != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"block size %D > 1 is not supported yet",bs); 232241096f02SStefano Zampini if (m > 0 && i[0]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0"); 2323c75a6043SHong Zhang 2324c75a6043SHong Zhang ierr = MatCreate(comm,mat);CHKERRQ(ierr); 2325c75a6043SHong Zhang ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr); 2326c75a6043SHong Zhang ierr = MatSetType(*mat,MATSEQSBAIJ);CHKERRQ(ierr); 2327*f4259b30SLisandro Dalcin ierr = MatSeqSBAIJSetPreallocation(*mat,bs,MAT_SKIP_ALLOCATION,NULL);CHKERRQ(ierr); 2328c75a6043SHong Zhang 
sbaij = (Mat_SeqSBAIJ*)(*mat)->data; 2329dcca6d9dSJed Brown ierr = PetscMalloc2(m,&sbaij->imax,m,&sbaij->ilen);CHKERRQ(ierr); 23303bb1ff40SBarry Smith ierr = PetscLogObjectMemory((PetscObject)*mat,2*m*sizeof(PetscInt));CHKERRQ(ierr); 2331c75a6043SHong Zhang 2332c75a6043SHong Zhang sbaij->i = i; 2333c75a6043SHong Zhang sbaij->j = j; 2334c75a6043SHong Zhang sbaij->a = a; 233526fbe8dcSKarl Rupp 2336c75a6043SHong Zhang sbaij->singlemalloc = PETSC_FALSE; 2337c75a6043SHong Zhang sbaij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 2338e6b907acSBarry Smith sbaij->free_a = PETSC_FALSE; 2339e6b907acSBarry Smith sbaij->free_ij = PETSC_FALSE; 2340ddf7884eSMatthew Knepley sbaij->free_imax_ilen = PETSC_TRUE; 2341c75a6043SHong Zhang 2342c75a6043SHong Zhang for (ii=0; ii<m; ii++) { 2343c75a6043SHong Zhang sbaij->ilen[ii] = sbaij->imax[ii] = i[ii+1] - i[ii]; 2344cf9c20a2SJed Brown if (PetscUnlikelyDebug(i[ii+1] - i[ii] < 0)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %d length = %d",ii,i[ii+1] - i[ii]); 2345c75a6043SHong Zhang } 234676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 2347c75a6043SHong Zhang for (ii=0; ii<sbaij->i[m]; ii++) { 2348e32f2f54SBarry Smith if (j[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %d index = %d",ii,j[ii]); 2349e32f2f54SBarry Smith if (j[ii] > n - 1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %d index = %d",ii,j[ii]); 2350c75a6043SHong Zhang } 235176bd3646SJed Brown } 2352c75a6043SHong Zhang 2353c75a6043SHong Zhang ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2354c75a6043SHong Zhang ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2355c75a6043SHong Zhang PetscFunctionReturn(0); 2356c75a6043SHong Zhang } 2357d06b337dSHong Zhang 235859f5e6ceSHong Zhang PetscErrorCode 
MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat) 235959f5e6ceSHong Zhang { 236059f5e6ceSHong Zhang PetscErrorCode ierr; 23618761c3d6SHong Zhang PetscMPIInt size; 236259f5e6ceSHong Zhang 236359f5e6ceSHong Zhang PetscFunctionBegin; 23648761c3d6SHong Zhang ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 23658761c3d6SHong Zhang if (size == 1 && scall == MAT_REUSE_MATRIX) { 23668761c3d6SHong Zhang ierr = MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 23678761c3d6SHong Zhang } else { 236859f5e6ceSHong Zhang ierr = MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm,inmat,n,scall,outmat);CHKERRQ(ierr); 23698761c3d6SHong Zhang } 237059f5e6ceSHong Zhang PetscFunctionReturn(0); 237159f5e6ceSHong Zhang } 2372