149b5e25fSSatish Balay 249b5e25fSSatish Balay /* 3a1373b80SHong Zhang Defines the basic matrix operations for the SBAIJ (compressed row) 449b5e25fSSatish Balay matrix storage format. 549b5e25fSSatish Balay */ 6c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 8c6db04a5SJed Brown #include <petscblaslapack.h> 949b5e25fSSatish Balay 10c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1170dcbbb9SBarry Smith #define USESHORT 12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1370dcbbb9SBarry Smith 14*26cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 15*26cec326SBarry Smith #define TYPE SBAIJ 16*26cec326SBarry Smith #define TYPE_SBAIJ 17*26cec326SBarry Smith #define TYPE_BS 18*26cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 19*26cec326SBarry Smith #undef TYPE_BS 20*26cec326SBarry Smith #define TYPE_BS _BS 21*26cec326SBarry Smith #define TYPE_BS_ON 22*26cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 23*26cec326SBarry Smith #undef TYPE_BS 24*26cec326SBarry Smith #undef TYPE_SBAIJ 25*26cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 26*26cec326SBarry Smith #undef TYPE 27*26cec326SBarry Smith #undef TYPE_BS_ON 28*26cec326SBarry Smith 296214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 30cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 316214f412SHong Zhang #endif 32d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 33d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 34d24d4204SJose E. Roman #endif 3528d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat, MatType, MatReuse, Mat *); 36b5b17502SBarry Smith 3749b5e25fSSatish Balay /* 3849b5e25fSSatish Balay Checks for missing diagonals 3949b5e25fSSatish Balay */ 40d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A, PetscBool *missing, PetscInt *dd) 41d71ae5a4SJacob Faibussowitsch { 42045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 437734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 4449b5e25fSSatish Balay 4549b5e25fSSatish Balay PetscFunctionBegin; 469566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(A)); 472af78befSBarry Smith *missing = PETSC_FALSE; 487734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 49358d2f5dSShri Abhyankar *missing = PETSC_TRUE; 50358d2f5dSShri Abhyankar if (dd) *dd = 0; 519566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 52358d2f5dSShri Abhyankar } else { 53358d2f5dSShri Abhyankar diag = a->diag; 5449b5e25fSSatish Balay for (i = 0; i < a->mbs; i++) { 557734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 562af78befSBarry Smith *missing = PETSC_TRUE; 572af78befSBarry Smith if (dd) *dd = i; 582af78befSBarry Smith break; 592af78befSBarry Smith } 6049b5e25fSSatish Balay } 61358d2f5dSShri Abhyankar } 623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6349b5e25fSSatish Balay } 6449b5e25fSSatish Balay 65d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A) 66d71ae5a4SJacob Faibussowitsch { 67045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 6848dd3d27SHong Zhang PetscInt i, j; 6949b5e25fSSatish Balay 7049b5e25fSSatish Balay PetscFunctionBegin; 7109f38230SBarry Smith if (!a->diag) { 729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->mbs, &a->diag)); 73c760cd28SBarry Smith a->free_diag = PETSC_TRUE; 7409f38230SBarry Smith } 7548dd3d27SHong Zhang for (i = 0; i < a->mbs; i++) { 7648dd3d27SHong Zhang a->diag[i] = a->i[i + 1]; 7748dd3d27SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 7848dd3d27SHong Zhang if (a->j[j] == i) { 7948dd3d27SHong Zhang a->diag[i] = j; 8048dd3d27SHong Zhang break; 8148dd3d27SHong Zhang } 8248dd3d27SHong Zhang } 8348dd3d27SHong Zhang } 843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8549b5e25fSSatish Balay } 8649b5e25fSSatish Balay 87d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *inia[], const PetscInt *inja[], PetscBool *done) 88d71ae5a4SJacob Faibussowitsch { 89a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 902462f5fdSStefano Zampini PetscInt i, j, n = a->mbs, nz = a->i[n], *tia, *tja, bs = A->rmap->bs, k, l, cnt; 912462f5fdSStefano Zampini PetscInt **ia = (PetscInt **)inia, **ja = (PetscInt **)inja; 9249b5e25fSSatish Balay 9349b5e25fSSatish Balay PetscFunctionBegin; 94d3e5a4abSHong Zhang *nn = n; 953ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 962462f5fdSStefano Zampini if (symmetric) { 979566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(n, a->i, a->j, PETSC_FALSE, 0, 0, &tia, &tja)); 982462f5fdSStefano Zampini nz = tia[n]; 992462f5fdSStefano Zampini } else { 1009371c9d4SSatish Balay tia = a->i; 1019371c9d4SSatish Balay tja = a->j; 1022462f5fdSStefano Zampini } 1032462f5fdSStefano Zampini 1042462f5fdSStefano Zampini if (!blockcompressed && bs > 1) { 1052462f5fdSStefano Zampini (*nn) *= bs; 1068f7157efSSatish Balay /* malloc & create the natural set of indices */ 1079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1((n + 1) * bs, ia)); 1082462f5fdSStefano Zampini if (n) { 1092462f5fdSStefano Zampini (*ia)[0] = oshift; 110ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[j] = (tia[1] - tia[0]) * bs + (*ia)[j - 1]; 1112462f5fdSStefano Zampini } 1122462f5fdSStefano Zampini 1132462f5fdSStefano Zampini for (i = 1; i < n; i++) { 1142462f5fdSStefano Zampini (*ia)[i * bs] = (tia[i] - tia[i - 1]) * bs + (*ia)[i * bs - 1]; 115ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[i * bs + j] = (tia[i + 1] - tia[i]) * bs + (*ia)[i * bs + j - 1]; 1162462f5fdSStefano Zampini } 117ad540459SPierre Jolivet if (n) (*ia)[n * bs] = (tia[n] - tia[n - 1]) * bs + (*ia)[n * bs - 1]; 1182462f5fdSStefano Zampini 1192462f5fdSStefano Zampini if (inja) { 1209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz * bs * bs, ja)); 1212462f5fdSStefano Zampini cnt = 0; 1222462f5fdSStefano Zampini for (i = 0; i < n; i++) { 1238f7157efSSatish Balay for (j = 0; j < bs; j++) { 1242462f5fdSStefano Zampini for (k = tia[i]; k < tia[i + 1]; k++) { 125ad540459SPierre Jolivet for (l = 0; l < bs; l++) (*ja)[cnt++] = bs * tja[k] + l; 1268f7157efSSatish Balay } 1278f7157efSSatish Balay } 1288f7157efSSatish Balay } 1298f7157efSSatish Balay } 1302462f5fdSStefano Zampini 1312462f5fdSStefano Zampini if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */ 1329566063dSJacob Faibussowitsch PetscCall(PetscFree(tia)); 1339566063dSJacob Faibussowitsch PetscCall(PetscFree(tja)); 1342462f5fdSStefano Zampini } 1352462f5fdSStefano Zampini } else if (oshift == 1) { 1362462f5fdSStefano Zampini if (symmetric) { 1372462f5fdSStefano Zampini nz = tia[A->rmap->n / bs]; 1382462f5fdSStefano Zampini /* add 1 to i and j indices */ 1392462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) tia[i] = tia[i] + 1; 1402462f5fdSStefano Zampini *ia = tia; 1412462f5fdSStefano Zampini if (ja) { 1422462f5fdSStefano Zampini for (i = 0; i < nz; i++) tja[i] = tja[i] + 1; 1432462f5fdSStefano Zampini *ja = tja; 1442462f5fdSStefano Zampini } 1452462f5fdSStefano Zampini } else { 1462462f5fdSStefano Zampini nz = a->i[A->rmap->n / bs]; 1472462f5fdSStefano Zampini /* malloc space and add 1 to i and j indices */ 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n / bs + 1, ia)); 1492462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) (*ia)[i] = a->i[i] + 1; 1502462f5fdSStefano Zampini if (ja) { 1519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, ja)); 1522462f5fdSStefano Zampini for (i = 0; i < nz; i++) (*ja)[i] = a->j[i] + 1; 1532462f5fdSStefano Zampini } 1542462f5fdSStefano Zampini } 1552462f5fdSStefano Zampini } else { 1562462f5fdSStefano Zampini *ia = tia; 1572462f5fdSStefano Zampini if (ja) *ja = tja; 158a6ece127SHong Zhang } 1593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16049b5e25fSSatish Balay } 16149b5e25fSSatish Balay 162d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 163d71ae5a4SJacob Faibussowitsch { 16449b5e25fSSatish Balay PetscFunctionBegin; 1653ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 1662462f5fdSStefano Zampini if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) { 1679566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 1689566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 169a6ece127SHong Zhang } 1703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17149b5e25fSSatish Balay } 17249b5e25fSSatish Balay 173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqSBAIJ(Mat A) 174d71ae5a4SJacob Faibussowitsch { 17549b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 17649b5e25fSSatish Balay 17749b5e25fSSatish Balay PetscFunctionBegin; 178a9f03627SSatish Balay #if defined(PETSC_USE_LOG) 1793ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->N, a->nz)); 180a9f03627SSatish Balay #endif 1819566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 1829566063dSJacob Faibussowitsch if (a->free_diag) PetscCall(PetscFree(a->diag)); 1839566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1849566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1859566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 1869566063dSJacob Faibussowitsch PetscCall(PetscFree(a->idiag)); 1879566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inode.size)); 1889566063dSJacob Faibussowitsch if (a->free_imax_ilen) PetscCall(PetscFree2(a->imax, a->ilen)); 1899566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 1909566063dSJacob Faibussowitsch PetscCall(PetscFree(a->sor_work)); 1919566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solves_work)); 1929566063dSJacob Faibussowitsch PetscCall(PetscFree(a->mult_work)); 1939566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 1949566063dSJacob Faibussowitsch if (a->free_jshort) PetscCall(PetscFree(a->jshort)); 1959566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inew)); 1969566063dSJacob Faibussowitsch PetscCall(MatDestroy(&a->parent)); 1979566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 198901853e0SKris Buschelman 1999566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 2002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJGetArray_C", NULL)); 2012e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJRestoreArray_C", NULL)); 2029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 2039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 2049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetColumnIndices_C", NULL)); 2059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqaij_C", NULL)); 2069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqbaij_C", NULL)); 2079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocation_C", NULL)); 2089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocationCSR_C", NULL)); 2096214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_elemental_C", NULL)); 2116214f412SHong Zhang #endif 212d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 2139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_scalapack_C", NULL)); 214d24d4204SJose E. Roman #endif 2152e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 2163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 21749b5e25fSSatish Balay } 21849b5e25fSSatish Balay 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqSBAIJ(Mat A, MatOption op, PetscBool flg) 220d71ae5a4SJacob Faibussowitsch { 221045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 222eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 223eb1ec7c1SStefano Zampini PetscInt bs; 224eb1ec7c1SStefano Zampini #endif 22549b5e25fSSatish Balay 22649b5e25fSSatish Balay PetscFunctionBegin; 227eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 2289566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 229eb1ec7c1SStefano Zampini #endif 2304d9d31abSKris Buschelman switch (op) { 231d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 232d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 233d71ae5a4SJacob Faibussowitsch break; 234d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 235d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 236d71ae5a4SJacob Faibussowitsch break; 237d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 238d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 239d71ae5a4SJacob Faibussowitsch break; 240d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 241d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 242d71ae5a4SJacob Faibussowitsch break; 243d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 244d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 245d71ae5a4SJacob Faibussowitsch break; 246d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 247d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 248d71ae5a4SJacob Faibussowitsch break; 2498c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 2504d9d31abSKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 2514d9d31abSKris Buschelman case MAT_USE_HASH_TABLE: 252d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 253d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 254d71ae5a4SJacob Faibussowitsch break; 2559a4540c5SBarry Smith case MAT_HERMITIAN: 256eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 257eb1ec7c1SStefano Zampini if (flg) { /* disable transpose ops */ 25808401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for Hermitian with block size greater than 1"); 259eb1ec7c1SStefano Zampini A->ops->multtranspose = NULL; 260eb1ec7c1SStefano Zampini A->ops->multtransposeadd = NULL; 261b94d7dedSBarry Smith A->symmetric = PETSC_BOOL3_FALSE; 262eb1ec7c1SStefano Zampini } 2630f2140c7SStefano Zampini #endif 264eeffb40dSHong Zhang break; 26577e54ba9SKris Buschelman case MAT_SYMMETRIC: 266eb1ec7c1SStefano Zampini case MAT_SPD: 267eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 268eb1ec7c1SStefano Zampini if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */ 269eb1ec7c1SStefano Zampini A->ops->multtranspose = A->ops->mult; 270eb1ec7c1SStefano Zampini A->ops->multtransposeadd = A->ops->multadd; 271eb1ec7c1SStefano Zampini } 272eb1ec7c1SStefano Zampini #endif 273eb1ec7c1SStefano Zampini break; 274eb1ec7c1SStefano Zampini /* These options are handled directly by MatSetOption() */ 27577e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 2769a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 277b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 278672ba085SHong Zhang case MAT_STRUCTURE_ONLY: 279b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 2804dcd73b1SHong Zhang /* These options are handled directly by MatSetOption() */ 281290bbb0aSBarry Smith break; 282d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_LOWER_TRIANGULAR: 283d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 284d71ae5a4SJacob Faibussowitsch break; 285d71ae5a4SJacob Faibussowitsch case MAT_ERROR_LOWER_TRIANGULAR: 286d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 287d71ae5a4SJacob Faibussowitsch break; 288d71ae5a4SJacob Faibussowitsch case MAT_GETROW_UPPERTRIANGULAR: 289d71ae5a4SJacob Faibussowitsch a->getrow_utriangular = flg; 290d71ae5a4SJacob Faibussowitsch break; 291d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 292d71ae5a4SJacob Faibussowitsch break; 293d71ae5a4SJacob Faibussowitsch default: 294d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 29549b5e25fSSatish Balay } 2963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29749b5e25fSSatish Balay } 29849b5e25fSSatish Balay 299d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 300d71ae5a4SJacob Faibussowitsch { 30149b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 30249b5e25fSSatish Balay 30349b5e25fSSatish Balay PetscFunctionBegin; 30408401ef6SPierre Jolivet PetscCheck(!A || a->getrow_utriangular, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatGetRow is not supported for SBAIJ matrix format. Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()"); 30552768537SHong Zhang 306f5edf698SHong Zhang /* Get the upper triangular part of the row */ 3079566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqBAIJ_private(A, row, nz, idx, v, a->i, a->j, a->a)); 3083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 30949b5e25fSSatish Balay } 31049b5e25fSSatish Balay 311d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 312d71ae5a4SJacob Faibussowitsch { 31349b5e25fSSatish Balay PetscFunctionBegin; 314cb4a9cd9SHong Zhang if (nz) *nz = 0; 3159566063dSJacob Faibussowitsch if (idx) PetscCall(PetscFree(*idx)); 3169566063dSJacob Faibussowitsch if (v) PetscCall(PetscFree(*v)); 3173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 31849b5e25fSSatish Balay } 31949b5e25fSSatish Balay 320d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A) 321d71ae5a4SJacob Faibussowitsch { 322f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 323f5edf698SHong Zhang 324f5edf698SHong Zhang PetscFunctionBegin; 325f5edf698SHong Zhang a->getrow_utriangular = PETSC_TRUE; 3263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 327f5edf698SHong Zhang } 328a323099bSStefano Zampini 329d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A) 330d71ae5a4SJacob Faibussowitsch { 331f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 332f5edf698SHong Zhang 333f5edf698SHong Zhang PetscFunctionBegin; 334f5edf698SHong Zhang a->getrow_utriangular = PETSC_FALSE; 3353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 336f5edf698SHong Zhang } 337f5edf698SHong Zhang 338d71ae5a4SJacob Faibussowitsch PetscErrorCode MatTranspose_SeqSBAIJ(Mat A, MatReuse reuse, Mat *B) 339d71ae5a4SJacob Faibussowitsch { 34049b5e25fSSatish Balay PetscFunctionBegin; 3417fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 342cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 3439566063dSJacob Faibussowitsch PetscCall(MatDuplicate(A, MAT_COPY_VALUES, B)); 344cf37664fSBarry Smith } else if (reuse == MAT_REUSE_MATRIX) { 3459566063dSJacob Faibussowitsch PetscCall(MatCopy(A, *B, SAME_NONZERO_PATTERN)); 346fc4dec0aSBarry Smith } 3473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 34849b5e25fSSatish Balay } 34949b5e25fSSatish Balay 350d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A, PetscViewer viewer) 351d71ae5a4SJacob Faibussowitsch { 35249b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 353d0f46423SBarry Smith PetscInt i, j, bs = A->rmap->bs, k, l, bs2 = a->bs2; 354f3ef73ceSBarry Smith PetscViewerFormat format; 355121deb67SSatish Balay PetscInt *diag; 356b3a0534dSBarry Smith const char *matname; 35749b5e25fSSatish Balay 35849b5e25fSSatish Balay PetscFunctionBegin; 3599566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 360456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 3619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " block size is %" PetscInt_FMT "\n", bs)); 362fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_MATLAB) { 363d2507d54SMatthew Knepley Mat aij; 364ade3a672SBarry Smith 365d5f3da31SBarry Smith if (A->factortype && bs > 1) { 3669566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "Warning: matrix is factored with bs>1. MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n")); 3673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 36870d5e725SHong Zhang } 3699566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &aij)); 37023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 37123a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)aij, matname)); 37223a3927dSBarry Smith PetscCall(MatView_SeqAIJ(aij, viewer)); 3739566063dSJacob Faibussowitsch PetscCall(MatDestroy(&aij)); 374fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 375b3a0534dSBarry Smith Mat B; 376b3a0534dSBarry Smith 377b3a0534dSBarry Smith PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 378b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 379b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 380b3a0534dSBarry Smith PetscCall(MatView_SeqAIJ(B, viewer)); 381b3a0534dSBarry Smith PetscCall(MatDestroy(&B)); 382c1490034SHong Zhang } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) { 3833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 38449b5e25fSSatish Balay } else { 3859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 3862c990fa1SHong Zhang if (A->factortype) { /* for factored matrix */ 38708401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "matrix is factored with bs>1. Not implemented yet"); 3882c990fa1SHong Zhang 389121deb67SSatish Balay diag = a->diag; 390121deb67SSatish Balay for (i = 0; i < a->mbs; i++) { /* for row block i */ 3919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 3922c990fa1SHong Zhang /* diagonal entry */ 3932c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 3942c990fa1SHong Zhang if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) { 3959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), (double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 3962c990fa1SHong Zhang } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) { 3979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), -(double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 3982c990fa1SHong Zhang } else { 3999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]))); 4002c990fa1SHong Zhang } 4012c990fa1SHong Zhang #else 4029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)(1.0 / a->a[diag[i]]))); 4032c990fa1SHong Zhang #endif 4042c990fa1SHong Zhang /* off-diagonal entries */ 4052c990fa1SHong Zhang for (k = a->i[i]; k < a->i[i + 1] - 1; k++) { 4062c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 407ca0704adSBarry Smith if (PetscImaginaryPart(a->a[k]) > 0.0) { 4089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), (double)PetscImaginaryPart(a->a[k]))); 409ca0704adSBarry Smith } else if (PetscImaginaryPart(a->a[k]) < 0.0) { 4109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), -(double)PetscImaginaryPart(a->a[k]))); 4112c990fa1SHong Zhang } else { 4129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k], (double)PetscRealPart(a->a[k]))); 4132c990fa1SHong Zhang } 4142c990fa1SHong Zhang #else 4159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[k], (double)a->a[k])); 4162c990fa1SHong Zhang #endif 4172c990fa1SHong Zhang } 4189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 4192c990fa1SHong Zhang } 4202c990fa1SHong Zhang 4212c990fa1SHong Zhang } else { /* for non-factored matrix */ 4220c74a584SJed Brown for (i = 0; i < a->mbs; i++) { /* for row block i */ 4230c74a584SJed Brown for (j = 0; j < bs; j++) { /* for row bs*i + j */ 4249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i * bs + j)); 4250c74a584SJed Brown for (k = a->i[i]; k < a->i[i + 1]; k++) { /* for column block */ 4260c74a584SJed Brown for (l = 0; l < bs; l++) { /* for column */ 42749b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 42849b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) > 0.0) { 4299371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), (double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 43049b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) < 0.0) { 4319371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), -(double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 43249b5e25fSSatish Balay } else { 4339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]))); 43449b5e25fSSatish Balay } 43549b5e25fSSatish Balay #else 4369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)a->a[bs2 * k + l * bs + j])); 43749b5e25fSSatish Balay #endif 43849b5e25fSSatish Balay } 43949b5e25fSSatish Balay } 4409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 44149b5e25fSSatish Balay } 44249b5e25fSSatish Balay } 4432c990fa1SHong Zhang } 4449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 44549b5e25fSSatish Balay } 4469566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 4473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44849b5e25fSSatish Balay } 44949b5e25fSSatish Balay 4509804daf3SBarry Smith #include <petscdraw.h> 451d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 452d71ae5a4SJacob Faibussowitsch { 45349b5e25fSSatish Balay Mat A = (Mat)Aa; 45449b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 455d0f46423SBarry Smith PetscInt row, i, j, k, l, mbs = a->mbs, color, bs = A->rmap->bs, bs2 = a->bs2; 45649b5e25fSSatish Balay PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 45749b5e25fSSatish Balay MatScalar *aa; 458b0a32e0cSBarry Smith PetscViewer viewer; 45949b5e25fSSatish Balay 46049b5e25fSSatish Balay PetscFunctionBegin; 4619566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 4629566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 46349b5e25fSSatish Balay 46449b5e25fSSatish Balay /* loop over matrix elements drawing boxes */ 465383922c3SLisandro Dalcin 466d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 4679566063dSJacob Faibussowitsch PetscCall(PetscDrawString(draw, .3 * (xl + xr), .3 * (yl + yr), PETSC_DRAW_BLACK, "symmetric")); 468383922c3SLisandro Dalcin /* Blue for negative, Cyan for zero and Red for positive */ 469b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 47049b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 47149b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4729371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4739371c9d4SSatish Balay y_r = y_l + 1.0; 4749371c9d4SSatish Balay x_l = a->j[j] * bs; 4759371c9d4SSatish Balay x_r = x_l + 1.0; 47649b5e25fSSatish Balay aa = a->a + j * bs2; 47749b5e25fSSatish Balay for (k = 0; k < bs; k++) { 47849b5e25fSSatish Balay for (l = 0; l < bs; l++) { 47949b5e25fSSatish Balay if (PetscRealPart(*aa++) >= 0.) continue; 4809566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 48149b5e25fSSatish Balay } 48249b5e25fSSatish Balay } 48349b5e25fSSatish Balay } 48449b5e25fSSatish Balay } 485b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 48649b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 48749b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4889371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4899371c9d4SSatish Balay y_r = y_l + 1.0; 4909371c9d4SSatish Balay x_l = a->j[j] * bs; 4919371c9d4SSatish Balay x_r = x_l + 1.0; 49249b5e25fSSatish Balay aa = a->a + j * bs2; 49349b5e25fSSatish Balay for (k = 0; k < bs; k++) { 49449b5e25fSSatish Balay for (l = 0; l < bs; l++) { 49549b5e25fSSatish Balay if (PetscRealPart(*aa++) != 0.) continue; 4969566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 49749b5e25fSSatish Balay } 49849b5e25fSSatish Balay } 49949b5e25fSSatish Balay } 50049b5e25fSSatish Balay } 501b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 50249b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 50349b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 5049371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 5059371c9d4SSatish Balay y_r = y_l + 1.0; 5069371c9d4SSatish Balay x_l = a->j[j] * bs; 5079371c9d4SSatish Balay x_r = x_l + 1.0; 50849b5e25fSSatish Balay aa = a->a + j * bs2; 50949b5e25fSSatish Balay for (k = 0; k < bs; k++) { 51049b5e25fSSatish Balay for (l = 0; l < bs; l++) { 51149b5e25fSSatish Balay if (PetscRealPart(*aa++) <= 0.) continue; 5129566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 51349b5e25fSSatish Balay } 51449b5e25fSSatish Balay } 51549b5e25fSSatish Balay } 51649b5e25fSSatish Balay } 517d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 5183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51949b5e25fSSatish Balay } 52049b5e25fSSatish Balay 521d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A, PetscViewer viewer) 522d71ae5a4SJacob Faibussowitsch { 52349b5e25fSSatish Balay PetscReal xl, yl, xr, yr, w, h; 524b0a32e0cSBarry Smith PetscDraw draw; 525ace3abfcSBarry Smith PetscBool isnull; 52649b5e25fSSatish Balay 52749b5e25fSSatish Balay PetscFunctionBegin; 5289566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 5299566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 5303ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 53149b5e25fSSatish Balay 5329371c9d4SSatish Balay xr = A->rmap->N; 5339371c9d4SSatish Balay yr = A->rmap->N; 5349371c9d4SSatish Balay h = yr / 10.0; 5359371c9d4SSatish Balay w = xr / 10.0; 5369371c9d4SSatish Balay xr += w; 5379371c9d4SSatish Balay yr += h; 5389371c9d4SSatish Balay xl = -w; 5399371c9d4SSatish Balay yl = -h; 5409566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 5419566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 5429566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqSBAIJ_Draw_Zoom, A)); 5439566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 5449566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 5453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54649b5e25fSSatish Balay } 54749b5e25fSSatish Balay 548618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */ 549618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary 550618cc2edSLisandro Dalcin 551d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ(Mat A, PetscViewer viewer) 552d71ae5a4SJacob Faibussowitsch { 553618cc2edSLisandro Dalcin PetscBool iascii, isbinary, isdraw; 55449b5e25fSSatish Balay 55549b5e25fSSatish Balay PetscFunctionBegin; 5569566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 5579566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 5589566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 55932077d6dSBarry Smith if (iascii) { 5609566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_ASCII(A, viewer)); 561618cc2edSLisandro Dalcin } else if (isbinary) { 5629566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Binary(A, viewer)); 56349b5e25fSSatish Balay } else if (isdraw) { 5649566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Draw(A, viewer)); 56549b5e25fSSatish Balay } else { 566a5e6ed63SBarry Smith Mat B; 567ade3a672SBarry Smith const char *matname; 5689566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 56923a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 57023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 5719566063dSJacob Faibussowitsch PetscCall(MatView(B, viewer)); 5729566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 57349b5e25fSSatish Balay } 5743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 57549b5e25fSSatish Balay } 57649b5e25fSSatish Balay 577d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 578d71ae5a4SJacob Faibussowitsch { 579045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 58013f74950SBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 58113f74950SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 582d0f46423SBarry Smith PetscInt brow, bcol, ridx, cidx, bs = A->rmap->bs, bs2 = a->bs2; 58397e567efSBarry Smith MatScalar *ap, *aa = a->a; 58449b5e25fSSatish Balay 58549b5e25fSSatish Balay PetscFunctionBegin; 58649b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over rows */ 5879371c9d4SSatish Balay row = im[k]; 5889371c9d4SSatish Balay brow = row / bs; 5899371c9d4SSatish Balay if (row < 0) { 5909371c9d4SSatish Balay v += n; 5919371c9d4SSatish Balay continue; 5929371c9d4SSatish Balay } /* negative row */ 59354c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 5949371c9d4SSatish Balay rp = aj + ai[brow]; 5959371c9d4SSatish Balay ap = aa + bs2 * ai[brow]; 59649b5e25fSSatish Balay nrow = ailen[brow]; 59749b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over columns */ 5989371c9d4SSatish Balay if (in[l] < 0) { 5999371c9d4SSatish Balay v++; 6009371c9d4SSatish Balay continue; 6019371c9d4SSatish Balay } /* negative column */ 60254c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 60349b5e25fSSatish Balay col = in[l]; 60449b5e25fSSatish Balay bcol = col / bs; 60549b5e25fSSatish Balay cidx = col % bs; 60649b5e25fSSatish Balay ridx = row % bs; 60749b5e25fSSatish Balay high = nrow; 60849b5e25fSSatish Balay low = 0; /* assume unsorted */ 60949b5e25fSSatish Balay while (high - low > 5) { 61049b5e25fSSatish Balay t = (low + high) / 2; 61149b5e25fSSatish Balay if (rp[t] > bcol) high = t; 61249b5e25fSSatish Balay else low = t; 61349b5e25fSSatish Balay } 61449b5e25fSSatish Balay for (i = low; i < high; i++) { 61549b5e25fSSatish Balay if (rp[i] > bcol) break; 61649b5e25fSSatish Balay if (rp[i] == bcol) { 61749b5e25fSSatish Balay *v++ = ap[bs2 * i + bs * cidx + ridx]; 61849b5e25fSSatish Balay goto finished; 61949b5e25fSSatish Balay } 62049b5e25fSSatish Balay } 62197e567efSBarry Smith *v++ = 0.0; 62249b5e25fSSatish Balay finished:; 62349b5e25fSSatish Balay } 62449b5e25fSSatish Balay } 6253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 62649b5e25fSSatish Balay } 62749b5e25fSSatish Balay 628d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqSBAIJ(Mat A, IS rowp, IS colp, Mat *B) 629d71ae5a4SJacob Faibussowitsch { 630dc29a518SPierre Jolivet Mat C; 631dc29a518SPierre Jolivet 632dc29a518SPierre Jolivet PetscFunctionBegin; 6339566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQBAIJ, MAT_INITIAL_MATRIX, &C)); 6349566063dSJacob Faibussowitsch PetscCall(MatPermute(C, rowp, colp, B)); 6359566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 63648a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatConvert(*B, MATSEQSBAIJ, MAT_INPLACE_MATRIX, B)); 6373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 638dc29a518SPierre Jolivet } 63949b5e25fSSatish Balay 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 641d71ae5a4SJacob Faibussowitsch { 6420880e062SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 643e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, jj, row, nrow, i, col, l, rmax, N, lastcol = -1; 64413f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 645d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs2 = a->bs2, bs = A->rmap->bs, stepval; 646ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 647dd6ea824SBarry Smith const PetscScalar *value = v; 648f15d580aSBarry Smith MatScalar *ap, *aa = a->a, *bap; 6490880e062SHong Zhang 65049b5e25fSSatish Balay PetscFunctionBegin; 65126fbe8dcSKarl Rupp if (roworiented) stepval = (n - 1) * bs; 65226fbe8dcSKarl Rupp else stepval = (m - 1) * bs; 65326fbe8dcSKarl Rupp 6540880e062SHong Zhang for (k = 0; k < m; k++) { /* loop over added rows */ 6550880e062SHong Zhang row = im[k]; 6560880e062SHong Zhang if (row < 0) continue; 6576bdcaf15SBarry Smith PetscCheck(row < a->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index row too large %" PetscInt_FMT " max %" PetscInt_FMT, row, a->mbs - 1); 6580880e062SHong Zhang rp = aj + ai[row]; 6590880e062SHong Zhang ap = aa + bs2 * ai[row]; 6600880e062SHong Zhang rmax = imax[row]; 6610880e062SHong Zhang nrow = ailen[row]; 6620880e062SHong Zhang low = 0; 663818f2c47SBarry Smith high = nrow; 6640880e062SHong Zhang for (l = 0; l < n; l++) { /* loop over added columns */ 6650880e062SHong Zhang if (in[l] < 0) continue; 6660880e062SHong Zhang col = in[l]; 6676bdcaf15SBarry Smith PetscCheck(col < a->nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index column too large %" PetscInt_FMT " max %" PetscInt_FMT, col, a->nbs - 1); 668b98bf0e1SJed Brown if (col < row) { 66926fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular block */ 67026fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 671b98bf0e1SJed Brown } 67226fbe8dcSKarl Rupp if (roworiented) value = v + k * (stepval + bs) * bs + l * bs; 67326fbe8dcSKarl Rupp else value = v + l * (stepval + bs) * bs + k * bs; 67426fbe8dcSKarl Rupp 67526fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 67626fbe8dcSKarl Rupp else high = nrow; 67726fbe8dcSKarl Rupp 678e2ee6c50SBarry Smith lastcol = col; 6790880e062SHong Zhang while (high - low > 7) { 6800880e062SHong Zhang t = (low + high) / 2; 6810880e062SHong Zhang if (rp[t] > col) high = t; 6820880e062SHong Zhang else low = t; 6830880e062SHong Zhang } 6840880e062SHong Zhang for (i = low; i < high; i++) { 6850880e062SHong Zhang if (rp[i] > col) break; 6860880e062SHong Zhang if (rp[i] == col) { 6870880e062SHong Zhang bap = ap + bs2 * i; 6880880e062SHong Zhang if (roworiented) { 6890880e062SHong Zhang if (is == ADD_VALUES) { 6900880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 691ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] += *value++; 6920880e062SHong Zhang } 6930880e062SHong Zhang } else { 6940880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 695ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 6960880e062SHong Zhang } 6970880e062SHong Zhang } 6980880e062SHong Zhang } else { 6990880e062SHong Zhang if (is == ADD_VALUES) { 7000880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 701ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ += *value++; 7020880e062SHong Zhang } 7030880e062SHong Zhang } else { 7040880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 705ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7060880e062SHong Zhang } 7070880e062SHong Zhang } 7080880e062SHong Zhang } 7090880e062SHong Zhang goto noinsert2; 7100880e062SHong Zhang } 7110880e062SHong Zhang } 7120880e062SHong Zhang if (nonew == 1) goto noinsert2; 71308401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new block index nonzero block (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 714fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 7159371c9d4SSatish Balay N = nrow++ - 1; 7169371c9d4SSatish Balay high++; 7170880e062SHong Zhang /* shift up all the later entries in this row */ 7189566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 7199566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 7209566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 7210880e062SHong Zhang rp[i] = col; 7220880e062SHong Zhang bap = ap + bs2 * i; 7230880e062SHong Zhang if (roworiented) { 7240880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 725ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7260880e062SHong Zhang } 7270880e062SHong Zhang } else { 7280880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 729ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7300880e062SHong Zhang } 7310880e062SHong Zhang } 7320880e062SHong Zhang noinsert2:; 7330880e062SHong Zhang low = i; 7340880e062SHong Zhang } 7350880e062SHong Zhang ailen[row] = nrow; 7360880e062SHong Zhang } 7373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 73849b5e25fSSatish Balay } 73949b5e25fSSatish Balay 74064831d72SBarry Smith /* 74164831d72SBarry Smith This is not yet used 74264831d72SBarry Smith */ 743d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ_SeqAIJ_Inode(Mat A) 744d71ae5a4SJacob Faibussowitsch { 7450def2e27SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 7460def2e27SBarry Smith const PetscInt *ai = a->i, *aj = a->j, *cols; 7470def2e27SBarry Smith PetscInt i = 0, j, blk_size, m = A->rmap->n, node_count = 0, nzx, nzy, *ns, row, nz, cnt, cnt2, *counts; 748ace3abfcSBarry Smith PetscBool flag; 7490def2e27SBarry Smith 7500def2e27SBarry Smith PetscFunctionBegin; 7519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &ns)); 7520def2e27SBarry Smith while (i < m) { 7530def2e27SBarry Smith nzx = ai[i + 1] - ai[i]; /* Number of nonzeros */ 7540def2e27SBarry Smith /* Limits the number of elements in a node to 'a->inode.limit' */ 7550def2e27SBarry Smith for (j = i + 1, blk_size = 1; j < m && blk_size < a->inode.limit; ++j, ++blk_size) { 7560def2e27SBarry Smith nzy = ai[j + 1] - ai[j]; 7570def2e27SBarry Smith if (nzy != (nzx - j + i)) break; 7589566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aj + ai[i] + j - i, aj + ai[j], nzy, &flag)); 7590def2e27SBarry Smith if (!flag) break; 7600def2e27SBarry Smith } 7610def2e27SBarry Smith ns[node_count++] = blk_size; 76226fbe8dcSKarl Rupp 7630def2e27SBarry Smith i = j; 7640def2e27SBarry Smith } 7650def2e27SBarry Smith if (!a->inode.size && m && node_count > .9 * m) { 7669566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7679566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes out of %" PetscInt_FMT " rows. Not using Inode routines\n", node_count, m)); 7680def2e27SBarry Smith } else { 7690def2e27SBarry Smith a->inode.node_count = node_count; 77026fbe8dcSKarl Rupp 7719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(node_count, &a->inode.size)); 7729566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->inode.size, ns, node_count)); 7739566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7749566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes of %" PetscInt_FMT ". Limit used: %" PetscInt_FMT ". Using Inode routines\n", node_count, m, a->inode.limit)); 7750def2e27SBarry Smith 7760def2e27SBarry Smith /* count collections of adjacent columns in each inode */ 7770def2e27SBarry Smith row = 0; 7780def2e27SBarry Smith cnt = 0; 7790def2e27SBarry Smith for (i = 0; i < node_count; i++) { 7800def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7810def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 7820def2e27SBarry Smith for (j = 1; j < nz; j++) { 78326fbe8dcSKarl Rupp if (cols[j] != cols[j - 1] + 1) cnt++; 7840def2e27SBarry Smith } 7850def2e27SBarry Smith cnt++; 7860def2e27SBarry Smith row += a->inode.size[i]; 7870def2e27SBarry Smith } 7889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(2 * cnt, &counts)); 7890def2e27SBarry Smith cnt = 0; 7900def2e27SBarry Smith row = 0; 7910def2e27SBarry Smith for (i = 0; i < node_count; i++) { 7920def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7930def2e27SBarry Smith counts[2 * cnt] = cols[0]; 7940def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 7950def2e27SBarry Smith cnt2 = 1; 7960def2e27SBarry Smith for (j = 1; j < nz; j++) { 7970def2e27SBarry Smith if (cols[j] != cols[j - 1] + 1) { 7980def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 7990def2e27SBarry Smith counts[2 * cnt] = cols[j]; 8000def2e27SBarry Smith cnt2 = 1; 8010def2e27SBarry Smith } else cnt2++; 8020def2e27SBarry Smith } 8030def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 8040def2e27SBarry Smith row += a->inode.size[i]; 8050def2e27SBarry Smith } 8069566063dSJacob Faibussowitsch PetscCall(PetscIntView(2 * cnt, counts, NULL)); 8070def2e27SBarry Smith } 8083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 80938702af4SBarry Smith } 81038702af4SBarry Smith 811d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A, MatAssemblyType mode) 812d71ae5a4SJacob Faibussowitsch { 81349b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 8148f8f2f0dSBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 815d0f46423SBarry Smith PetscInt m = A->rmap->N, *ip, N, *ailen = a->ilen; 81613f74950SBarry Smith PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 81749b5e25fSSatish Balay MatScalar *aa = a->a, *ap; 81849b5e25fSSatish Balay 81949b5e25fSSatish Balay PetscFunctionBegin; 8203ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 82149b5e25fSSatish Balay 82249b5e25fSSatish Balay if (m) rmax = ailen[0]; 82349b5e25fSSatish Balay for (i = 1; i < mbs; i++) { 82449b5e25fSSatish Balay /* move each row back by the amount of empty slots (fshift) before it*/ 82549b5e25fSSatish Balay fshift += imax[i - 1] - ailen[i - 1]; 82649b5e25fSSatish Balay rmax = PetscMax(rmax, ailen[i]); 82749b5e25fSSatish Balay if (fshift) { 828580bdb30SBarry Smith ip = aj + ai[i]; 829580bdb30SBarry Smith ap = aa + bs2 * ai[i]; 83049b5e25fSSatish Balay N = ailen[i]; 8319566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 8329566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2 * N)); 83349b5e25fSSatish Balay } 83449b5e25fSSatish Balay ai[i] = ai[i - 1] + ailen[i - 1]; 83549b5e25fSSatish Balay } 83649b5e25fSSatish Balay if (mbs) { 83749b5e25fSSatish Balay fshift += imax[mbs - 1] - ailen[mbs - 1]; 83849b5e25fSSatish Balay ai[mbs] = ai[mbs - 1] + ailen[mbs - 1]; 83949b5e25fSSatish Balay } 84049b5e25fSSatish Balay /* reset ilen and imax for each row */ 841ad540459SPierre Jolivet for (i = 0; i < mbs; i++) ailen[i] = imax[i] = ai[i + 1] - ai[i]; 8426c6c5352SBarry Smith a->nz = ai[mbs]; 84349b5e25fSSatish Balay 844b424e231SHong Zhang /* diagonals may have moved, reset it */ 8451baa6e33SBarry Smith if (a->diag) PetscCall(PetscArraycpy(a->diag, ai, mbs)); 846aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT " block size %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, A->rmap->bs, fshift * bs2); 84726fbe8dcSKarl Rupp 8489566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT ", block size %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->rmap->N, A->rmap->bs, fshift * bs2, a->nz * bs2)); 8499566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues is %" PetscInt_FMT "\n", a->reallocs)); 8509566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Most nonzeros blocks in any row is %" PetscInt_FMT "\n", rmax)); 85126fbe8dcSKarl Rupp 8528e58a170SBarry Smith A->info.mallocs += a->reallocs; 85349b5e25fSSatish Balay a->reallocs = 0; 85449b5e25fSSatish Balay A->info.nz_unneeded = (PetscReal)fshift * bs2; 855061b2667SBarry Smith a->idiagvalid = PETSC_FALSE; 8564dcd73b1SHong Zhang a->rmax = rmax; 85738702af4SBarry Smith 85838702af4SBarry Smith if (A->cmap->n < 65536 && A->cmap->bs == 1) { 85944e1c64aSLisandro Dalcin if (a->jshort && a->free_jshort) { 86017803ae8SHong Zhang /* when matrix data structure is changed, previous jshort must be replaced */ 8619566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jshort)); 86217803ae8SHong Zhang } 8639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->i[A->rmap->n], &a->jshort)); 86438702af4SBarry Smith for (i = 0; i < a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i]; 86538702af4SBarry Smith A->ops->mult = MatMult_SeqSBAIJ_1_ushort; 86641f059aeSBarry Smith A->ops->sor = MatSOR_SeqSBAIJ_ushort; 8674da8f245SBarry Smith a->free_jshort = PETSC_TRUE; 86838702af4SBarry Smith } 8693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 87049b5e25fSSatish Balay } 87149b5e25fSSatish Balay 87249b5e25fSSatish Balay /* 87349b5e25fSSatish Balay This function returns an array of flags which indicate the locations of contiguous 87449b5e25fSSatish Balay blocks that should be zeroed. for eg: if bs = 3 and is = [0,1,2,3,5,6,7,8,9] 875a5b23f4aSJose E. Roman then the resulting sizes = [3,1,1,3,1] corresponding to sets [(0,1,2),(3),(5),(6,7,8),(9)] 87649b5e25fSSatish Balay Assume: sizes should be long enough to hold all the values. 87749b5e25fSSatish Balay */ 878d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqSBAIJ_Check_Blocks(PetscInt idx[], PetscInt n, PetscInt bs, PetscInt sizes[], PetscInt *bs_max) 879d71ae5a4SJacob Faibussowitsch { 88013f74950SBarry Smith PetscInt i, j, k, row; 881ace3abfcSBarry Smith PetscBool flg; 88249b5e25fSSatish Balay 88349b5e25fSSatish Balay PetscFunctionBegin; 88449b5e25fSSatish Balay for (i = 0, j = 0; i < n; j++) { 88549b5e25fSSatish Balay row = idx[i]; 886a5b23f4aSJose E. Roman if (row % bs != 0) { /* Not the beginning of a block */ 88749b5e25fSSatish Balay sizes[j] = 1; 88849b5e25fSSatish Balay i++; 88949b5e25fSSatish Balay } else if (i + bs > n) { /* Beginning of a block, but complete block doesn't exist (at idx end) */ 89049b5e25fSSatish Balay sizes[j] = 1; /* Also makes sure at least 'bs' values exist for next else */ 89149b5e25fSSatish Balay i++; 8926aad120cSJose E. Roman } else { /* Beginning of the block, so check if the complete block exists */ 89349b5e25fSSatish Balay flg = PETSC_TRUE; 89449b5e25fSSatish Balay for (k = 1; k < bs; k++) { 89549b5e25fSSatish Balay if (row + k != idx[i + k]) { /* break in the block */ 89649b5e25fSSatish Balay flg = PETSC_FALSE; 89749b5e25fSSatish Balay break; 89849b5e25fSSatish Balay } 89949b5e25fSSatish Balay } 900abc0a331SBarry Smith if (flg) { /* No break in the bs */ 90149b5e25fSSatish Balay sizes[j] = bs; 90249b5e25fSSatish Balay i += bs; 90349b5e25fSSatish Balay } else { 90449b5e25fSSatish Balay sizes[j] = 1; 90549b5e25fSSatish Balay i++; 90649b5e25fSSatish Balay } 90749b5e25fSSatish Balay } 90849b5e25fSSatish Balay } 90949b5e25fSSatish Balay *bs_max = j; 9103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 91149b5e25fSSatish Balay } 91249b5e25fSSatish Balay 91349b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks). 914da81f932SPierre Jolivet Any a(i,j) with i>j input by user is ignored. 91549b5e25fSSatish Balay */ 91649b5e25fSSatish Balay 917d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 918d71ae5a4SJacob Faibussowitsch { 91949b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 920e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N, lastcol = -1; 92113f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen, roworiented = a->roworiented; 922d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs = A->rmap->bs, brow, bcol; 92313f74950SBarry Smith PetscInt ridx, cidx, bs2 = a->bs2; 92449b5e25fSSatish Balay MatScalar *ap, value, *aa = a->a, *bap; 92549b5e25fSSatish Balay 92649b5e25fSSatish Balay PetscFunctionBegin; 92749b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over added rows */ 92849b5e25fSSatish Balay row = im[k]; /* row number */ 92949b5e25fSSatish Balay brow = row / bs; /* block row number */ 93049b5e25fSSatish Balay if (row < 0) continue; 9316bdcaf15SBarry Smith PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 93249b5e25fSSatish Balay rp = aj + ai[brow]; /*ptr to beginning of column value of the row block*/ 93349b5e25fSSatish Balay ap = aa + bs2 * ai[brow]; /*ptr to beginning of element value of the row block*/ 93449b5e25fSSatish Balay rmax = imax[brow]; /* maximum space allocated for this row */ 93549b5e25fSSatish Balay nrow = ailen[brow]; /* actual length of this row */ 93649b5e25fSSatish Balay low = 0; 9378509e838SStefano Zampini high = nrow; 93849b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over added columns */ 93949b5e25fSSatish Balay if (in[l] < 0) continue; 9406bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->N - 1); 94149b5e25fSSatish Balay col = in[l]; 94249b5e25fSSatish Balay bcol = col / bs; /* block col number */ 94349b5e25fSSatish Balay 944941593c8SHong Zhang if (brow > bcol) { 94526fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular values */ 94626fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 947941593c8SHong Zhang } 948f4989cb3SHong Zhang 9499371c9d4SSatish Balay ridx = row % bs; 9509371c9d4SSatish Balay cidx = col % bs; /*row and col index inside the block */ 9518549e402SHong Zhang if ((brow == bcol && ridx <= cidx) || (brow < bcol)) { 95249b5e25fSSatish Balay /* element value a(k,l) */ 95326fbe8dcSKarl Rupp if (roworiented) value = v[l + k * n]; 95426fbe8dcSKarl Rupp else value = v[k + l * m]; 95549b5e25fSSatish Balay 95649b5e25fSSatish Balay /* move pointer bap to a(k,l) quickly and add/insert value */ 95726fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 9588509e838SStefano Zampini else high = nrow; 9598509e838SStefano Zampini 960e2ee6c50SBarry Smith lastcol = col; 96149b5e25fSSatish Balay while (high - low > 7) { 96249b5e25fSSatish Balay t = (low + high) / 2; 96349b5e25fSSatish Balay if (rp[t] > bcol) high = t; 96449b5e25fSSatish Balay else low = t; 96549b5e25fSSatish Balay } 96649b5e25fSSatish Balay for (i = low; i < high; i++) { 96749b5e25fSSatish Balay if (rp[i] > bcol) break; 96849b5e25fSSatish Balay if (rp[i] == bcol) { 96949b5e25fSSatish Balay bap = ap + bs2 * i + bs * cidx + ridx; 97049b5e25fSSatish Balay if (is == ADD_VALUES) *bap += value; 97149b5e25fSSatish Balay else *bap = value; 9728549e402SHong Zhang /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 9738549e402SHong Zhang if (brow == bcol && ridx < cidx) { 9748549e402SHong Zhang bap = ap + bs2 * i + bs * ridx + cidx; 9758549e402SHong Zhang if (is == ADD_VALUES) *bap += value; 9768549e402SHong Zhang else *bap = value; 9778549e402SHong Zhang } 97849b5e25fSSatish Balay goto noinsert1; 97949b5e25fSSatish Balay } 98049b5e25fSSatish Balay } 98149b5e25fSSatish Balay 98249b5e25fSSatish Balay if (nonew == 1) goto noinsert1; 98308401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 984fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, brow, bcol, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 98549b5e25fSSatish Balay 9869371c9d4SSatish Balay N = nrow++ - 1; 9879371c9d4SSatish Balay high++; 98849b5e25fSSatish Balay /* shift up all the later entries in this row */ 9899566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 9909566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 9919566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 99249b5e25fSSatish Balay rp[i] = bcol; 99349b5e25fSSatish Balay ap[bs2 * i + bs * cidx + ridx] = value; 9948509e838SStefano Zampini /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 995ad540459SPierre Jolivet if (brow == bcol && ridx < cidx) ap[bs2 * i + bs * ridx + cidx] = value; 996e56f5c9eSBarry Smith A->nonzerostate++; 99749b5e25fSSatish Balay noinsert1:; 99849b5e25fSSatish Balay low = i; 9998549e402SHong Zhang } 100049b5e25fSSatish Balay } /* end of loop over added columns */ 100149b5e25fSSatish Balay ailen[brow] = nrow; 100249b5e25fSSatish Balay } /* end of loop over added rows */ 10033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 100449b5e25fSSatish Balay } 100549b5e25fSSatish Balay 1006d71ae5a4SJacob Faibussowitsch PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA, IS row, const MatFactorInfo *info) 1007d71ae5a4SJacob Faibussowitsch { 10084ccecd49SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)inA->data; 100949b5e25fSSatish Balay Mat outA; 1010ace3abfcSBarry Smith PetscBool row_identity; 101149b5e25fSSatish Balay 101249b5e25fSSatish Balay PetscFunctionBegin; 101308401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 is supported for in-place icc"); 10149566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 101528b400f6SJacob Faibussowitsch PetscCheck(row_identity, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix reordering is not supported"); 101608401ef6SPierre Jolivet PetscCheck(inA->rmap->bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix block size %" PetscInt_FMT " is not supported", inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! */ 1017c84f5b01SHong Zhang 101849b5e25fSSatish Balay outA = inA; 1019d5f3da31SBarry Smith inA->factortype = MAT_FACTOR_ICC; 10209566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 10219566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 102249b5e25fSSatish Balay 10239566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(inA)); 10249566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetNumericFactorization_inplace(inA, row_identity)); 102549b5e25fSSatish Balay 10269566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10279566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1028c84f5b01SHong Zhang a->row = row; 10299566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10309566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1031c84f5b01SHong Zhang a->col = row; 1032c84f5b01SHong Zhang 1033c84f5b01SHong Zhang /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */ 10349566063dSJacob Faibussowitsch if (a->icol) PetscCall(ISInvertPermutation(row, PETSC_DECIDE, &a->icol)); 103549b5e25fSSatish Balay 10364dfa11a4SJacob Faibussowitsch if (!a->solve_work) { PetscCall(PetscMalloc1(inA->rmap->N + inA->rmap->bs, &a->solve_work)); } 103749b5e25fSSatish Balay 10389566063dSJacob Faibussowitsch PetscCall(MatCholeskyFactorNumeric(outA, inA, info)); 10393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 104049b5e25fSSatish Balay } 1041950f1e5bSHong Zhang 1042d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat, PetscInt *indices) 1043d71ae5a4SJacob Faibussowitsch { 1044045c9aa0SHong Zhang Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)mat->data; 104513f74950SBarry Smith PetscInt i, nz, n; 104649b5e25fSSatish Balay 104749b5e25fSSatish Balay PetscFunctionBegin; 10486c6c5352SBarry Smith nz = baij->maxnz; 1049d0f46423SBarry Smith n = mat->cmap->n; 105026fbe8dcSKarl Rupp for (i = 0; i < nz; i++) baij->j[i] = indices[i]; 105126fbe8dcSKarl Rupp 10526c6c5352SBarry Smith baij->nz = nz; 105326fbe8dcSKarl Rupp for (i = 0; i < n; i++) baij->ilen[i] = baij->imax[i]; 105426fbe8dcSKarl Rupp 10559566063dSJacob Faibussowitsch PetscCall(MatSetOption(mat, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 10563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 105749b5e25fSSatish Balay } 105849b5e25fSSatish Balay 105949b5e25fSSatish Balay /*@ 106019585528SSatish Balay MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows 106111a5261eSBarry Smith in a `MATSEQSBAIJ` matrix. 106249b5e25fSSatish Balay 106349b5e25fSSatish Balay Input Parameters: 106411a5261eSBarry Smith + mat - the `MATSEQSBAIJ` matrix 106549b5e25fSSatish Balay - indices - the column indices 106649b5e25fSSatish Balay 106749b5e25fSSatish Balay Level: advanced 106849b5e25fSSatish Balay 106949b5e25fSSatish Balay Notes: 107049b5e25fSSatish Balay This can be called if you have precomputed the nonzero structure of the 107149b5e25fSSatish Balay matrix and want to provide it to the matrix object to improve the performance 107211a5261eSBarry Smith of the `MatSetValues()` operation. 107349b5e25fSSatish Balay 107449b5e25fSSatish Balay You MUST have set the correct numbers of nonzeros per row in the call to 107511a5261eSBarry Smith `MatCreateSeqSBAIJ()`, and the columns indices MUST be sorted. 107649b5e25fSSatish Balay 1077ab9f2c04SSatish Balay MUST be called before any calls to MatSetValues() 107849b5e25fSSatish Balay 107911a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreateSeqSBAIJ` 108049b5e25fSSatish Balay @*/ 1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat, PetscInt *indices) 1082d71ae5a4SJacob Faibussowitsch { 108349b5e25fSSatish Balay PetscFunctionBegin; 10840700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 1085dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 1086cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqSBAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 10873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 108849b5e25fSSatish Balay } 108949b5e25fSSatish Balay 1090d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqSBAIJ(Mat A, Mat B, MatStructure str) 1091d71ae5a4SJacob Faibussowitsch { 10924c7a3774SStefano Zampini PetscBool isbaij; 10933c896bc6SHong Zhang 10943c896bc6SHong Zhang PetscFunctionBegin; 10959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &isbaij, MATSEQSBAIJ, MATMPISBAIJ, "")); 109628b400f6SJacob Faibussowitsch PetscCheck(isbaij, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Not for matrix type %s", ((PetscObject)B)->type_name); 10974c7a3774SStefano Zampini /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. */ 10984c7a3774SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 10993c896bc6SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11003c896bc6SHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 11013c896bc6SHong Zhang 110208401ef6SPierre Jolivet PetscCheck(a->i[a->mbs] == b->i[b->mbs], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different"); 110308401ef6SPierre Jolivet PetscCheck(a->mbs == b->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of rows in two matrices are different"); 110408401ef6SPierre Jolivet PetscCheck(a->bs2 == b->bs2, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different block size"); 11059566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, a->a, a->bs2 * a->i[a->mbs])); 11069566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 11073c896bc6SHong Zhang } else { 11089566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(A)); 11099566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 11109566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(A)); 11113c896bc6SHong Zhang } 11123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11133c896bc6SHong Zhang } 11143c896bc6SHong Zhang 1115d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1116d71ae5a4SJacob Faibussowitsch { 1117a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11185fd66863SKarl Rupp 1119a6ece127SHong Zhang PetscFunctionBegin; 1120a6ece127SHong Zhang *array = a->a; 11213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1122a6ece127SHong Zhang } 1123a6ece127SHong Zhang 1124d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1125d71ae5a4SJacob Faibussowitsch { 1126a6ece127SHong Zhang PetscFunctionBegin; 1127cda14afcSprj- *array = NULL; 11283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1129a6ece127SHong Zhang } 1130a6ece127SHong Zhang 1131d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y, Mat X, PetscInt *nnz) 1132d71ae5a4SJacob Faibussowitsch { 1133b264fe52SHong Zhang PetscInt bs = Y->rmap->bs, mbs = Y->rmap->N / bs; 113452768537SHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data; 113552768537SHong Zhang Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ *)Y->data; 113652768537SHong Zhang 113752768537SHong Zhang PetscFunctionBegin; 113852768537SHong Zhang /* Set the number of nonzeros in the new matrix */ 11399566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(mbs, x->i, x->j, y->i, y->j, nnz)); 11403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 114152768537SHong Zhang } 114252768537SHong Zhang 1143d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 1144d71ae5a4SJacob Faibussowitsch { 114542ee4b1aSHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data, *y = (Mat_SeqSBAIJ *)Y->data; 114631ce2d13SHong Zhang PetscInt bs = Y->rmap->bs, bs2 = bs * bs; 1147e838b9e7SJed Brown PetscBLASInt one = 1; 114842ee4b1aSHong Zhang 114942ee4b1aSHong Zhang PetscFunctionBegin; 1150134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 1151134adf20SPierre Jolivet PetscBool e = x->nz == y->nz && x->mbs == y->mbs ? PETSC_TRUE : PETSC_FALSE; 1152134adf20SPierre Jolivet if (e) { 11539566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, x->mbs + 1, &e)); 1154134adf20SPierre Jolivet if (e) { 11559566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, x->i[x->mbs], &e)); 1156134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 1157134adf20SPierre Jolivet } 1158134adf20SPierre Jolivet } 115954c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 1160134adf20SPierre Jolivet } 116142ee4b1aSHong Zhang if (str == SAME_NONZERO_PATTERN) { 1162f4df32b1SMatthew Knepley PetscScalar alpha = a; 1163c5df96a5SBarry Smith PetscBLASInt bnz; 11649566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz * bs2, &bnz)); 1165792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, x->a, &one, y->a, &one)); 11669566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 1167ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 11689566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_TRUE)); 11699566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 11709566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_FALSE)); 117142ee4b1aSHong Zhang } else { 117252768537SHong Zhang Mat B; 117352768537SHong Zhang PetscInt *nnz; 117454c59aa7SJacob Faibussowitsch PetscCheck(bs == X->rmap->bs, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Matrices must have same block size"); 11759566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(X)); 11769566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(Y)); 11779566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 11789566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 11799566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 11809566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, Y->rmap->n, Y->cmap->n, Y->rmap->N, Y->cmap->N)); 11819566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, Y, Y)); 11829566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 11839566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqSBAIJ(Y, X, nnz)); 11849566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 118552768537SHong Zhang 11869566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 118752768537SHong Zhang 11889566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 11899566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 11909566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(X)); 11919566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(Y)); 119242ee4b1aSHong Zhang } 11933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119442ee4b1aSHong Zhang } 119542ee4b1aSHong Zhang 1196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1197d71ae5a4SJacob Faibussowitsch { 1198efcf0fc3SBarry Smith PetscFunctionBegin; 1199efcf0fc3SBarry Smith *flg = PETSC_TRUE; 12003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1201efcf0fc3SBarry Smith } 1202efcf0fc3SBarry Smith 1203d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A, PetscBool *flg) 1204d71ae5a4SJacob Faibussowitsch { 1205efcf0fc3SBarry Smith PetscFunctionBegin; 1206efcf0fc3SBarry Smith *flg = PETSC_TRUE; 12073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1208efcf0fc3SBarry Smith } 1209efcf0fc3SBarry Smith 1210d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1211d71ae5a4SJacob Faibussowitsch { 1212efcf0fc3SBarry Smith PetscFunctionBegin; 1213efcf0fc3SBarry Smith *flg = PETSC_FALSE; 12143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1215efcf0fc3SBarry Smith } 1216efcf0fc3SBarry Smith 1217d71ae5a4SJacob Faibussowitsch PetscErrorCode MatConjugate_SeqSBAIJ(Mat A) 1218d71ae5a4SJacob Faibussowitsch { 12192726fb6dSPierre Jolivet #if defined(PETSC_USE_COMPLEX) 12202726fb6dSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 12212726fb6dSPierre Jolivet PetscInt i, nz = a->bs2 * a->i[a->mbs]; 12222726fb6dSPierre Jolivet MatScalar *aa = a->a; 12232726fb6dSPierre Jolivet 12242726fb6dSPierre Jolivet PetscFunctionBegin; 12252726fb6dSPierre Jolivet for (i = 0; i < nz; i++) aa[i] = PetscConj(aa[i]); 12262726fb6dSPierre Jolivet #else 12272726fb6dSPierre Jolivet PetscFunctionBegin; 12282726fb6dSPierre Jolivet #endif 12293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12302726fb6dSPierre Jolivet } 12312726fb6dSPierre Jolivet 1232d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqSBAIJ(Mat A) 1233d71ae5a4SJacob Faibussowitsch { 123499cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 123599cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1236dd6ea824SBarry Smith MatScalar *aa = a->a; 123799cafbc1SBarry Smith 123899cafbc1SBarry Smith PetscFunctionBegin; 123999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 12403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 124199cafbc1SBarry Smith } 124299cafbc1SBarry Smith 1243d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A) 1244d71ae5a4SJacob Faibussowitsch { 124599cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 124699cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1247dd6ea824SBarry Smith MatScalar *aa = a->a; 124899cafbc1SBarry Smith 124999cafbc1SBarry Smith PetscFunctionBegin; 125099cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 12513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 125299cafbc1SBarry Smith } 125399cafbc1SBarry Smith 1254d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A, PetscInt is_n, const PetscInt is_idx[], PetscScalar diag, Vec x, Vec b) 1255d71ae5a4SJacob Faibussowitsch { 12563bededecSBarry Smith Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)A->data; 12573bededecSBarry Smith PetscInt i, j, k, count; 12583bededecSBarry Smith PetscInt bs = A->rmap->bs, bs2 = baij->bs2, row, col; 12593bededecSBarry Smith PetscScalar zero = 0.0; 12603bededecSBarry Smith MatScalar *aa; 12613bededecSBarry Smith const PetscScalar *xx; 12623bededecSBarry Smith PetscScalar *bb; 126356777dd2SBarry Smith PetscBool *zeroed, vecs = PETSC_FALSE; 12643bededecSBarry Smith 12653bededecSBarry Smith PetscFunctionBegin; 12663bededecSBarry Smith /* fix right hand side if needed */ 12673bededecSBarry Smith if (x && b) { 12689566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 12699566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 127056777dd2SBarry Smith vecs = PETSC_TRUE; 12713bededecSBarry Smith } 12723bededecSBarry Smith 12733bededecSBarry Smith /* zero the columns */ 12749566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 12753bededecSBarry Smith for (i = 0; i < is_n; i++) { 1276aed4548fSBarry Smith PetscCheck(is_idx[i] >= 0 && is_idx[i] < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", is_idx[i]); 12773bededecSBarry Smith zeroed[is_idx[i]] = PETSC_TRUE; 12783bededecSBarry Smith } 127956777dd2SBarry Smith if (vecs) { 128056777dd2SBarry Smith for (i = 0; i < A->rmap->N; i++) { 128156777dd2SBarry Smith row = i / bs; 128256777dd2SBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 128356777dd2SBarry Smith for (k = 0; k < bs; k++) { 128456777dd2SBarry Smith col = bs * baij->j[j] + k; 128556777dd2SBarry Smith if (col <= i) continue; 128656777dd2SBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 128726fbe8dcSKarl Rupp if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0] * xx[col]; 128826fbe8dcSKarl Rupp if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0] * xx[i]; 128956777dd2SBarry Smith } 129056777dd2SBarry Smith } 129156777dd2SBarry Smith } 129226fbe8dcSKarl Rupp for (i = 0; i < is_n; i++) bb[is_idx[i]] = diag * xx[is_idx[i]]; 129356777dd2SBarry Smith } 129456777dd2SBarry Smith 12953bededecSBarry Smith for (i = 0; i < A->rmap->N; i++) { 12963bededecSBarry Smith if (!zeroed[i]) { 12973bededecSBarry Smith row = i / bs; 12983bededecSBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 12993bededecSBarry Smith for (k = 0; k < bs; k++) { 13003bededecSBarry Smith col = bs * baij->j[j] + k; 13013bededecSBarry Smith if (zeroed[col]) { 13023bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 13033bededecSBarry Smith aa[0] = 0.0; 13043bededecSBarry Smith } 13053bededecSBarry Smith } 13063bededecSBarry Smith } 13073bededecSBarry Smith } 13083bededecSBarry Smith } 13099566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 131056777dd2SBarry Smith if (vecs) { 13119566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 13129566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 131356777dd2SBarry Smith } 13143bededecSBarry Smith 13153bededecSBarry Smith /* zero the rows */ 13163bededecSBarry Smith for (i = 0; i < is_n; i++) { 13173bededecSBarry Smith row = is_idx[i]; 13183bededecSBarry Smith count = (baij->i[row / bs + 1] - baij->i[row / bs]) * bs; 13193bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + baij->i[row / bs] * bs2 + (row % bs); 13203bededecSBarry Smith for (k = 0; k < count; k++) { 13213bededecSBarry Smith aa[0] = zero; 13223bededecSBarry Smith aa += bs; 13233bededecSBarry Smith } 1324dbbe0bcdSBarry Smith if (diag != 0.0) PetscUseTypeMethod(A, setvalues, 1, &row, 1, &row, &diag, INSERT_VALUES); 13253bededecSBarry Smith } 13269566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqSBAIJ(A, MAT_FINAL_ASSEMBLY)); 13273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13283bededecSBarry Smith } 13293bededecSBarry Smith 1330d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqSBAIJ(Mat Y, PetscScalar a) 1331d71ae5a4SJacob Faibussowitsch { 13327d68702bSBarry Smith Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)Y->data; 13337d68702bSBarry Smith 13347d68702bSBarry Smith PetscFunctionBegin; 133548a46eb9SPierre Jolivet if (!Y->preallocated || !aij->nz) PetscCall(MatSeqSBAIJSetPreallocation(Y, Y->rmap->bs, 1, NULL)); 13369566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(Y, a)); 13373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13387d68702bSBarry Smith } 13397d68702bSBarry Smith 134049b5e25fSSatish Balay /* -------------------------------------------------------------------*/ 13413964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ, 134249b5e25fSSatish Balay MatGetRow_SeqSBAIJ, 134349b5e25fSSatish Balay MatRestoreRow_SeqSBAIJ, 134449b5e25fSSatish Balay MatMult_SeqSBAIJ_N, 134597304618SKris Buschelman /* 4*/ MatMultAdd_SeqSBAIJ_N, 1346431c96f7SBarry Smith MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */ 1347e005ede5SBarry Smith MatMultAdd_SeqSBAIJ_N, 1348f4259b30SLisandro Dalcin NULL, 1349f4259b30SLisandro Dalcin NULL, 1350f4259b30SLisandro Dalcin NULL, 1351f4259b30SLisandro Dalcin /* 10*/ NULL, 1352f4259b30SLisandro Dalcin NULL, 1353c078aec8SLisandro Dalcin MatCholeskyFactor_SeqSBAIJ, 135441f059aeSBarry Smith MatSOR_SeqSBAIJ, 135549b5e25fSSatish Balay MatTranspose_SeqSBAIJ, 135697304618SKris Buschelman /* 15*/ MatGetInfo_SeqSBAIJ, 135749b5e25fSSatish Balay MatEqual_SeqSBAIJ, 135849b5e25fSSatish Balay MatGetDiagonal_SeqSBAIJ, 135949b5e25fSSatish Balay MatDiagonalScale_SeqSBAIJ, 136049b5e25fSSatish Balay MatNorm_SeqSBAIJ, 1361f4259b30SLisandro Dalcin /* 20*/ NULL, 136249b5e25fSSatish Balay MatAssemblyEnd_SeqSBAIJ, 136349b5e25fSSatish Balay MatSetOption_SeqSBAIJ, 136449b5e25fSSatish Balay MatZeroEntries_SeqSBAIJ, 1365f4259b30SLisandro Dalcin /* 24*/ NULL, 1366f4259b30SLisandro Dalcin NULL, 1367f4259b30SLisandro Dalcin NULL, 1368f4259b30SLisandro Dalcin NULL, 1369f4259b30SLisandro Dalcin NULL, 1370*26cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 1371f4259b30SLisandro Dalcin NULL, 1372f4259b30SLisandro Dalcin NULL, 1373f4259b30SLisandro Dalcin NULL, 1374f4259b30SLisandro Dalcin NULL, 1375d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqSBAIJ, 1376f4259b30SLisandro Dalcin NULL, 1377f4259b30SLisandro Dalcin NULL, 1378f4259b30SLisandro Dalcin NULL, 1379c84f5b01SHong Zhang MatICCFactor_SeqSBAIJ, 1380d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqSBAIJ, 13817dae84e0SHong Zhang MatCreateSubMatrices_SeqSBAIJ, 138249b5e25fSSatish Balay MatIncreaseOverlap_SeqSBAIJ, 138349b5e25fSSatish Balay MatGetValues_SeqSBAIJ, 13843c896bc6SHong Zhang MatCopy_SeqSBAIJ, 1385f4259b30SLisandro Dalcin /* 44*/ NULL, 138649b5e25fSSatish Balay MatScale_SeqSBAIJ, 13877d68702bSBarry Smith MatShift_SeqSBAIJ, 1388f4259b30SLisandro Dalcin NULL, 13893bededecSBarry Smith MatZeroRowsColumns_SeqSBAIJ, 1390f4259b30SLisandro Dalcin /* 49*/ NULL, 139149b5e25fSSatish Balay MatGetRowIJ_SeqSBAIJ, 139249b5e25fSSatish Balay MatRestoreRowIJ_SeqSBAIJ, 1393f4259b30SLisandro Dalcin NULL, 1394f4259b30SLisandro Dalcin NULL, 1395f4259b30SLisandro Dalcin /* 54*/ NULL, 1396f4259b30SLisandro Dalcin NULL, 1397f4259b30SLisandro Dalcin NULL, 1398dc29a518SPierre Jolivet MatPermute_SeqSBAIJ, 139949b5e25fSSatish Balay MatSetValuesBlocked_SeqSBAIJ, 14007dae84e0SHong Zhang /* 59*/ MatCreateSubMatrix_SeqSBAIJ, 1401f4259b30SLisandro Dalcin NULL, 1402f4259b30SLisandro Dalcin NULL, 1403f4259b30SLisandro Dalcin NULL, 1404f4259b30SLisandro Dalcin NULL, 1405f4259b30SLisandro Dalcin /* 64*/ NULL, 1406f4259b30SLisandro Dalcin NULL, 1407f4259b30SLisandro Dalcin NULL, 1408f4259b30SLisandro Dalcin NULL, 1409f4259b30SLisandro Dalcin NULL, 1410d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqSBAIJ, 1411f4259b30SLisandro Dalcin NULL, 141228d58a37SPierre Jolivet MatConvert_MPISBAIJ_Basic, 1413f4259b30SLisandro Dalcin NULL, 1414f4259b30SLisandro Dalcin NULL, 1415f4259b30SLisandro Dalcin /* 74*/ NULL, 1416f4259b30SLisandro Dalcin NULL, 1417f4259b30SLisandro Dalcin NULL, 1418f4259b30SLisandro Dalcin NULL, 1419f4259b30SLisandro Dalcin NULL, 1420f4259b30SLisandro Dalcin /* 79*/ NULL, 1421f4259b30SLisandro Dalcin NULL, 1422f4259b30SLisandro Dalcin NULL, 142397304618SKris Buschelman MatGetInertia_SeqSBAIJ, 14245bba2384SShri Abhyankar MatLoad_SeqSBAIJ, 1425d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqSBAIJ, 1426865e5f61SKris Buschelman MatIsHermitian_SeqSBAIJ, 1427efcf0fc3SBarry Smith MatIsStructurallySymmetric_SeqSBAIJ, 1428f4259b30SLisandro Dalcin NULL, 1429f4259b30SLisandro Dalcin NULL, 1430f4259b30SLisandro Dalcin /* 89*/ NULL, 1431f4259b30SLisandro Dalcin NULL, 1432f4259b30SLisandro Dalcin NULL, 1433f4259b30SLisandro Dalcin NULL, 1434f4259b30SLisandro Dalcin NULL, 1435f4259b30SLisandro Dalcin /* 94*/ NULL, 1436f4259b30SLisandro Dalcin NULL, 1437f4259b30SLisandro Dalcin NULL, 1438f4259b30SLisandro Dalcin NULL, 1439f4259b30SLisandro Dalcin NULL, 1440f4259b30SLisandro Dalcin /* 99*/ NULL, 1441f4259b30SLisandro Dalcin NULL, 1442f4259b30SLisandro Dalcin NULL, 14432726fb6dSPierre Jolivet MatConjugate_SeqSBAIJ, 1444f4259b30SLisandro Dalcin NULL, 1445f4259b30SLisandro Dalcin /*104*/ NULL, 144699cafbc1SBarry Smith MatRealPart_SeqSBAIJ, 1447f5edf698SHong Zhang MatImaginaryPart_SeqSBAIJ, 1448f5edf698SHong Zhang MatGetRowUpperTriangular_SeqSBAIJ, 14492af78befSBarry Smith MatRestoreRowUpperTriangular_SeqSBAIJ, 1450f4259b30SLisandro Dalcin /*109*/ NULL, 1451f4259b30SLisandro Dalcin NULL, 1452f4259b30SLisandro Dalcin NULL, 1453f4259b30SLisandro Dalcin NULL, 1454547795f9SHong Zhang MatMissingDiagonal_SeqSBAIJ, 1455f4259b30SLisandro Dalcin /*114*/ NULL, 1456f4259b30SLisandro Dalcin NULL, 1457f4259b30SLisandro Dalcin NULL, 1458f4259b30SLisandro Dalcin NULL, 1459f4259b30SLisandro Dalcin NULL, 1460f4259b30SLisandro Dalcin /*119*/ NULL, 1461f4259b30SLisandro Dalcin NULL, 1462f4259b30SLisandro Dalcin NULL, 1463f4259b30SLisandro Dalcin NULL, 1464f4259b30SLisandro Dalcin NULL, 1465f4259b30SLisandro Dalcin /*124*/ NULL, 1466f4259b30SLisandro Dalcin NULL, 1467f4259b30SLisandro Dalcin NULL, 1468f4259b30SLisandro Dalcin NULL, 1469f4259b30SLisandro Dalcin NULL, 1470f4259b30SLisandro Dalcin /*129*/ NULL, 1471f4259b30SLisandro Dalcin NULL, 1472f4259b30SLisandro Dalcin NULL, 1473f4259b30SLisandro Dalcin NULL, 1474f4259b30SLisandro Dalcin NULL, 1475f4259b30SLisandro Dalcin /*134*/ NULL, 1476f4259b30SLisandro Dalcin NULL, 1477f4259b30SLisandro Dalcin NULL, 1478f4259b30SLisandro Dalcin NULL, 1479f4259b30SLisandro Dalcin NULL, 148046533700Sstefano_zampini /*139*/ MatSetBlockSizes_Default, 1481f4259b30SLisandro Dalcin NULL, 1482f4259b30SLisandro Dalcin NULL, 1483f4259b30SLisandro Dalcin NULL, 1484f4259b30SLisandro Dalcin NULL, 1485d70f29a3SPierre Jolivet /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ, 1486d70f29a3SPierre Jolivet NULL, 1487d70f29a3SPierre Jolivet NULL, 148899a7f59eSMark Adams NULL, 148999a7f59eSMark Adams NULL, 14907fb60732SBarry Smith NULL, 1491dec0b466SHong Zhang /*150*/ NULL, 1492dec0b466SHong Zhang NULL}; 1493be1d678aSKris Buschelman 1494d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat) 1495d71ae5a4SJacob Faibussowitsch { 14964afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1497d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 149849b5e25fSSatish Balay 149949b5e25fSSatish Balay PetscFunctionBegin; 150008401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 150149b5e25fSSatish Balay 150249b5e25fSSatish Balay /* allocate space for values if not already there */ 150348a46eb9SPierre Jolivet if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); 150449b5e25fSSatish Balay 150549b5e25fSSatish Balay /* copy values over */ 15069566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 15073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 150849b5e25fSSatish Balay } 150949b5e25fSSatish Balay 1510d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat) 1511d71ae5a4SJacob Faibussowitsch { 15124afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1513d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 151449b5e25fSSatish Balay 151549b5e25fSSatish Balay PetscFunctionBegin; 151608401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 151728b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 151849b5e25fSSatish Balay 151949b5e25fSSatish Balay /* copy values over */ 15209566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 15213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152249b5e25fSSatish Balay } 152349b5e25fSSatish Balay 1524d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B, PetscInt bs, PetscInt nz, PetscInt *nnz) 1525d71ae5a4SJacob Faibussowitsch { 1526c464158bSHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 15274dcd73b1SHong Zhang PetscInt i, mbs, nbs, bs2; 15282576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, flg = PETSC_FALSE, realalloc = PETSC_FALSE; 152949b5e25fSSatish Balay 153049b5e25fSSatish Balay PetscFunctionBegin; 15312576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 1532db4efbfdSBarry Smith 15339566063dSJacob Faibussowitsch PetscCall(MatSetBlockSize(B, PetscAbs(bs))); 15349566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 15359566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 153608401ef6SPierre Jolivet PetscCheck(B->rmap->N <= B->cmap->N, PETSC_COMM_SELF, PETSC_ERR_SUP, "SEQSBAIJ matrix cannot have more rows %" PetscInt_FMT " than columns %" PetscInt_FMT, B->rmap->N, B->cmap->N); 15379566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 1538899cda47SBarry Smith 153921940c7eSstefano_zampini B->preallocated = PETSC_TRUE; 154021940c7eSstefano_zampini 1541d0f46423SBarry Smith mbs = B->rmap->N / bs; 15424dcd73b1SHong Zhang nbs = B->cmap->n / bs; 154349b5e25fSSatish Balay bs2 = bs * bs; 154449b5e25fSSatish Balay 1545aed4548fSBarry Smith PetscCheck(mbs * bs == B->rmap->N && nbs * bs == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Number rows, cols must be divisible by blocksize"); 154649b5e25fSSatish Balay 1547ab93d7beSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 1548ab93d7beSBarry Smith skipallocation = PETSC_TRUE; 1549ab93d7beSBarry Smith nz = 0; 1550ab93d7beSBarry Smith } 1551ab93d7beSBarry Smith 1552435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3; 155308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 155449b5e25fSSatish Balay if (nnz) { 155549b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 155608401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 155708401ef6SPierre Jolivet PetscCheck(nnz[i] <= nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than block row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " block rowlength %" PetscInt_FMT, i, nnz[i], nbs); 155849b5e25fSSatish Balay } 155949b5e25fSSatish Balay } 156049b5e25fSSatish Balay 1561db4efbfdSBarry Smith B->ops->mult = MatMult_SeqSBAIJ_N; 1562db4efbfdSBarry Smith B->ops->multadd = MatMultAdd_SeqSBAIJ_N; 1563db4efbfdSBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_N; 1564db4efbfdSBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N; 156526fbe8dcSKarl Rupp 15669566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 156749b5e25fSSatish Balay if (!flg) { 156849b5e25fSSatish Balay switch (bs) { 156949b5e25fSSatish Balay case 1: 157049b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_1; 157149b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_1; 1572431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_1; 1573431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1; 157449b5e25fSSatish Balay break; 157549b5e25fSSatish Balay case 2: 157649b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_2; 157749b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_2; 1578431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_2; 1579431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2; 158049b5e25fSSatish Balay break; 158149b5e25fSSatish Balay case 3: 158249b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_3; 158349b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_3; 1584431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_3; 1585431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3; 158649b5e25fSSatish Balay break; 158749b5e25fSSatish Balay case 4: 158849b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_4; 158949b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_4; 1590431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_4; 1591431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4; 159249b5e25fSSatish Balay break; 159349b5e25fSSatish Balay case 5: 159449b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_5; 159549b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_5; 1596431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_5; 1597431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5; 159849b5e25fSSatish Balay break; 159949b5e25fSSatish Balay case 6: 160049b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_6; 160149b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_6; 1602431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_6; 1603431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6; 160449b5e25fSSatish Balay break; 160549b5e25fSSatish Balay case 7: 1606de53e5efSHong Zhang B->ops->mult = MatMult_SeqSBAIJ_7; 160749b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_7; 1608431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_7; 1609431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7; 161049b5e25fSSatish Balay break; 161149b5e25fSSatish Balay } 161249b5e25fSSatish Balay } 161349b5e25fSSatish Balay 161449b5e25fSSatish Balay b->mbs = mbs; 16154dcd73b1SHong Zhang b->nbs = nbs; 1616ab93d7beSBarry Smith if (!skipallocation) { 16172ee49352SLisandro Dalcin if (!b->imax) { 16189566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mbs, &b->imax, mbs, &b->ilen)); 161926fbe8dcSKarl Rupp 1620c760cd28SBarry Smith b->free_imax_ilen = PETSC_TRUE; 16212ee49352SLisandro Dalcin } 162249b5e25fSSatish Balay if (!nnz) { 1623435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 162449b5e25fSSatish Balay else if (nz <= 0) nz = 1; 16255d2a9ed1SStefano Zampini nz = PetscMin(nbs, nz); 162626fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->imax[i] = nz; 16279566063dSJacob Faibussowitsch PetscCall(PetscIntMultError(nz, mbs, &nz)); 162849b5e25fSSatish Balay } else { 1629c73702f5SBarry Smith PetscInt64 nz64 = 0; 16309371c9d4SSatish Balay for (i = 0; i < mbs; i++) { 16319371c9d4SSatish Balay b->imax[i] = nnz[i]; 16329371c9d4SSatish Balay nz64 += nnz[i]; 16339371c9d4SSatish Balay } 16349566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 163549b5e25fSSatish Balay } 16362ee49352SLisandro Dalcin /* b->ilen will count nonzeros in each block row so far. */ 163726fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->ilen[i] = 0; 16386c6c5352SBarry Smith /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */ 163949b5e25fSSatish Balay 164049b5e25fSSatish Balay /* allocate the matrix space */ 16419566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 16429566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &b->a, nz, &b->j, B->rmap->N + 1, &b->i)); 16439566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->a, nz * bs2)); 16449566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->j, nz)); 164526fbe8dcSKarl Rupp 164649b5e25fSSatish Balay b->singlemalloc = PETSC_TRUE; 164749b5e25fSSatish Balay 164849b5e25fSSatish Balay /* pointer to beginning of each row */ 1649e60cf9a0SBarry Smith b->i[0] = 0; 165026fbe8dcSKarl Rupp for (i = 1; i < mbs + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 165126fbe8dcSKarl Rupp 1652e6b907acSBarry Smith b->free_a = PETSC_TRUE; 1653e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 1654e811da20SHong Zhang } else { 1655e6b907acSBarry Smith b->free_a = PETSC_FALSE; 1656e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 1657ab93d7beSBarry Smith } 165849b5e25fSSatish Balay 165949b5e25fSSatish Balay b->bs2 = bs2; 16606c6c5352SBarry Smith b->nz = 0; 1661b32cb4a7SJed Brown b->maxnz = nz; 1662f4259b30SLisandro Dalcin b->inew = NULL; 1663f4259b30SLisandro Dalcin b->jnew = NULL; 1664f4259b30SLisandro Dalcin b->anew = NULL; 1665f4259b30SLisandro Dalcin b->a2anew = NULL; 16661a3463dfSHong Zhang b->permute = PETSC_FALSE; 1667cb7b82ddSBarry Smith 1668cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 1669cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 16709566063dSJacob Faibussowitsch if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 16713ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1672c464158bSHong Zhang } 1673153ea458SHong Zhang 1674d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B, PetscInt bs, const PetscInt ii[], const PetscInt jj[], const PetscScalar V[]) 1675d71ae5a4SJacob Faibussowitsch { 16760cd7f59aSBarry Smith PetscInt i, j, m, nz, anz, nz_max = 0, *nnz; 1677f4259b30SLisandro Dalcin PetscScalar *values = NULL; 167838f409ebSLisandro Dalcin PetscBool roworiented = ((Mat_SeqSBAIJ *)B->data)->roworiented; 16790cd7f59aSBarry Smith 168038f409ebSLisandro Dalcin PetscFunctionBegin; 168108401ef6SPierre Jolivet PetscCheck(bs >= 1, PetscObjectComm((PetscObject)B), PETSC_ERR_ARG_OUTOFRANGE, "Invalid block size specified, must be positive but it is %" PetscInt_FMT, bs); 16829566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->rmap, bs)); 16839566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->cmap, bs)); 16849566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 16859566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 16869566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 168738f409ebSLisandro Dalcin m = B->rmap->n / bs; 168838f409ebSLisandro Dalcin 1689aed4548fSBarry Smith PetscCheck(!ii[0], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "ii[0] must be 0 but it is %" PetscInt_FMT, ii[0]); 16909566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 169138f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 169238f409ebSLisandro Dalcin nz = ii[i + 1] - ii[i]; 169308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 16940cd7f59aSBarry Smith anz = 0; 16950cd7f59aSBarry Smith for (j = 0; j < nz; j++) { 16960cd7f59aSBarry Smith /* count only values on the diagonal or above */ 16970cd7f59aSBarry Smith if (jj[ii[i] + j] >= i) { 16980cd7f59aSBarry Smith anz = nz - j; 16990cd7f59aSBarry Smith break; 17000cd7f59aSBarry Smith } 17010cd7f59aSBarry Smith } 17020cd7f59aSBarry Smith nz_max = PetscMax(nz_max, anz); 17030cd7f59aSBarry Smith nnz[i] = anz; 170438f409ebSLisandro Dalcin } 17059566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 17069566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 170738f409ebSLisandro Dalcin 170838f409ebSLisandro Dalcin values = (PetscScalar *)V; 170948a46eb9SPierre Jolivet if (!values) PetscCall(PetscCalloc1(bs * bs * nz_max, &values)); 171038f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 171138f409ebSLisandro Dalcin PetscInt ncols = ii[i + 1] - ii[i]; 171238f409ebSLisandro Dalcin const PetscInt *icols = jj + ii[i]; 171338f409ebSLisandro Dalcin if (!roworiented || bs == 1) { 171438f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * ii[i]) : 0); 17159566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, ncols, icols, svals, INSERT_VALUES)); 171638f409ebSLisandro Dalcin } else { 171738f409ebSLisandro Dalcin for (j = 0; j < ncols; j++) { 171838f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * (ii[i] + j)) : 0); 17199566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, 1, &icols[j], svals, INSERT_VALUES)); 172038f409ebSLisandro Dalcin } 172138f409ebSLisandro Dalcin } 172238f409ebSLisandro Dalcin } 17239566063dSJacob Faibussowitsch if (!V) PetscCall(PetscFree(values)); 17249566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 17259566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 17269566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 17273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172838f409ebSLisandro Dalcin } 172938f409ebSLisandro Dalcin 1730db4efbfdSBarry Smith /* 1731db4efbfdSBarry Smith This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization 1732db4efbfdSBarry Smith */ 1733d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B, PetscBool natural) 1734d71ae5a4SJacob Faibussowitsch { 1735ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 1736db4efbfdSBarry Smith PetscInt bs = B->rmap->bs; 1737db4efbfdSBarry Smith 1738db4efbfdSBarry Smith PetscFunctionBegin; 17399566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 1740db4efbfdSBarry Smith if (flg) bs = 8; 1741db4efbfdSBarry Smith 1742db4efbfdSBarry Smith if (!natural) { 1743db4efbfdSBarry Smith switch (bs) { 1744d71ae5a4SJacob Faibussowitsch case 1: 1745d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace; 1746d71ae5a4SJacob Faibussowitsch break; 1747d71ae5a4SJacob Faibussowitsch case 2: 1748d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2; 1749d71ae5a4SJacob Faibussowitsch break; 1750d71ae5a4SJacob Faibussowitsch case 3: 1751d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3; 1752d71ae5a4SJacob Faibussowitsch break; 1753d71ae5a4SJacob Faibussowitsch case 4: 1754d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4; 1755d71ae5a4SJacob Faibussowitsch break; 1756d71ae5a4SJacob Faibussowitsch case 5: 1757d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5; 1758d71ae5a4SJacob Faibussowitsch break; 1759d71ae5a4SJacob Faibussowitsch case 6: 1760d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6; 1761d71ae5a4SJacob Faibussowitsch break; 1762d71ae5a4SJacob Faibussowitsch case 7: 1763d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7; 1764d71ae5a4SJacob Faibussowitsch break; 1765d71ae5a4SJacob Faibussowitsch default: 1766d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N; 1767d71ae5a4SJacob Faibussowitsch break; 1768db4efbfdSBarry Smith } 1769db4efbfdSBarry Smith } else { 1770db4efbfdSBarry Smith switch (bs) { 1771d71ae5a4SJacob Faibussowitsch case 1: 1772d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace; 1773d71ae5a4SJacob Faibussowitsch break; 1774d71ae5a4SJacob Faibussowitsch case 2: 1775d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering; 1776d71ae5a4SJacob Faibussowitsch break; 1777d71ae5a4SJacob Faibussowitsch case 3: 1778d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering; 1779d71ae5a4SJacob Faibussowitsch break; 1780d71ae5a4SJacob Faibussowitsch case 4: 1781d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering; 1782d71ae5a4SJacob Faibussowitsch break; 1783d71ae5a4SJacob Faibussowitsch case 5: 1784d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering; 1785d71ae5a4SJacob Faibussowitsch break; 1786d71ae5a4SJacob Faibussowitsch case 6: 1787d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering; 1788d71ae5a4SJacob Faibussowitsch break; 1789d71ae5a4SJacob Faibussowitsch case 7: 1790d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering; 1791d71ae5a4SJacob Faibussowitsch break; 1792d71ae5a4SJacob Faibussowitsch default: 1793d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering; 1794d71ae5a4SJacob Faibussowitsch break; 1795db4efbfdSBarry Smith } 1796db4efbfdSBarry Smith } 17973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1798db4efbfdSBarry Smith } 1799db4efbfdSBarry Smith 1800cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType, MatReuse, Mat *); 1801cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType, MatReuse, Mat *); 1802d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatFactorGetSolverType_petsc(Mat A, MatSolverType *type) 1803d71ae5a4SJacob Faibussowitsch { 18044ac6704cSBarry Smith PetscFunctionBegin; 18054ac6704cSBarry Smith *type = MATSOLVERPETSC; 18063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18074ac6704cSBarry Smith } 1808d769727bSBarry Smith 1809d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A, MatFactorType ftype, Mat *B) 1810d71ae5a4SJacob Faibussowitsch { 1811d0f46423SBarry Smith PetscInt n = A->rmap->n; 18125c9eb25fSBarry Smith 18135c9eb25fSBarry Smith PetscFunctionBegin; 18140e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX) 1815b94d7dedSBarry Smith PetscCheck(A->hermitian != PETSC_BOOL3_TRUE || A->symmetric == PETSC_BOOL3_TRUE || (ftype != MAT_FACTOR_CHOLESKY && ftype != MAT_FACTOR_ICC), PETSC_COMM_SELF, PETSC_ERR_SUP, "Hermitian CHOLESKY or ICC Factor is not supported"); 18160e92d65fSHong Zhang #endif 1817eb1ec7c1SStefano Zampini 18189566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 18199566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, n, n, n, n)); 18205c9eb25fSBarry Smith if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) { 18219566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATSEQSBAIJ)); 18229566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*B, A->rmap->bs, MAT_SKIP_ALLOCATION, NULL)); 182326fbe8dcSKarl Rupp 18247b056e98SHong Zhang (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ; 1825c6d0d4f0SHong Zhang (*B)->ops->iccfactorsymbolic = MatICCFactorSymbolic_SeqSBAIJ; 18269566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_CHOLESKY])); 18279566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_ICC])); 1828e32f2f54SBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "Factor type not supported"); 182900c67f3bSHong Zhang 1830d5f3da31SBarry Smith (*B)->factortype = ftype; 1831f73b0415SBarry Smith (*B)->canuseordering = PETSC_TRUE; 18329566063dSJacob Faibussowitsch PetscCall(PetscFree((*B)->solvertype)); 18339566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &(*B)->solvertype)); 18349566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)*B, "MatFactorGetSolverType_C", MatFactorGetSolverType_petsc)); 18353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18365c9eb25fSBarry Smith } 18375c9eb25fSBarry Smith 18388397e458SBarry Smith /*@C 183911a5261eSBarry Smith MatSeqSBAIJGetArray - gives access to the array where the data for a `MATSEQSBAIJ` matrix is stored 18408397e458SBarry Smith 18418397e458SBarry Smith Not Collective 18428397e458SBarry Smith 18438397e458SBarry Smith Input Parameter: 184411a5261eSBarry Smith . mat - a `MATSEQSBAIJ` matrix 18458397e458SBarry Smith 18468397e458SBarry Smith Output Parameter: 18478397e458SBarry Smith . array - pointer to the data 18488397e458SBarry Smith 18498397e458SBarry Smith Level: intermediate 18508397e458SBarry Smith 185111a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatSeqSBAIJRestoreArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18528397e458SBarry Smith @*/ 1853d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJGetArray(Mat A, PetscScalar **array) 1854d71ae5a4SJacob Faibussowitsch { 18558397e458SBarry Smith PetscFunctionBegin; 1856cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJGetArray_C", (Mat, PetscScalar **), (A, array)); 18573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18588397e458SBarry Smith } 18598397e458SBarry Smith 18608397e458SBarry Smith /*@C 186111a5261eSBarry Smith MatSeqSBAIJRestoreArray - returns access to the array where the data for a `MATSEQSBAIJ` matrix is stored obtained by `MatSeqSBAIJGetArray()` 18628397e458SBarry Smith 18638397e458SBarry Smith Not Collective 18648397e458SBarry Smith 18658397e458SBarry Smith Input Parameters: 1866a2b725a8SWilliam Gropp + mat - a MATSEQSBAIJ matrix 1867a2b725a8SWilliam Gropp - array - pointer to the data 18688397e458SBarry Smith 18698397e458SBarry Smith Level: intermediate 18708397e458SBarry Smith 187111a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatSeqSBAIJGetArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18728397e458SBarry Smith @*/ 1873d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJRestoreArray(Mat A, PetscScalar **array) 1874d71ae5a4SJacob Faibussowitsch { 18758397e458SBarry Smith PetscFunctionBegin; 1876cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJRestoreArray_C", (Mat, PetscScalar **), (A, array)); 18773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18788397e458SBarry Smith } 18798397e458SBarry Smith 18800bad9183SKris Buschelman /*MC 1881fafad747SKris Buschelman MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices, 18820bad9183SKris Buschelman based on block compressed sparse row format. Only the upper triangular portion of the matrix is stored. 18830bad9183SKris Buschelman 1884828413b8SBarry Smith For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you 188511a5261eSBarry Smith can call `MatSetOption`(`Mat`, `MAT_HERMITIAN`). 1886828413b8SBarry Smith 18870bad9183SKris Buschelman Options Database Keys: 188811a5261eSBarry Smith . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to `MatSetFromOptions()` 18890bad9183SKris Buschelman 189095452b02SPatrick Sanan Notes: 189195452b02SPatrick Sanan By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not 189211a5261eSBarry Smith stored and it is assumed they symmetric to the upper triangular). If you call `MatSetOption`(`Mat`,`MAT_IGNORE_LOWER_TRIANGULAR`,`PETSC_FALSE`) or use 189371dad5bbSBarry Smith the options database -mat_ignore_lower_triangular false it will generate an error if you try to set a value in the lower triangular portion. 189471dad5bbSBarry Smith 1895476417e5SBarry Smith The number of rows in the matrix must be less than or equal to the number of columns 189671dad5bbSBarry Smith 18970bad9183SKris Buschelman Level: beginner 18980bad9183SKris Buschelman 189911a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreateSeqSBAIJ()`, `MatType`, `MATMPISBAIJ` 19000bad9183SKris Buschelman M*/ 1901d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B) 1902d71ae5a4SJacob Faibussowitsch { 1903a23d5eceSKris Buschelman Mat_SeqSBAIJ *b; 190413f74950SBarry Smith PetscMPIInt size; 1905ace3abfcSBarry Smith PetscBool no_unroll = PETSC_FALSE, no_inode = PETSC_FALSE; 1906a23d5eceSKris Buschelman 1907a23d5eceSKris Buschelman PetscFunctionBegin; 19089566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 190908401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Comm must be of size 1"); 1910a23d5eceSKris Buschelman 19114dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 1912a23d5eceSKris Buschelman B->data = (void *)b; 19139566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 191426fbe8dcSKarl Rupp 1915a23d5eceSKris Buschelman B->ops->destroy = MatDestroy_SeqSBAIJ; 1916a23d5eceSKris Buschelman B->ops->view = MatView_SeqSBAIJ; 1917f4259b30SLisandro Dalcin b->row = NULL; 1918f4259b30SLisandro Dalcin b->icol = NULL; 1919a23d5eceSKris Buschelman b->reallocs = 0; 1920f4259b30SLisandro Dalcin b->saved_values = NULL; 19210def2e27SBarry Smith b->inode.limit = 5; 19220def2e27SBarry Smith b->inode.max_limit = 5; 1923a23d5eceSKris Buschelman 1924a23d5eceSKris Buschelman b->roworiented = PETSC_TRUE; 1925a23d5eceSKris Buschelman b->nonew = 0; 1926f4259b30SLisandro Dalcin b->diag = NULL; 1927f4259b30SLisandro Dalcin b->solve_work = NULL; 1928f4259b30SLisandro Dalcin b->mult_work = NULL; 1929f4259b30SLisandro Dalcin B->spptr = NULL; 1930f2cbd3d5SJed Brown B->info.nz_unneeded = (PetscReal)b->maxnz * b->bs2; 1931a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 1932a23d5eceSKris Buschelman 1933f4259b30SLisandro Dalcin b->inew = NULL; 1934f4259b30SLisandro Dalcin b->jnew = NULL; 1935f4259b30SLisandro Dalcin b->anew = NULL; 1936f4259b30SLisandro Dalcin b->a2anew = NULL; 1937a23d5eceSKris Buschelman b->permute = PETSC_FALSE; 1938a23d5eceSKris Buschelman 193971dad5bbSBarry Smith b->ignore_ltriangular = PETSC_TRUE; 194026fbe8dcSKarl Rupp 19419566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_ignore_lower_triangular", &b->ignore_ltriangular, NULL)); 1942941593c8SHong Zhang 1943f5edf698SHong Zhang b->getrow_utriangular = PETSC_FALSE; 194426fbe8dcSKarl Rupp 19459566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_getrow_uppertriangular", &b->getrow_utriangular, NULL)); 1946f5edf698SHong Zhang 19479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJGetArray_C", MatSeqSBAIJGetArray_SeqSBAIJ)); 19489566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJRestoreArray_C", MatSeqSBAIJRestoreArray_SeqSBAIJ)); 19499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqSBAIJ)); 19509566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqSBAIJ)); 19519566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetColumnIndices_C", MatSeqSBAIJSetColumnIndices_SeqSBAIJ)); 19529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqaij_C", MatConvert_SeqSBAIJ_SeqAIJ)); 19539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqbaij_C", MatConvert_SeqSBAIJ_SeqBAIJ)); 19549566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocation_C", MatSeqSBAIJSetPreallocation_SeqSBAIJ)); 19559566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocationCSR_C", MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ)); 19566214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 19579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_elemental_C", MatConvert_SeqSBAIJ_Elemental)); 19586214f412SHong Zhang #endif 1959d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 19609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_scalapack_C", MatConvert_SBAIJ_ScaLAPACK)); 1961d24d4204SJose E. Roman #endif 196223ce1328SBarry Smith 1963b94d7dedSBarry Smith B->symmetry_eternal = PETSC_TRUE; 1964b94d7dedSBarry Smith B->structural_symmetry_eternal = PETSC_TRUE; 1965b94d7dedSBarry Smith B->symmetric = PETSC_BOOL3_TRUE; 1966b94d7dedSBarry Smith B->structurally_symmetric = PETSC_BOOL3_TRUE; 1967eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 1968b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_FALSE; 1969eb1ec7c1SStefano Zampini #else 1970b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_TRUE; 1971eb1ec7c1SStefano Zampini #endif 197213647f61SHong Zhang 19739566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQSBAIJ)); 19740def2e27SBarry Smith 1975d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)B), ((PetscObject)B)->prefix, "Options for SEQSBAIJ matrix", "Mat"); 19769566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_unroll", "Do not optimize for inodes (slower)", NULL, no_unroll, &no_unroll, NULL)); 197748a46eb9SPierre Jolivet if (no_unroll) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_unroll\n")); 19789566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_inode", "Do not optimize for inodes (slower)", NULL, no_inode, &no_inode, NULL)); 19799566063dSJacob Faibussowitsch if (no_inode) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_inode\n")); 19809566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-mat_inode_limit", "Do not use inodes larger then this value", NULL, b->inode.limit, &b->inode.limit, NULL)); 1981d0609cedSBarry Smith PetscOptionsEnd(); 1982ace3abfcSBarry Smith b->inode.use = (PetscBool)(!(no_unroll || no_inode)); 19830def2e27SBarry Smith if (b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit; 19843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1985a23d5eceSKris Buschelman } 1986a23d5eceSKris Buschelman 1987a23d5eceSKris Buschelman /*@C 1988a23d5eceSKris Buschelman MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block 198911a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 1990a23d5eceSKris Buschelman user should preallocate the matrix storage by setting the parameter nz 1991a23d5eceSKris Buschelman (or the array nnz). By setting these parameters accurately, performance 1992a23d5eceSKris Buschelman during matrix assembly can be increased by more than a factor of 50. 1993a23d5eceSKris Buschelman 1994c3339decSBarry Smith Collective 1995a23d5eceSKris Buschelman 1996a23d5eceSKris Buschelman Input Parameters: 19971c4f3114SJed Brown + B - the symmetric matrix 199811a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 199911a5261eSBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()` 2000a23d5eceSKris Buschelman . nz - number of block nonzeros per block row (same for all rows) 2001a23d5eceSKris Buschelman - nnz - array containing the number of block nonzeros in the upper triangular plus 20020298fd71SBarry Smith diagonal portion of each block (possibly different for each block row) or NULL 2003a23d5eceSKris Buschelman 2004a23d5eceSKris Buschelman Options Database Keys: 2005a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2006a23d5eceSKris Buschelman block calculations (much slower) 2007a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use (only works if a negative bs is passed in 2008a23d5eceSKris Buschelman 2009a23d5eceSKris Buschelman Level: intermediate 2010a23d5eceSKris Buschelman 2011a23d5eceSKris Buschelman Notes: 2012a23d5eceSKris Buschelman Specify the preallocated storage with either nz or nnz (not both). 201311a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 2014651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2015a23d5eceSKris Buschelman 201611a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 2017aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 2018aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 2019aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 2020aa95bbe8SBarry Smith 202149a6f317SBarry Smith If the nnz parameter is given then the nz parameter is ignored 202249a6f317SBarry Smith 2023651615e1SBarry Smith .seealso: [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2024a23d5eceSKris Buschelman @*/ 2025d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 2026d71ae5a4SJacob Faibussowitsch { 2027a23d5eceSKris Buschelman PetscFunctionBegin; 20286ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 20296ba663aaSJed Brown PetscValidType(B, 1); 20306ba663aaSJed Brown PetscValidLogicalCollectiveInt(B, bs, 2); 2031cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocation_C", (Mat, PetscInt, PetscInt, const PetscInt[]), (B, bs, nz, nnz)); 20323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2033a23d5eceSKris Buschelman } 203449b5e25fSSatish Balay 203538f409ebSLisandro Dalcin /*@C 203611a5261eSBarry Smith MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in `MATSEQSBAIJ` format using the given nonzero structure and (optional) numerical values 203738f409ebSLisandro Dalcin 203838f409ebSLisandro Dalcin Input Parameters: 20391c4f3114SJed Brown + B - the matrix 2040eab78319SHong Zhang . bs - size of block, the blocks are ALWAYS square. 204138f409ebSLisandro Dalcin . i - the indices into j for the start of each local row (starts with zero) 204238f409ebSLisandro Dalcin . j - the column indices for each local row (starts with zero) these must be sorted for each row 204338f409ebSLisandro Dalcin - v - optional values in the matrix 204438f409ebSLisandro Dalcin 2045664954b6SBarry Smith Level: advanced 204638f409ebSLisandro Dalcin 204738f409ebSLisandro Dalcin Notes: 204811a5261eSBarry Smith The order of the entries in values is specified by the `MatOption` `MAT_ROW_ORIENTED`. For example, C programs 204911a5261eSBarry Smith may want to use the default `MAT_ROW_ORIENTED` = `PETSC_TRUE` and use an array v[nnz][bs][bs] where the second index is 205038f409ebSLisandro Dalcin over rows within a block and the last index is over columns within a block row. Fortran programs will likely set 205111a5261eSBarry Smith `MAT_ROW_ORIENTED` = `PETSC_FALSE` and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a 205238f409ebSLisandro Dalcin block column and the second index is over columns within a block. 205338f409ebSLisandro Dalcin 205450c5228eSBarry Smith Any entries below the diagonal are ignored 20550cd7f59aSBarry Smith 20560cd7f59aSBarry Smith Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries 20570cd7f59aSBarry Smith and usually the numerical values as well 2058664954b6SBarry Smith 205911a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqSBAIJ()`, `MatSetValuesBlocked()`, `MatSeqSBAIJSetPreallocation()`, `MATSEQSBAIJ` 206038f409ebSLisandro Dalcin @*/ 2061d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B, PetscInt bs, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 2062d71ae5a4SJacob Faibussowitsch { 206338f409ebSLisandro Dalcin PetscFunctionBegin; 206438f409ebSLisandro Dalcin PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 206538f409ebSLisandro Dalcin PetscValidType(B, 1); 206638f409ebSLisandro Dalcin PetscValidLogicalCollectiveInt(B, bs, 2); 2067cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocationCSR_C", (Mat, PetscInt, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, bs, i, j, v)); 20683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 206938f409ebSLisandro Dalcin } 207038f409ebSLisandro Dalcin 2071c464158bSHong Zhang /*@C 2072c464158bSHong Zhang MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in block AIJ (block 207311a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 2074c464158bSHong Zhang user should preallocate the matrix storage by setting the parameter nz 2075c464158bSHong Zhang (or the array nnz). By setting these parameters accurately, performance 2076c464158bSHong Zhang during matrix assembly can be increased by more than a factor of 50. 207749b5e25fSSatish Balay 2078d083f849SBarry Smith Collective 2079c464158bSHong Zhang 2080c464158bSHong Zhang Input Parameters: 208111a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 208211a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 2083bb7ae925SBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs() 2084c464158bSHong Zhang . m - number of rows, or number of columns 2085c464158bSHong Zhang . nz - number of block nonzeros per block row (same for all rows) 2086744e8345SSatish Balay - nnz - array containing the number of block nonzeros in the upper triangular plus 20870298fd71SBarry Smith diagonal portion of each block (possibly different for each block row) or NULL 2088c464158bSHong Zhang 2089c464158bSHong Zhang Output Parameter: 2090c464158bSHong Zhang . A - the symmetric matrix 2091c464158bSHong Zhang 2092c464158bSHong Zhang Options Database Keys: 2093a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2094c464158bSHong Zhang block calculations (much slower) 2095a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use 2096c464158bSHong Zhang 2097c464158bSHong Zhang Level: intermediate 2098c464158bSHong Zhang 209911a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 2100f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 210111a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 2102175b88e8SBarry Smith 2103c464158bSHong Zhang Notes: 21046d6d819aSHong Zhang The number of rows and columns must be divisible by blocksize. 21056d6d819aSHong Zhang This matrix type does not support complex Hermitian operation. 2106c464158bSHong Zhang 2107c464158bSHong Zhang Specify the preallocated storage with either nz or nnz (not both). 210811a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 2109651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2110c464158bSHong Zhang 211149a6f317SBarry Smith If the nnz parameter is given then the nz parameter is ignored 211249a6f317SBarry Smith 2113651615e1SBarry Smith .seealso: [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2114c464158bSHong Zhang @*/ 2115d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 2116d71ae5a4SJacob Faibussowitsch { 2117c464158bSHong Zhang PetscFunctionBegin; 21189566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 21199566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 21209566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQSBAIJ)); 21219566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*A, bs, nz, (PetscInt *)nnz)); 21223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 212349b5e25fSSatish Balay } 212449b5e25fSSatish Balay 2125d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 2126d71ae5a4SJacob Faibussowitsch { 212749b5e25fSSatish Balay Mat C; 212849b5e25fSSatish Balay Mat_SeqSBAIJ *c, *a = (Mat_SeqSBAIJ *)A->data; 2129b40805acSSatish Balay PetscInt i, mbs = a->mbs, nz = a->nz, bs2 = a->bs2; 213049b5e25fSSatish Balay 213149b5e25fSSatish Balay PetscFunctionBegin; 213208401ef6SPierre Jolivet PetscCheck(a->i[mbs] == nz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Corrupt matrix"); 213349b5e25fSSatish Balay 2134f4259b30SLisandro Dalcin *B = NULL; 21359566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 21369566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->rmap->N, A->cmap->n, A->rmap->N, A->cmap->n)); 21379566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, A)); 21389566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATSEQSBAIJ)); 2139692f9cbeSHong Zhang c = (Mat_SeqSBAIJ *)C->data; 2140692f9cbeSHong Zhang 2141273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2142d5f3da31SBarry Smith C->factortype = A->factortype; 2143f4259b30SLisandro Dalcin c->row = NULL; 2144f4259b30SLisandro Dalcin c->icol = NULL; 2145f4259b30SLisandro Dalcin c->saved_values = NULL; 2146a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 214749b5e25fSSatish Balay C->assembled = PETSC_TRUE; 214849b5e25fSSatish Balay 21499566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 21509566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 215149b5e25fSSatish Balay c->bs2 = a->bs2; 215249b5e25fSSatish Balay c->mbs = a->mbs; 215349b5e25fSSatish Balay c->nbs = a->nbs; 215449b5e25fSSatish Balay 2155c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2156c760cd28SBarry Smith c->imax = a->imax; 2157c760cd28SBarry Smith c->ilen = a->ilen; 2158c760cd28SBarry Smith c->free_imax_ilen = PETSC_FALSE; 2159c760cd28SBarry Smith } else { 21609566063dSJacob Faibussowitsch PetscCall(PetscMalloc2((mbs + 1), &c->imax, (mbs + 1), &c->ilen)); 216149b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 216249b5e25fSSatish Balay c->imax[i] = a->imax[i]; 216349b5e25fSSatish Balay c->ilen[i] = a->ilen[i]; 216449b5e25fSSatish Balay } 2165c760cd28SBarry Smith c->free_imax_ilen = PETSC_TRUE; 2166c760cd28SBarry Smith } 216749b5e25fSSatish Balay 216849b5e25fSSatish Balay /* allocate the matrix space */ 21694da8f245SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 21709566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2 * nz, &c->a)); 217144e1c64aSLisandro Dalcin c->i = a->i; 217244e1c64aSLisandro Dalcin c->j = a->j; 21734da8f245SBarry Smith c->singlemalloc = PETSC_FALSE; 217444e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21754da8f245SBarry Smith c->free_ij = PETSC_FALSE; 21764da8f245SBarry Smith c->parent = A; 21779566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)A)); 21789566063dSJacob Faibussowitsch PetscCall(MatSetOption(A, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21799566063dSJacob Faibussowitsch PetscCall(MatSetOption(C, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21804da8f245SBarry Smith } else { 21819566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &c->a, nz, &c->j, mbs + 1, &c->i)); 21829566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, mbs + 1)); 21834da8f245SBarry Smith c->singlemalloc = PETSC_TRUE; 218444e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21854da8f245SBarry Smith c->free_ij = PETSC_TRUE; 21864da8f245SBarry Smith } 218749b5e25fSSatish Balay if (mbs > 0) { 218848a46eb9SPierre Jolivet if (cpvalues != MAT_SHARE_NONZERO_PATTERN) PetscCall(PetscArraycpy(c->j, a->j, nz)); 218949b5e25fSSatish Balay if (cpvalues == MAT_COPY_VALUES) { 21909566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, a->a, bs2 * nz)); 219149b5e25fSSatish Balay } else { 21929566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, bs2 * nz)); 219349b5e25fSSatish Balay } 2194a1c3900fSBarry Smith if (a->jshort) { 219544e1c64aSLisandro Dalcin /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */ 219644e1c64aSLisandro Dalcin /* if the parent matrix is reassembled, this child matrix will never notice */ 21979566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &c->jshort)); 21989566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->jshort, a->jshort, nz)); 219926fbe8dcSKarl Rupp 22004da8f245SBarry Smith c->free_jshort = PETSC_TRUE; 22014da8f245SBarry Smith } 2202a1c3900fSBarry Smith } 220349b5e25fSSatish Balay 220449b5e25fSSatish Balay c->roworiented = a->roworiented; 220549b5e25fSSatish Balay c->nonew = a->nonew; 220649b5e25fSSatish Balay 220749b5e25fSSatish Balay if (a->diag) { 2208c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2209c760cd28SBarry Smith c->diag = a->diag; 2210c760cd28SBarry Smith c->free_diag = PETSC_FALSE; 2211c760cd28SBarry Smith } else { 22129566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mbs, &c->diag)); 221326fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) c->diag[i] = a->diag[i]; 2214c760cd28SBarry Smith c->free_diag = PETSC_TRUE; 2215c760cd28SBarry Smith } 221644e1c64aSLisandro Dalcin } 22176c6c5352SBarry Smith c->nz = a->nz; 2218f2cbd3d5SJed Brown c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 2219f4259b30SLisandro Dalcin c->solve_work = NULL; 2220f4259b30SLisandro Dalcin c->mult_work = NULL; 222126fbe8dcSKarl Rupp 222249b5e25fSSatish Balay *B = C; 22239566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 22243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 222549b5e25fSSatish Balay } 222649b5e25fSSatish Balay 2227618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */ 2228618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary 2229618cc2edSLisandro Dalcin 2230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqSBAIJ(Mat mat, PetscViewer viewer) 2231d71ae5a4SJacob Faibussowitsch { 22327f489da9SVaclav Hapla PetscBool isbinary; 22332f480046SShri Abhyankar 22342f480046SShri Abhyankar PetscFunctionBegin; 22359566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 223628b400f6SJacob Faibussowitsch PetscCheck(isbinary, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)mat)->type_name); 22379566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqSBAIJ_Binary(mat, viewer)); 22383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22392f480046SShri Abhyankar } 22402f480046SShri Abhyankar 2241c75a6043SHong Zhang /*@ 224211a5261eSBarry Smith MatCreateSeqSBAIJWithArrays - Creates an sequential `MATSEQSBAIJ` matrix using matrix elements 2243c75a6043SHong Zhang (upper triangular entries in CSR format) provided by the user. 2244c75a6043SHong Zhang 2245d083f849SBarry Smith Collective 2246c75a6043SHong Zhang 2247c75a6043SHong Zhang Input Parameters: 2248c75a6043SHong Zhang + comm - must be an MPI communicator of size 1 2249c75a6043SHong Zhang . bs - size of block 2250c75a6043SHong Zhang . m - number of rows 2251c75a6043SHong Zhang . n - number of columns 2252483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that row block row of the matrix 2253c75a6043SHong Zhang . j - column indices 2254c75a6043SHong Zhang - a - matrix values 2255c75a6043SHong Zhang 2256c75a6043SHong Zhang Output Parameter: 2257c75a6043SHong Zhang . mat - the matrix 2258c75a6043SHong Zhang 2259dfb205c3SBarry Smith Level: advanced 2260c75a6043SHong Zhang 2261c75a6043SHong Zhang Notes: 2262c75a6043SHong Zhang The i, j, and a arrays are not copied by this routine, the user must free these arrays 2263c75a6043SHong Zhang once the matrix is destroyed 2264c75a6043SHong Zhang 2265c75a6043SHong Zhang You cannot set new nonzero locations into this matrix, that will generate an error. 2266c75a6043SHong Zhang 2267c75a6043SHong Zhang The i and j indices are 0 based 2268c75a6043SHong Zhang 226911a5261eSBarry Smith When block size is greater than 1 the matrix values must be stored using the SBAIJ storage format (see the SBAIJ source code to determine this). For block size of 1 2270dfb205c3SBarry Smith it is the regular CSR format excluding the lower triangular elements. 2271dfb205c3SBarry Smith 227211a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSBAIJ()`, `MatCreateSeqSBAIJ()` 2273c75a6043SHong Zhang @*/ 2274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 2275d71ae5a4SJacob Faibussowitsch { 2276c75a6043SHong Zhang PetscInt ii; 2277c75a6043SHong Zhang Mat_SeqSBAIJ *sbaij; 2278c75a6043SHong Zhang 2279c75a6043SHong Zhang PetscFunctionBegin; 228008401ef6SPierre Jolivet PetscCheck(bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "block size %" PetscInt_FMT " > 1 is not supported yet", bs); 2281aed4548fSBarry Smith PetscCheck(m == 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 2282c75a6043SHong Zhang 22839566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 22849566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 22859566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQSBAIJ)); 22869566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*mat, bs, MAT_SKIP_ALLOCATION, NULL)); 2287c75a6043SHong Zhang sbaij = (Mat_SeqSBAIJ *)(*mat)->data; 22889566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(m, &sbaij->imax, m, &sbaij->ilen)); 2289c75a6043SHong Zhang 2290c75a6043SHong Zhang sbaij->i = i; 2291c75a6043SHong Zhang sbaij->j = j; 2292c75a6043SHong Zhang sbaij->a = a; 229326fbe8dcSKarl Rupp 2294c75a6043SHong Zhang sbaij->singlemalloc = PETSC_FALSE; 2295c75a6043SHong Zhang sbaij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 2296e6b907acSBarry Smith sbaij->free_a = PETSC_FALSE; 2297e6b907acSBarry Smith sbaij->free_ij = PETSC_FALSE; 2298ddf7884eSMatthew Knepley sbaij->free_imax_ilen = PETSC_TRUE; 2299c75a6043SHong Zhang 2300c75a6043SHong Zhang for (ii = 0; ii < m; ii++) { 2301c75a6043SHong Zhang sbaij->ilen[ii] = sbaij->imax[ii] = i[ii + 1] - i[ii]; 23026bdcaf15SBarry Smith PetscCheck(i[ii + 1] >= i[ii], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 2303c75a6043SHong Zhang } 230476bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 2305c75a6043SHong Zhang for (ii = 0; ii < sbaij->i[m]; ii++) { 23066bdcaf15SBarry Smith PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 23076bdcaf15SBarry Smith PetscCheck(j[ii] < n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index too large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 2308c75a6043SHong Zhang } 230976bd3646SJed Brown } 2310c75a6043SHong Zhang 23119566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 23129566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 23133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2314c75a6043SHong Zhang } 2315d06b337dSHong Zhang 2316d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 2317d71ae5a4SJacob Faibussowitsch { 231859f5e6ceSHong Zhang PetscFunctionBegin; 23199566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm, inmat, n, scall, outmat)); 23203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 232159f5e6ceSHong Zhang } 2322