149b5e25fSSatish Balay 249b5e25fSSatish Balay /* 3a1373b80SHong Zhang Defines the basic matrix operations for the SBAIJ (compressed row) 449b5e25fSSatish Balay matrix storage format. 549b5e25fSSatish Balay */ 6c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 8c6db04a5SJed Brown #include <petscblaslapack.h> 949b5e25fSSatish Balay 10c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1170dcbbb9SBarry Smith #define USESHORT 12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1370dcbbb9SBarry Smith 1426cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1526cec326SBarry Smith #define TYPE SBAIJ 1626cec326SBarry Smith #define TYPE_SBAIJ 1726cec326SBarry Smith #define TYPE_BS 1826cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1926cec326SBarry Smith #undef TYPE_BS 2026cec326SBarry Smith #define TYPE_BS _BS 2126cec326SBarry Smith #define TYPE_BS_ON 2226cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 2326cec326SBarry Smith #undef TYPE_BS 2426cec326SBarry Smith #undef TYPE_SBAIJ 2526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 2626cec326SBarry Smith #undef TYPE 2726cec326SBarry Smith #undef TYPE_BS_ON 2826cec326SBarry Smith 296214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 30cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 316214f412SHong Zhang #endif 32d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 33d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 34d24d4204SJose E. Roman #endif 3528d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat, MatType, MatReuse, Mat *); 36b5b17502SBarry Smith 3749b5e25fSSatish Balay /* 3849b5e25fSSatish Balay Checks for missing diagonals 3949b5e25fSSatish Balay */ 40d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A, PetscBool *missing, PetscInt *dd) 41d71ae5a4SJacob Faibussowitsch { 42045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 437734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 4449b5e25fSSatish Balay 4549b5e25fSSatish Balay PetscFunctionBegin; 469566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(A)); 472af78befSBarry Smith *missing = PETSC_FALSE; 487734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 49358d2f5dSShri Abhyankar *missing = PETSC_TRUE; 50358d2f5dSShri Abhyankar if (dd) *dd = 0; 519566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 52358d2f5dSShri Abhyankar } else { 53358d2f5dSShri Abhyankar diag = a->diag; 5449b5e25fSSatish Balay for (i = 0; i < a->mbs; i++) { 557734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 562af78befSBarry Smith *missing = PETSC_TRUE; 572af78befSBarry Smith if (dd) *dd = i; 582af78befSBarry Smith break; 592af78befSBarry Smith } 6049b5e25fSSatish Balay } 61358d2f5dSShri Abhyankar } 623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6349b5e25fSSatish Balay } 6449b5e25fSSatish Balay 65d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A) 66d71ae5a4SJacob Faibussowitsch { 67045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 6848dd3d27SHong Zhang PetscInt i, j; 6949b5e25fSSatish Balay 7049b5e25fSSatish Balay PetscFunctionBegin; 7109f38230SBarry Smith if (!a->diag) { 729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->mbs, &a->diag)); 73c760cd28SBarry Smith a->free_diag = PETSC_TRUE; 7409f38230SBarry Smith } 7548dd3d27SHong Zhang for (i = 0; i < a->mbs; i++) { 7648dd3d27SHong Zhang a->diag[i] = a->i[i + 1]; 7748dd3d27SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 7848dd3d27SHong Zhang if (a->j[j] == i) { 7948dd3d27SHong Zhang a->diag[i] = j; 8048dd3d27SHong Zhang break; 8148dd3d27SHong Zhang } 8248dd3d27SHong Zhang } 8348dd3d27SHong Zhang } 843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8549b5e25fSSatish Balay } 8649b5e25fSSatish Balay 87d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *inia[], const PetscInt *inja[], PetscBool *done) 88d71ae5a4SJacob Faibussowitsch { 89a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 902462f5fdSStefano Zampini PetscInt i, j, n = a->mbs, nz = a->i[n], *tia, *tja, bs = A->rmap->bs, k, l, cnt; 912462f5fdSStefano Zampini PetscInt **ia = (PetscInt **)inia, **ja = (PetscInt **)inja; 9249b5e25fSSatish Balay 9349b5e25fSSatish Balay PetscFunctionBegin; 94d3e5a4abSHong Zhang *nn = n; 953ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 962462f5fdSStefano Zampini if (symmetric) { 979566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(n, a->i, a->j, PETSC_FALSE, 0, 0, &tia, &tja)); 982462f5fdSStefano Zampini nz = tia[n]; 992462f5fdSStefano Zampini } else { 1009371c9d4SSatish Balay tia = a->i; 1019371c9d4SSatish Balay tja = a->j; 1022462f5fdSStefano Zampini } 1032462f5fdSStefano Zampini 1042462f5fdSStefano Zampini if (!blockcompressed && bs > 1) { 1052462f5fdSStefano Zampini (*nn) *= bs; 1068f7157efSSatish Balay /* malloc & create the natural set of indices */ 1079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1((n + 1) * bs, ia)); 1082462f5fdSStefano Zampini if (n) { 1092462f5fdSStefano Zampini (*ia)[0] = oshift; 110ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[j] = (tia[1] - tia[0]) * bs + (*ia)[j - 1]; 1112462f5fdSStefano Zampini } 1122462f5fdSStefano Zampini 1132462f5fdSStefano Zampini for (i = 1; i < n; i++) { 1142462f5fdSStefano Zampini (*ia)[i * bs] = (tia[i] - tia[i - 1]) * bs + (*ia)[i * bs - 1]; 115ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[i * bs + j] = (tia[i + 1] - tia[i]) * bs + (*ia)[i * bs + j - 1]; 1162462f5fdSStefano Zampini } 117ad540459SPierre Jolivet if (n) (*ia)[n * bs] = (tia[n] - tia[n - 1]) * bs + (*ia)[n * bs - 1]; 1182462f5fdSStefano Zampini 1192462f5fdSStefano Zampini if (inja) { 1209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz * bs * bs, ja)); 1212462f5fdSStefano Zampini cnt = 0; 1222462f5fdSStefano Zampini for (i = 0; i < n; i++) { 1238f7157efSSatish Balay for (j = 0; j < bs; j++) { 1242462f5fdSStefano Zampini for (k = tia[i]; k < tia[i + 1]; k++) { 125ad540459SPierre Jolivet for (l = 0; l < bs; l++) (*ja)[cnt++] = bs * tja[k] + l; 1268f7157efSSatish Balay } 1278f7157efSSatish Balay } 1288f7157efSSatish Balay } 1298f7157efSSatish Balay } 1302462f5fdSStefano Zampini 1312462f5fdSStefano Zampini if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */ 1329566063dSJacob Faibussowitsch PetscCall(PetscFree(tia)); 1339566063dSJacob Faibussowitsch PetscCall(PetscFree(tja)); 1342462f5fdSStefano Zampini } 1352462f5fdSStefano Zampini } else if (oshift == 1) { 1362462f5fdSStefano Zampini if (symmetric) { 1372462f5fdSStefano Zampini nz = tia[A->rmap->n / bs]; 1382462f5fdSStefano Zampini /* add 1 to i and j indices */ 1392462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) tia[i] = tia[i] + 1; 1402462f5fdSStefano Zampini *ia = tia; 1412462f5fdSStefano Zampini if (ja) { 1422462f5fdSStefano Zampini for (i = 0; i < nz; i++) tja[i] = tja[i] + 1; 1432462f5fdSStefano Zampini *ja = tja; 1442462f5fdSStefano Zampini } 1452462f5fdSStefano Zampini } else { 1462462f5fdSStefano Zampini nz = a->i[A->rmap->n / bs]; 1472462f5fdSStefano Zampini /* malloc space and add 1 to i and j indices */ 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n / bs + 1, ia)); 1492462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) (*ia)[i] = a->i[i] + 1; 1502462f5fdSStefano Zampini if (ja) { 1519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, ja)); 1522462f5fdSStefano Zampini for (i = 0; i < nz; i++) (*ja)[i] = a->j[i] + 1; 1532462f5fdSStefano Zampini } 1542462f5fdSStefano Zampini } 1552462f5fdSStefano Zampini } else { 1562462f5fdSStefano Zampini *ia = tia; 1572462f5fdSStefano Zampini if (ja) *ja = tja; 158a6ece127SHong Zhang } 1593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16049b5e25fSSatish Balay } 16149b5e25fSSatish Balay 162d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 163d71ae5a4SJacob Faibussowitsch { 16449b5e25fSSatish Balay PetscFunctionBegin; 1653ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 1662462f5fdSStefano Zampini if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) { 1679566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 1689566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 169a6ece127SHong Zhang } 1703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17149b5e25fSSatish Balay } 17249b5e25fSSatish Balay 173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqSBAIJ(Mat A) 174d71ae5a4SJacob Faibussowitsch { 17549b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 17649b5e25fSSatish Balay 17749b5e25fSSatish Balay PetscFunctionBegin; 178a9f03627SSatish Balay #if defined(PETSC_USE_LOG) 1793ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->N, a->nz)); 180a9f03627SSatish Balay #endif 1819566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 1829566063dSJacob Faibussowitsch if (a->free_diag) PetscCall(PetscFree(a->diag)); 1839566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1849566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1859566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 1869566063dSJacob Faibussowitsch PetscCall(PetscFree(a->idiag)); 1879566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inode.size)); 1889566063dSJacob Faibussowitsch if (a->free_imax_ilen) PetscCall(PetscFree2(a->imax, a->ilen)); 1899566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 1909566063dSJacob Faibussowitsch PetscCall(PetscFree(a->sor_work)); 1919566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solves_work)); 1929566063dSJacob Faibussowitsch PetscCall(PetscFree(a->mult_work)); 1939566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 1949566063dSJacob Faibussowitsch if (a->free_jshort) PetscCall(PetscFree(a->jshort)); 1959566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inew)); 1969566063dSJacob Faibussowitsch PetscCall(MatDestroy(&a->parent)); 1979566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 198901853e0SKris Buschelman 1999566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 2002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJGetArray_C", NULL)); 2012e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJRestoreArray_C", NULL)); 2029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 2039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 2049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetColumnIndices_C", NULL)); 2059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqaij_C", NULL)); 2069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqbaij_C", NULL)); 2079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocation_C", NULL)); 2089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocationCSR_C", NULL)); 2096214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_elemental_C", NULL)); 2116214f412SHong Zhang #endif 212d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 2139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_scalapack_C", NULL)); 214d24d4204SJose E. Roman #endif 2152e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 2163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 21749b5e25fSSatish Balay } 21849b5e25fSSatish Balay 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqSBAIJ(Mat A, MatOption op, PetscBool flg) 220d71ae5a4SJacob Faibussowitsch { 221045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 222eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 223eb1ec7c1SStefano Zampini PetscInt bs; 224eb1ec7c1SStefano Zampini #endif 22549b5e25fSSatish Balay 22649b5e25fSSatish Balay PetscFunctionBegin; 227eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 2289566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 229eb1ec7c1SStefano Zampini #endif 2304d9d31abSKris Buschelman switch (op) { 231d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 232d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 233d71ae5a4SJacob Faibussowitsch break; 234d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 235d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 236d71ae5a4SJacob Faibussowitsch break; 237d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 238d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 239d71ae5a4SJacob Faibussowitsch break; 240d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 241d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 242d71ae5a4SJacob Faibussowitsch break; 243d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 244d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 245d71ae5a4SJacob Faibussowitsch break; 246d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 247d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 248d71ae5a4SJacob Faibussowitsch break; 2498c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 2504d9d31abSKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 2514d9d31abSKris Buschelman case MAT_USE_HASH_TABLE: 252d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 253d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 254d71ae5a4SJacob Faibussowitsch break; 2559a4540c5SBarry Smith case MAT_HERMITIAN: 256eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 257eb1ec7c1SStefano Zampini if (flg) { /* disable transpose ops */ 25808401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for Hermitian with block size greater than 1"); 259eb1ec7c1SStefano Zampini A->ops->multtranspose = NULL; 260eb1ec7c1SStefano Zampini A->ops->multtransposeadd = NULL; 261b94d7dedSBarry Smith A->symmetric = PETSC_BOOL3_FALSE; 262eb1ec7c1SStefano Zampini } 2630f2140c7SStefano Zampini #endif 264eeffb40dSHong Zhang break; 26577e54ba9SKris Buschelman case MAT_SYMMETRIC: 266eb1ec7c1SStefano Zampini case MAT_SPD: 267eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 268eb1ec7c1SStefano Zampini if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */ 269eb1ec7c1SStefano Zampini A->ops->multtranspose = A->ops->mult; 270eb1ec7c1SStefano Zampini A->ops->multtransposeadd = A->ops->multadd; 271eb1ec7c1SStefano Zampini } 272eb1ec7c1SStefano Zampini #endif 273eb1ec7c1SStefano Zampini break; 274eb1ec7c1SStefano Zampini /* These options are handled directly by MatSetOption() */ 27577e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 2769a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 277b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 278672ba085SHong Zhang case MAT_STRUCTURE_ONLY: 279b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 2804dcd73b1SHong Zhang /* These options are handled directly by MatSetOption() */ 281290bbb0aSBarry Smith break; 282d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_LOWER_TRIANGULAR: 283d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 284d71ae5a4SJacob Faibussowitsch break; 285d71ae5a4SJacob Faibussowitsch case MAT_ERROR_LOWER_TRIANGULAR: 286d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 287d71ae5a4SJacob Faibussowitsch break; 288d71ae5a4SJacob Faibussowitsch case MAT_GETROW_UPPERTRIANGULAR: 289d71ae5a4SJacob Faibussowitsch a->getrow_utriangular = flg; 290d71ae5a4SJacob Faibussowitsch break; 291d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 292d71ae5a4SJacob Faibussowitsch break; 293d71ae5a4SJacob Faibussowitsch default: 294d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 29549b5e25fSSatish Balay } 2963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29749b5e25fSSatish Balay } 29849b5e25fSSatish Balay 299d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 300d71ae5a4SJacob Faibussowitsch { 30149b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 30249b5e25fSSatish Balay 30349b5e25fSSatish Balay PetscFunctionBegin; 30408401ef6SPierre Jolivet PetscCheck(!A || a->getrow_utriangular, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatGetRow is not supported for SBAIJ matrix format. Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()"); 30552768537SHong Zhang 306f5edf698SHong Zhang /* Get the upper triangular part of the row */ 3079566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqBAIJ_private(A, row, nz, idx, v, a->i, a->j, a->a)); 3083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 30949b5e25fSSatish Balay } 31049b5e25fSSatish Balay 311d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 312d71ae5a4SJacob Faibussowitsch { 31349b5e25fSSatish Balay PetscFunctionBegin; 314cb4a9cd9SHong Zhang if (nz) *nz = 0; 3159566063dSJacob Faibussowitsch if (idx) PetscCall(PetscFree(*idx)); 3169566063dSJacob Faibussowitsch if (v) PetscCall(PetscFree(*v)); 3173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 31849b5e25fSSatish Balay } 31949b5e25fSSatish Balay 320d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A) 321d71ae5a4SJacob Faibussowitsch { 322f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 323f5edf698SHong Zhang 324f5edf698SHong Zhang PetscFunctionBegin; 325f5edf698SHong Zhang a->getrow_utriangular = PETSC_TRUE; 3263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 327f5edf698SHong Zhang } 328a323099bSStefano Zampini 329d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A) 330d71ae5a4SJacob Faibussowitsch { 331f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 332f5edf698SHong Zhang 333f5edf698SHong Zhang PetscFunctionBegin; 334f5edf698SHong Zhang a->getrow_utriangular = PETSC_FALSE; 3353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 336f5edf698SHong Zhang } 337f5edf698SHong Zhang 338d71ae5a4SJacob Faibussowitsch PetscErrorCode MatTranspose_SeqSBAIJ(Mat A, MatReuse reuse, Mat *B) 339d71ae5a4SJacob Faibussowitsch { 34049b5e25fSSatish Balay PetscFunctionBegin; 3417fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 342cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 3439566063dSJacob Faibussowitsch PetscCall(MatDuplicate(A, MAT_COPY_VALUES, B)); 344cf37664fSBarry Smith } else if (reuse == MAT_REUSE_MATRIX) { 3459566063dSJacob Faibussowitsch PetscCall(MatCopy(A, *B, SAME_NONZERO_PATTERN)); 346fc4dec0aSBarry Smith } 3473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 34849b5e25fSSatish Balay } 34949b5e25fSSatish Balay 350d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A, PetscViewer viewer) 351d71ae5a4SJacob Faibussowitsch { 35249b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 353d0f46423SBarry Smith PetscInt i, j, bs = A->rmap->bs, k, l, bs2 = a->bs2; 354f3ef73ceSBarry Smith PetscViewerFormat format; 355121deb67SSatish Balay PetscInt *diag; 356b3a0534dSBarry Smith const char *matname; 35749b5e25fSSatish Balay 35849b5e25fSSatish Balay PetscFunctionBegin; 3599566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 360456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 3619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " block size is %" PetscInt_FMT "\n", bs)); 362fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_MATLAB) { 363d2507d54SMatthew Knepley Mat aij; 364ade3a672SBarry Smith 365d5f3da31SBarry Smith if (A->factortype && bs > 1) { 3669566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "Warning: matrix is factored with bs>1. MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n")); 3673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 36870d5e725SHong Zhang } 3699566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &aij)); 37023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 37123a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)aij, matname)); 37223a3927dSBarry Smith PetscCall(MatView_SeqAIJ(aij, viewer)); 3739566063dSJacob Faibussowitsch PetscCall(MatDestroy(&aij)); 374fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 375b3a0534dSBarry Smith Mat B; 376b3a0534dSBarry Smith 377b3a0534dSBarry Smith PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 378b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 379b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 380b3a0534dSBarry Smith PetscCall(MatView_SeqAIJ(B, viewer)); 381b3a0534dSBarry Smith PetscCall(MatDestroy(&B)); 382c1490034SHong Zhang } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) { 3833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 38449b5e25fSSatish Balay } else { 3859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 3862c990fa1SHong Zhang if (A->factortype) { /* for factored matrix */ 38708401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "matrix is factored with bs>1. Not implemented yet"); 3882c990fa1SHong Zhang 389121deb67SSatish Balay diag = a->diag; 390121deb67SSatish Balay for (i = 0; i < a->mbs; i++) { /* for row block i */ 3919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 3922c990fa1SHong Zhang /* diagonal entry */ 3932c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 3942c990fa1SHong Zhang if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) { 3959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), (double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 3962c990fa1SHong Zhang } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) { 3979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), -(double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 3982c990fa1SHong Zhang } else { 3999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]))); 4002c990fa1SHong Zhang } 4012c990fa1SHong Zhang #else 4029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)(1.0 / a->a[diag[i]]))); 4032c990fa1SHong Zhang #endif 4042c990fa1SHong Zhang /* off-diagonal entries */ 4052c990fa1SHong Zhang for (k = a->i[i]; k < a->i[i + 1] - 1; k++) { 4062c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 407ca0704adSBarry Smith if (PetscImaginaryPart(a->a[k]) > 0.0) { 4089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), (double)PetscImaginaryPart(a->a[k]))); 409ca0704adSBarry Smith } else if (PetscImaginaryPart(a->a[k]) < 0.0) { 4109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), -(double)PetscImaginaryPart(a->a[k]))); 4112c990fa1SHong Zhang } else { 4129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k], (double)PetscRealPart(a->a[k]))); 4132c990fa1SHong Zhang } 4142c990fa1SHong Zhang #else 4159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[k], (double)a->a[k])); 4162c990fa1SHong Zhang #endif 4172c990fa1SHong Zhang } 4189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 4192c990fa1SHong Zhang } 4202c990fa1SHong Zhang 4212c990fa1SHong Zhang } else { /* for non-factored matrix */ 4220c74a584SJed Brown for (i = 0; i < a->mbs; i++) { /* for row block i */ 4230c74a584SJed Brown for (j = 0; j < bs; j++) { /* for row bs*i + j */ 4249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i * bs + j)); 4250c74a584SJed Brown for (k = a->i[i]; k < a->i[i + 1]; k++) { /* for column block */ 4260c74a584SJed Brown for (l = 0; l < bs; l++) { /* for column */ 42749b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 42849b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) > 0.0) { 4299371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), (double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 43049b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) < 0.0) { 4319371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), -(double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 43249b5e25fSSatish Balay } else { 4339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]))); 43449b5e25fSSatish Balay } 43549b5e25fSSatish Balay #else 4369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)a->a[bs2 * k + l * bs + j])); 43749b5e25fSSatish Balay #endif 43849b5e25fSSatish Balay } 43949b5e25fSSatish Balay } 4409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 44149b5e25fSSatish Balay } 44249b5e25fSSatish Balay } 4432c990fa1SHong Zhang } 4449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 44549b5e25fSSatish Balay } 4469566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 4473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44849b5e25fSSatish Balay } 44949b5e25fSSatish Balay 4509804daf3SBarry Smith #include <petscdraw.h> 451d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 452d71ae5a4SJacob Faibussowitsch { 45349b5e25fSSatish Balay Mat A = (Mat)Aa; 45449b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 455d0f46423SBarry Smith PetscInt row, i, j, k, l, mbs = a->mbs, color, bs = A->rmap->bs, bs2 = a->bs2; 45649b5e25fSSatish Balay PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 45749b5e25fSSatish Balay MatScalar *aa; 458b0a32e0cSBarry Smith PetscViewer viewer; 45949b5e25fSSatish Balay 46049b5e25fSSatish Balay PetscFunctionBegin; 4619566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 4629566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 46349b5e25fSSatish Balay 46449b5e25fSSatish Balay /* loop over matrix elements drawing boxes */ 465383922c3SLisandro Dalcin 466d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 4679566063dSJacob Faibussowitsch PetscCall(PetscDrawString(draw, .3 * (xl + xr), .3 * (yl + yr), PETSC_DRAW_BLACK, "symmetric")); 468383922c3SLisandro Dalcin /* Blue for negative, Cyan for zero and Red for positive */ 469b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 47049b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 47149b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4729371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4739371c9d4SSatish Balay y_r = y_l + 1.0; 4749371c9d4SSatish Balay x_l = a->j[j] * bs; 4759371c9d4SSatish Balay x_r = x_l + 1.0; 47649b5e25fSSatish Balay aa = a->a + j * bs2; 47749b5e25fSSatish Balay for (k = 0; k < bs; k++) { 47849b5e25fSSatish Balay for (l = 0; l < bs; l++) { 47949b5e25fSSatish Balay if (PetscRealPart(*aa++) >= 0.) continue; 4809566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 48149b5e25fSSatish Balay } 48249b5e25fSSatish Balay } 48349b5e25fSSatish Balay } 48449b5e25fSSatish Balay } 485b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 48649b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 48749b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4889371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4899371c9d4SSatish Balay y_r = y_l + 1.0; 4909371c9d4SSatish Balay x_l = a->j[j] * bs; 4919371c9d4SSatish Balay x_r = x_l + 1.0; 49249b5e25fSSatish Balay aa = a->a + j * bs2; 49349b5e25fSSatish Balay for (k = 0; k < bs; k++) { 49449b5e25fSSatish Balay for (l = 0; l < bs; l++) { 49549b5e25fSSatish Balay if (PetscRealPart(*aa++) != 0.) continue; 4969566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 49749b5e25fSSatish Balay } 49849b5e25fSSatish Balay } 49949b5e25fSSatish Balay } 50049b5e25fSSatish Balay } 501b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 50249b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 50349b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 5049371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 5059371c9d4SSatish Balay y_r = y_l + 1.0; 5069371c9d4SSatish Balay x_l = a->j[j] * bs; 5079371c9d4SSatish Balay x_r = x_l + 1.0; 50849b5e25fSSatish Balay aa = a->a + j * bs2; 50949b5e25fSSatish Balay for (k = 0; k < bs; k++) { 51049b5e25fSSatish Balay for (l = 0; l < bs; l++) { 51149b5e25fSSatish Balay if (PetscRealPart(*aa++) <= 0.) continue; 5129566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 51349b5e25fSSatish Balay } 51449b5e25fSSatish Balay } 51549b5e25fSSatish Balay } 51649b5e25fSSatish Balay } 517d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 5183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51949b5e25fSSatish Balay } 52049b5e25fSSatish Balay 521d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A, PetscViewer viewer) 522d71ae5a4SJacob Faibussowitsch { 52349b5e25fSSatish Balay PetscReal xl, yl, xr, yr, w, h; 524b0a32e0cSBarry Smith PetscDraw draw; 525ace3abfcSBarry Smith PetscBool isnull; 52649b5e25fSSatish Balay 52749b5e25fSSatish Balay PetscFunctionBegin; 5289566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 5299566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 5303ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 53149b5e25fSSatish Balay 5329371c9d4SSatish Balay xr = A->rmap->N; 5339371c9d4SSatish Balay yr = A->rmap->N; 5349371c9d4SSatish Balay h = yr / 10.0; 5359371c9d4SSatish Balay w = xr / 10.0; 5369371c9d4SSatish Balay xr += w; 5379371c9d4SSatish Balay yr += h; 5389371c9d4SSatish Balay xl = -w; 5399371c9d4SSatish Balay yl = -h; 5409566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 5419566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 5429566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqSBAIJ_Draw_Zoom, A)); 5439566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 5449566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 5453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54649b5e25fSSatish Balay } 54749b5e25fSSatish Balay 548618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */ 549618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary 550618cc2edSLisandro Dalcin 551d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ(Mat A, PetscViewer viewer) 552d71ae5a4SJacob Faibussowitsch { 553618cc2edSLisandro Dalcin PetscBool iascii, isbinary, isdraw; 55449b5e25fSSatish Balay 55549b5e25fSSatish Balay PetscFunctionBegin; 5569566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 5579566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 5589566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 55932077d6dSBarry Smith if (iascii) { 5609566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_ASCII(A, viewer)); 561618cc2edSLisandro Dalcin } else if (isbinary) { 5629566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Binary(A, viewer)); 56349b5e25fSSatish Balay } else if (isdraw) { 5649566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Draw(A, viewer)); 56549b5e25fSSatish Balay } else { 566a5e6ed63SBarry Smith Mat B; 567ade3a672SBarry Smith const char *matname; 5689566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 56923a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 57023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 5719566063dSJacob Faibussowitsch PetscCall(MatView(B, viewer)); 5729566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 57349b5e25fSSatish Balay } 5743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 57549b5e25fSSatish Balay } 57649b5e25fSSatish Balay 577d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 578d71ae5a4SJacob Faibussowitsch { 579045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 58013f74950SBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 58113f74950SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 582d0f46423SBarry Smith PetscInt brow, bcol, ridx, cidx, bs = A->rmap->bs, bs2 = a->bs2; 58397e567efSBarry Smith MatScalar *ap, *aa = a->a; 58449b5e25fSSatish Balay 58549b5e25fSSatish Balay PetscFunctionBegin; 58649b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over rows */ 5879371c9d4SSatish Balay row = im[k]; 5889371c9d4SSatish Balay brow = row / bs; 5899371c9d4SSatish Balay if (row < 0) { 5909371c9d4SSatish Balay v += n; 5919371c9d4SSatish Balay continue; 5929371c9d4SSatish Balay } /* negative row */ 59354c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 5949371c9d4SSatish Balay rp = aj + ai[brow]; 5959371c9d4SSatish Balay ap = aa + bs2 * ai[brow]; 59649b5e25fSSatish Balay nrow = ailen[brow]; 59749b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over columns */ 5989371c9d4SSatish Balay if (in[l] < 0) { 5999371c9d4SSatish Balay v++; 6009371c9d4SSatish Balay continue; 6019371c9d4SSatish Balay } /* negative column */ 60254c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 60349b5e25fSSatish Balay col = in[l]; 60449b5e25fSSatish Balay bcol = col / bs; 60549b5e25fSSatish Balay cidx = col % bs; 60649b5e25fSSatish Balay ridx = row % bs; 60749b5e25fSSatish Balay high = nrow; 60849b5e25fSSatish Balay low = 0; /* assume unsorted */ 60949b5e25fSSatish Balay while (high - low > 5) { 61049b5e25fSSatish Balay t = (low + high) / 2; 61149b5e25fSSatish Balay if (rp[t] > bcol) high = t; 61249b5e25fSSatish Balay else low = t; 61349b5e25fSSatish Balay } 61449b5e25fSSatish Balay for (i = low; i < high; i++) { 61549b5e25fSSatish Balay if (rp[i] > bcol) break; 61649b5e25fSSatish Balay if (rp[i] == bcol) { 61749b5e25fSSatish Balay *v++ = ap[bs2 * i + bs * cidx + ridx]; 61849b5e25fSSatish Balay goto finished; 61949b5e25fSSatish Balay } 62049b5e25fSSatish Balay } 62197e567efSBarry Smith *v++ = 0.0; 62249b5e25fSSatish Balay finished:; 62349b5e25fSSatish Balay } 62449b5e25fSSatish Balay } 6253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 62649b5e25fSSatish Balay } 62749b5e25fSSatish Balay 628d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqSBAIJ(Mat A, IS rowp, IS colp, Mat *B) 629d71ae5a4SJacob Faibussowitsch { 630dc29a518SPierre Jolivet Mat C; 631dc29a518SPierre Jolivet 632dc29a518SPierre Jolivet PetscFunctionBegin; 6339566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQBAIJ, MAT_INITIAL_MATRIX, &C)); 6349566063dSJacob Faibussowitsch PetscCall(MatPermute(C, rowp, colp, B)); 6359566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 63648a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatConvert(*B, MATSEQSBAIJ, MAT_INPLACE_MATRIX, B)); 6373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 638dc29a518SPierre Jolivet } 63949b5e25fSSatish Balay 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 641d71ae5a4SJacob Faibussowitsch { 6420880e062SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 643e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, jj, row, nrow, i, col, l, rmax, N, lastcol = -1; 64413f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 645d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs2 = a->bs2, bs = A->rmap->bs, stepval; 646ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 647dd6ea824SBarry Smith const PetscScalar *value = v; 648f15d580aSBarry Smith MatScalar *ap, *aa = a->a, *bap; 6490880e062SHong Zhang 65049b5e25fSSatish Balay PetscFunctionBegin; 65126fbe8dcSKarl Rupp if (roworiented) stepval = (n - 1) * bs; 65226fbe8dcSKarl Rupp else stepval = (m - 1) * bs; 65326fbe8dcSKarl Rupp 6540880e062SHong Zhang for (k = 0; k < m; k++) { /* loop over added rows */ 6550880e062SHong Zhang row = im[k]; 6560880e062SHong Zhang if (row < 0) continue; 6576bdcaf15SBarry Smith PetscCheck(row < a->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index row too large %" PetscInt_FMT " max %" PetscInt_FMT, row, a->mbs - 1); 6580880e062SHong Zhang rp = aj + ai[row]; 6590880e062SHong Zhang ap = aa + bs2 * ai[row]; 6600880e062SHong Zhang rmax = imax[row]; 6610880e062SHong Zhang nrow = ailen[row]; 6620880e062SHong Zhang low = 0; 663818f2c47SBarry Smith high = nrow; 6640880e062SHong Zhang for (l = 0; l < n; l++) { /* loop over added columns */ 6650880e062SHong Zhang if (in[l] < 0) continue; 6660880e062SHong Zhang col = in[l]; 6676bdcaf15SBarry Smith PetscCheck(col < a->nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index column too large %" PetscInt_FMT " max %" PetscInt_FMT, col, a->nbs - 1); 668b98bf0e1SJed Brown if (col < row) { 66926fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular block */ 67026fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 671b98bf0e1SJed Brown } 67226fbe8dcSKarl Rupp if (roworiented) value = v + k * (stepval + bs) * bs + l * bs; 67326fbe8dcSKarl Rupp else value = v + l * (stepval + bs) * bs + k * bs; 67426fbe8dcSKarl Rupp 67526fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 67626fbe8dcSKarl Rupp else high = nrow; 67726fbe8dcSKarl Rupp 678e2ee6c50SBarry Smith lastcol = col; 6790880e062SHong Zhang while (high - low > 7) { 6800880e062SHong Zhang t = (low + high) / 2; 6810880e062SHong Zhang if (rp[t] > col) high = t; 6820880e062SHong Zhang else low = t; 6830880e062SHong Zhang } 6840880e062SHong Zhang for (i = low; i < high; i++) { 6850880e062SHong Zhang if (rp[i] > col) break; 6860880e062SHong Zhang if (rp[i] == col) { 6870880e062SHong Zhang bap = ap + bs2 * i; 6880880e062SHong Zhang if (roworiented) { 6890880e062SHong Zhang if (is == ADD_VALUES) { 6900880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 691ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] += *value++; 6920880e062SHong Zhang } 6930880e062SHong Zhang } else { 6940880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 695ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 6960880e062SHong Zhang } 6970880e062SHong Zhang } 6980880e062SHong Zhang } else { 6990880e062SHong Zhang if (is == ADD_VALUES) { 7000880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 701ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ += *value++; 7020880e062SHong Zhang } 7030880e062SHong Zhang } else { 7040880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 705ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7060880e062SHong Zhang } 7070880e062SHong Zhang } 7080880e062SHong Zhang } 7090880e062SHong Zhang goto noinsert2; 7100880e062SHong Zhang } 7110880e062SHong Zhang } 7120880e062SHong Zhang if (nonew == 1) goto noinsert2; 71308401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new block index nonzero block (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 714fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 7159371c9d4SSatish Balay N = nrow++ - 1; 7169371c9d4SSatish Balay high++; 7170880e062SHong Zhang /* shift up all the later entries in this row */ 7189566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 7199566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 7209566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 7210880e062SHong Zhang rp[i] = col; 7220880e062SHong Zhang bap = ap + bs2 * i; 7230880e062SHong Zhang if (roworiented) { 7240880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 725ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7260880e062SHong Zhang } 7270880e062SHong Zhang } else { 7280880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 729ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7300880e062SHong Zhang } 7310880e062SHong Zhang } 7320880e062SHong Zhang noinsert2:; 7330880e062SHong Zhang low = i; 7340880e062SHong Zhang } 7350880e062SHong Zhang ailen[row] = nrow; 7360880e062SHong Zhang } 7373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 73849b5e25fSSatish Balay } 73949b5e25fSSatish Balay 74064831d72SBarry Smith /* 74164831d72SBarry Smith This is not yet used 74264831d72SBarry Smith */ 743d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ_SeqAIJ_Inode(Mat A) 744d71ae5a4SJacob Faibussowitsch { 7450def2e27SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 7460def2e27SBarry Smith const PetscInt *ai = a->i, *aj = a->j, *cols; 7470def2e27SBarry Smith PetscInt i = 0, j, blk_size, m = A->rmap->n, node_count = 0, nzx, nzy, *ns, row, nz, cnt, cnt2, *counts; 748ace3abfcSBarry Smith PetscBool flag; 7490def2e27SBarry Smith 7500def2e27SBarry Smith PetscFunctionBegin; 7519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &ns)); 7520def2e27SBarry Smith while (i < m) { 7530def2e27SBarry Smith nzx = ai[i + 1] - ai[i]; /* Number of nonzeros */ 7540def2e27SBarry Smith /* Limits the number of elements in a node to 'a->inode.limit' */ 7550def2e27SBarry Smith for (j = i + 1, blk_size = 1; j < m && blk_size < a->inode.limit; ++j, ++blk_size) { 7560def2e27SBarry Smith nzy = ai[j + 1] - ai[j]; 7570def2e27SBarry Smith if (nzy != (nzx - j + i)) break; 7589566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aj + ai[i] + j - i, aj + ai[j], nzy, &flag)); 7590def2e27SBarry Smith if (!flag) break; 7600def2e27SBarry Smith } 7610def2e27SBarry Smith ns[node_count++] = blk_size; 76226fbe8dcSKarl Rupp 7630def2e27SBarry Smith i = j; 7640def2e27SBarry Smith } 7650def2e27SBarry Smith if (!a->inode.size && m && node_count > .9 * m) { 7669566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7679566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes out of %" PetscInt_FMT " rows. Not using Inode routines\n", node_count, m)); 7680def2e27SBarry Smith } else { 7690def2e27SBarry Smith a->inode.node_count = node_count; 77026fbe8dcSKarl Rupp 7719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(node_count, &a->inode.size)); 7729566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->inode.size, ns, node_count)); 7739566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7749566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes of %" PetscInt_FMT ". Limit used: %" PetscInt_FMT ". Using Inode routines\n", node_count, m, a->inode.limit)); 7750def2e27SBarry Smith 7760def2e27SBarry Smith /* count collections of adjacent columns in each inode */ 7770def2e27SBarry Smith row = 0; 7780def2e27SBarry Smith cnt = 0; 7790def2e27SBarry Smith for (i = 0; i < node_count; i++) { 7800def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7810def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 7820def2e27SBarry Smith for (j = 1; j < nz; j++) { 78326fbe8dcSKarl Rupp if (cols[j] != cols[j - 1] + 1) cnt++; 7840def2e27SBarry Smith } 7850def2e27SBarry Smith cnt++; 7860def2e27SBarry Smith row += a->inode.size[i]; 7870def2e27SBarry Smith } 7889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(2 * cnt, &counts)); 7890def2e27SBarry Smith cnt = 0; 7900def2e27SBarry Smith row = 0; 7910def2e27SBarry Smith for (i = 0; i < node_count; i++) { 7920def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7930def2e27SBarry Smith counts[2 * cnt] = cols[0]; 7940def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 7950def2e27SBarry Smith cnt2 = 1; 7960def2e27SBarry Smith for (j = 1; j < nz; j++) { 7970def2e27SBarry Smith if (cols[j] != cols[j - 1] + 1) { 7980def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 7990def2e27SBarry Smith counts[2 * cnt] = cols[j]; 8000def2e27SBarry Smith cnt2 = 1; 8010def2e27SBarry Smith } else cnt2++; 8020def2e27SBarry Smith } 8030def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 8040def2e27SBarry Smith row += a->inode.size[i]; 8050def2e27SBarry Smith } 8069566063dSJacob Faibussowitsch PetscCall(PetscIntView(2 * cnt, counts, NULL)); 8070def2e27SBarry Smith } 8083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 80938702af4SBarry Smith } 81038702af4SBarry Smith 811d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A, MatAssemblyType mode) 812d71ae5a4SJacob Faibussowitsch { 81349b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 8148f8f2f0dSBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 815d0f46423SBarry Smith PetscInt m = A->rmap->N, *ip, N, *ailen = a->ilen; 81613f74950SBarry Smith PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 81749b5e25fSSatish Balay MatScalar *aa = a->a, *ap; 81849b5e25fSSatish Balay 81949b5e25fSSatish Balay PetscFunctionBegin; 8203ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 82149b5e25fSSatish Balay 82249b5e25fSSatish Balay if (m) rmax = ailen[0]; 82349b5e25fSSatish Balay for (i = 1; i < mbs; i++) { 82449b5e25fSSatish Balay /* move each row back by the amount of empty slots (fshift) before it*/ 82549b5e25fSSatish Balay fshift += imax[i - 1] - ailen[i - 1]; 82649b5e25fSSatish Balay rmax = PetscMax(rmax, ailen[i]); 82749b5e25fSSatish Balay if (fshift) { 828580bdb30SBarry Smith ip = aj + ai[i]; 829580bdb30SBarry Smith ap = aa + bs2 * ai[i]; 83049b5e25fSSatish Balay N = ailen[i]; 8319566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 8329566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2 * N)); 83349b5e25fSSatish Balay } 83449b5e25fSSatish Balay ai[i] = ai[i - 1] + ailen[i - 1]; 83549b5e25fSSatish Balay } 83649b5e25fSSatish Balay if (mbs) { 83749b5e25fSSatish Balay fshift += imax[mbs - 1] - ailen[mbs - 1]; 83849b5e25fSSatish Balay ai[mbs] = ai[mbs - 1] + ailen[mbs - 1]; 83949b5e25fSSatish Balay } 84049b5e25fSSatish Balay /* reset ilen and imax for each row */ 841ad540459SPierre Jolivet for (i = 0; i < mbs; i++) ailen[i] = imax[i] = ai[i + 1] - ai[i]; 8426c6c5352SBarry Smith a->nz = ai[mbs]; 84349b5e25fSSatish Balay 844b424e231SHong Zhang /* diagonals may have moved, reset it */ 8451baa6e33SBarry Smith if (a->diag) PetscCall(PetscArraycpy(a->diag, ai, mbs)); 846aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT " block size %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, A->rmap->bs, fshift * bs2); 84726fbe8dcSKarl Rupp 8489566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT ", block size %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->rmap->N, A->rmap->bs, fshift * bs2, a->nz * bs2)); 8499566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues is %" PetscInt_FMT "\n", a->reallocs)); 8509566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Most nonzeros blocks in any row is %" PetscInt_FMT "\n", rmax)); 85126fbe8dcSKarl Rupp 8528e58a170SBarry Smith A->info.mallocs += a->reallocs; 85349b5e25fSSatish Balay a->reallocs = 0; 85449b5e25fSSatish Balay A->info.nz_unneeded = (PetscReal)fshift * bs2; 855061b2667SBarry Smith a->idiagvalid = PETSC_FALSE; 8564dcd73b1SHong Zhang a->rmax = rmax; 85738702af4SBarry Smith 85838702af4SBarry Smith if (A->cmap->n < 65536 && A->cmap->bs == 1) { 85944e1c64aSLisandro Dalcin if (a->jshort && a->free_jshort) { 86017803ae8SHong Zhang /* when matrix data structure is changed, previous jshort must be replaced */ 8619566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jshort)); 86217803ae8SHong Zhang } 8639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->i[A->rmap->n], &a->jshort)); 86438702af4SBarry Smith for (i = 0; i < a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i]; 86538702af4SBarry Smith A->ops->mult = MatMult_SeqSBAIJ_1_ushort; 86641f059aeSBarry Smith A->ops->sor = MatSOR_SeqSBAIJ_ushort; 8674da8f245SBarry Smith a->free_jshort = PETSC_TRUE; 86838702af4SBarry Smith } 8693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 87049b5e25fSSatish Balay } 87149b5e25fSSatish Balay 87249b5e25fSSatish Balay /* 87349b5e25fSSatish Balay This function returns an array of flags which indicate the locations of contiguous 87449b5e25fSSatish Balay blocks that should be zeroed. for eg: if bs = 3 and is = [0,1,2,3,5,6,7,8,9] 875a5b23f4aSJose E. Roman then the resulting sizes = [3,1,1,3,1] corresponding to sets [(0,1,2),(3),(5),(6,7,8),(9)] 87649b5e25fSSatish Balay Assume: sizes should be long enough to hold all the values. 87749b5e25fSSatish Balay */ 878d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqSBAIJ_Check_Blocks(PetscInt idx[], PetscInt n, PetscInt bs, PetscInt sizes[], PetscInt *bs_max) 879d71ae5a4SJacob Faibussowitsch { 88013f74950SBarry Smith PetscInt i, j, k, row; 881ace3abfcSBarry Smith PetscBool flg; 88249b5e25fSSatish Balay 88349b5e25fSSatish Balay PetscFunctionBegin; 88449b5e25fSSatish Balay for (i = 0, j = 0; i < n; j++) { 88549b5e25fSSatish Balay row = idx[i]; 886a5b23f4aSJose E. Roman if (row % bs != 0) { /* Not the beginning of a block */ 88749b5e25fSSatish Balay sizes[j] = 1; 88849b5e25fSSatish Balay i++; 88949b5e25fSSatish Balay } else if (i + bs > n) { /* Beginning of a block, but complete block doesn't exist (at idx end) */ 89049b5e25fSSatish Balay sizes[j] = 1; /* Also makes sure at least 'bs' values exist for next else */ 89149b5e25fSSatish Balay i++; 8926aad120cSJose E. Roman } else { /* Beginning of the block, so check if the complete block exists */ 89349b5e25fSSatish Balay flg = PETSC_TRUE; 89449b5e25fSSatish Balay for (k = 1; k < bs; k++) { 89549b5e25fSSatish Balay if (row + k != idx[i + k]) { /* break in the block */ 89649b5e25fSSatish Balay flg = PETSC_FALSE; 89749b5e25fSSatish Balay break; 89849b5e25fSSatish Balay } 89949b5e25fSSatish Balay } 900abc0a331SBarry Smith if (flg) { /* No break in the bs */ 90149b5e25fSSatish Balay sizes[j] = bs; 90249b5e25fSSatish Balay i += bs; 90349b5e25fSSatish Balay } else { 90449b5e25fSSatish Balay sizes[j] = 1; 90549b5e25fSSatish Balay i++; 90649b5e25fSSatish Balay } 90749b5e25fSSatish Balay } 90849b5e25fSSatish Balay } 90949b5e25fSSatish Balay *bs_max = j; 9103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 91149b5e25fSSatish Balay } 91249b5e25fSSatish Balay 91349b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks). 914da81f932SPierre Jolivet Any a(i,j) with i>j input by user is ignored. 91549b5e25fSSatish Balay */ 91649b5e25fSSatish Balay 917d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 918d71ae5a4SJacob Faibussowitsch { 91949b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 920e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N, lastcol = -1; 92113f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen, roworiented = a->roworiented; 922d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs = A->rmap->bs, brow, bcol; 92313f74950SBarry Smith PetscInt ridx, cidx, bs2 = a->bs2; 92449b5e25fSSatish Balay MatScalar *ap, value, *aa = a->a, *bap; 92549b5e25fSSatish Balay 92649b5e25fSSatish Balay PetscFunctionBegin; 92749b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over added rows */ 92849b5e25fSSatish Balay row = im[k]; /* row number */ 92949b5e25fSSatish Balay brow = row / bs; /* block row number */ 93049b5e25fSSatish Balay if (row < 0) continue; 9316bdcaf15SBarry Smith PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 93249b5e25fSSatish Balay rp = aj + ai[brow]; /*ptr to beginning of column value of the row block*/ 93349b5e25fSSatish Balay ap = aa + bs2 * ai[brow]; /*ptr to beginning of element value of the row block*/ 93449b5e25fSSatish Balay rmax = imax[brow]; /* maximum space allocated for this row */ 93549b5e25fSSatish Balay nrow = ailen[brow]; /* actual length of this row */ 93649b5e25fSSatish Balay low = 0; 9378509e838SStefano Zampini high = nrow; 93849b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over added columns */ 93949b5e25fSSatish Balay if (in[l] < 0) continue; 9406bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->N - 1); 94149b5e25fSSatish Balay col = in[l]; 94249b5e25fSSatish Balay bcol = col / bs; /* block col number */ 94349b5e25fSSatish Balay 944941593c8SHong Zhang if (brow > bcol) { 94526fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular values */ 94626fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 947941593c8SHong Zhang } 948f4989cb3SHong Zhang 9499371c9d4SSatish Balay ridx = row % bs; 9509371c9d4SSatish Balay cidx = col % bs; /*row and col index inside the block */ 9518549e402SHong Zhang if ((brow == bcol && ridx <= cidx) || (brow < bcol)) { 95249b5e25fSSatish Balay /* element value a(k,l) */ 95326fbe8dcSKarl Rupp if (roworiented) value = v[l + k * n]; 95426fbe8dcSKarl Rupp else value = v[k + l * m]; 95549b5e25fSSatish Balay 95649b5e25fSSatish Balay /* move pointer bap to a(k,l) quickly and add/insert value */ 95726fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 9588509e838SStefano Zampini else high = nrow; 9598509e838SStefano Zampini 960e2ee6c50SBarry Smith lastcol = col; 96149b5e25fSSatish Balay while (high - low > 7) { 96249b5e25fSSatish Balay t = (low + high) / 2; 96349b5e25fSSatish Balay if (rp[t] > bcol) high = t; 96449b5e25fSSatish Balay else low = t; 96549b5e25fSSatish Balay } 96649b5e25fSSatish Balay for (i = low; i < high; i++) { 96749b5e25fSSatish Balay if (rp[i] > bcol) break; 96849b5e25fSSatish Balay if (rp[i] == bcol) { 96949b5e25fSSatish Balay bap = ap + bs2 * i + bs * cidx + ridx; 97049b5e25fSSatish Balay if (is == ADD_VALUES) *bap += value; 97149b5e25fSSatish Balay else *bap = value; 9728549e402SHong Zhang /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 9738549e402SHong Zhang if (brow == bcol && ridx < cidx) { 9748549e402SHong Zhang bap = ap + bs2 * i + bs * ridx + cidx; 9758549e402SHong Zhang if (is == ADD_VALUES) *bap += value; 9768549e402SHong Zhang else *bap = value; 9778549e402SHong Zhang } 97849b5e25fSSatish Balay goto noinsert1; 97949b5e25fSSatish Balay } 98049b5e25fSSatish Balay } 98149b5e25fSSatish Balay 98249b5e25fSSatish Balay if (nonew == 1) goto noinsert1; 98308401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 984fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, brow, bcol, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 98549b5e25fSSatish Balay 9869371c9d4SSatish Balay N = nrow++ - 1; 9879371c9d4SSatish Balay high++; 98849b5e25fSSatish Balay /* shift up all the later entries in this row */ 9899566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 9909566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 9919566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 99249b5e25fSSatish Balay rp[i] = bcol; 99349b5e25fSSatish Balay ap[bs2 * i + bs * cidx + ridx] = value; 9948509e838SStefano Zampini /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 995ad540459SPierre Jolivet if (brow == bcol && ridx < cidx) ap[bs2 * i + bs * ridx + cidx] = value; 996e56f5c9eSBarry Smith A->nonzerostate++; 99749b5e25fSSatish Balay noinsert1:; 99849b5e25fSSatish Balay low = i; 9998549e402SHong Zhang } 100049b5e25fSSatish Balay } /* end of loop over added columns */ 100149b5e25fSSatish Balay ailen[brow] = nrow; 100249b5e25fSSatish Balay } /* end of loop over added rows */ 10033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 100449b5e25fSSatish Balay } 100549b5e25fSSatish Balay 1006d71ae5a4SJacob Faibussowitsch PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA, IS row, const MatFactorInfo *info) 1007d71ae5a4SJacob Faibussowitsch { 10084ccecd49SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)inA->data; 100949b5e25fSSatish Balay Mat outA; 1010ace3abfcSBarry Smith PetscBool row_identity; 101149b5e25fSSatish Balay 101249b5e25fSSatish Balay PetscFunctionBegin; 101308401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 is supported for in-place icc"); 10149566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 101528b400f6SJacob Faibussowitsch PetscCheck(row_identity, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix reordering is not supported"); 101608401ef6SPierre Jolivet PetscCheck(inA->rmap->bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix block size %" PetscInt_FMT " is not supported", inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! */ 1017c84f5b01SHong Zhang 101849b5e25fSSatish Balay outA = inA; 1019d5f3da31SBarry Smith inA->factortype = MAT_FACTOR_ICC; 10209566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 10219566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 102249b5e25fSSatish Balay 10239566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(inA)); 10249566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetNumericFactorization_inplace(inA, row_identity)); 102549b5e25fSSatish Balay 10269566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10279566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1028c84f5b01SHong Zhang a->row = row; 10299566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10309566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1031c84f5b01SHong Zhang a->col = row; 1032c84f5b01SHong Zhang 1033c84f5b01SHong Zhang /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */ 10349566063dSJacob Faibussowitsch if (a->icol) PetscCall(ISInvertPermutation(row, PETSC_DECIDE, &a->icol)); 103549b5e25fSSatish Balay 10364dfa11a4SJacob Faibussowitsch if (!a->solve_work) { PetscCall(PetscMalloc1(inA->rmap->N + inA->rmap->bs, &a->solve_work)); } 103749b5e25fSSatish Balay 10389566063dSJacob Faibussowitsch PetscCall(MatCholeskyFactorNumeric(outA, inA, info)); 10393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 104049b5e25fSSatish Balay } 1041950f1e5bSHong Zhang 1042d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat, PetscInt *indices) 1043d71ae5a4SJacob Faibussowitsch { 1044045c9aa0SHong Zhang Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)mat->data; 104513f74950SBarry Smith PetscInt i, nz, n; 104649b5e25fSSatish Balay 104749b5e25fSSatish Balay PetscFunctionBegin; 10486c6c5352SBarry Smith nz = baij->maxnz; 1049d0f46423SBarry Smith n = mat->cmap->n; 105026fbe8dcSKarl Rupp for (i = 0; i < nz; i++) baij->j[i] = indices[i]; 105126fbe8dcSKarl Rupp 10526c6c5352SBarry Smith baij->nz = nz; 105326fbe8dcSKarl Rupp for (i = 0; i < n; i++) baij->ilen[i] = baij->imax[i]; 105426fbe8dcSKarl Rupp 10559566063dSJacob Faibussowitsch PetscCall(MatSetOption(mat, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 10563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 105749b5e25fSSatish Balay } 105849b5e25fSSatish Balay 105949b5e25fSSatish Balay /*@ 106019585528SSatish Balay MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows 106111a5261eSBarry Smith in a `MATSEQSBAIJ` matrix. 106249b5e25fSSatish Balay 106349b5e25fSSatish Balay Input Parameters: 106411a5261eSBarry Smith + mat - the `MATSEQSBAIJ` matrix 106549b5e25fSSatish Balay - indices - the column indices 106649b5e25fSSatish Balay 106749b5e25fSSatish Balay Level: advanced 106849b5e25fSSatish Balay 106949b5e25fSSatish Balay Notes: 107049b5e25fSSatish Balay This can be called if you have precomputed the nonzero structure of the 107149b5e25fSSatish Balay matrix and want to provide it to the matrix object to improve the performance 107211a5261eSBarry Smith of the `MatSetValues()` operation. 107349b5e25fSSatish Balay 107449b5e25fSSatish Balay You MUST have set the correct numbers of nonzeros per row in the call to 107511a5261eSBarry Smith `MatCreateSeqSBAIJ()`, and the columns indices MUST be sorted. 107649b5e25fSSatish Balay 1077ab9f2c04SSatish Balay MUST be called before any calls to MatSetValues() 107849b5e25fSSatish Balay 107911a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreateSeqSBAIJ` 108049b5e25fSSatish Balay @*/ 1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat, PetscInt *indices) 1082d71ae5a4SJacob Faibussowitsch { 108349b5e25fSSatish Balay PetscFunctionBegin; 10840700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 1085dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 1086cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqSBAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 10873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 108849b5e25fSSatish Balay } 108949b5e25fSSatish Balay 1090d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqSBAIJ(Mat A, Mat B, MatStructure str) 1091d71ae5a4SJacob Faibussowitsch { 10924c7a3774SStefano Zampini PetscBool isbaij; 10933c896bc6SHong Zhang 10943c896bc6SHong Zhang PetscFunctionBegin; 10959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &isbaij, MATSEQSBAIJ, MATMPISBAIJ, "")); 109628b400f6SJacob Faibussowitsch PetscCheck(isbaij, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Not for matrix type %s", ((PetscObject)B)->type_name); 10974c7a3774SStefano Zampini /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. */ 10984c7a3774SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 10993c896bc6SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11003c896bc6SHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 11013c896bc6SHong Zhang 110208401ef6SPierre Jolivet PetscCheck(a->i[a->mbs] == b->i[b->mbs], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different"); 110308401ef6SPierre Jolivet PetscCheck(a->mbs == b->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of rows in two matrices are different"); 110408401ef6SPierre Jolivet PetscCheck(a->bs2 == b->bs2, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different block size"); 11059566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, a->a, a->bs2 * a->i[a->mbs])); 11069566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 11073c896bc6SHong Zhang } else { 11089566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(A)); 11099566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 11109566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(A)); 11113c896bc6SHong Zhang } 11123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11133c896bc6SHong Zhang } 11143c896bc6SHong Zhang 1115d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1116d71ae5a4SJacob Faibussowitsch { 1117a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11185fd66863SKarl Rupp 1119a6ece127SHong Zhang PetscFunctionBegin; 1120a6ece127SHong Zhang *array = a->a; 11213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1122a6ece127SHong Zhang } 1123a6ece127SHong Zhang 1124d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1125d71ae5a4SJacob Faibussowitsch { 1126a6ece127SHong Zhang PetscFunctionBegin; 1127cda14afcSprj- *array = NULL; 11283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1129a6ece127SHong Zhang } 1130a6ece127SHong Zhang 1131d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y, Mat X, PetscInt *nnz) 1132d71ae5a4SJacob Faibussowitsch { 1133b264fe52SHong Zhang PetscInt bs = Y->rmap->bs, mbs = Y->rmap->N / bs; 113452768537SHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data; 113552768537SHong Zhang Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ *)Y->data; 113652768537SHong Zhang 113752768537SHong Zhang PetscFunctionBegin; 113852768537SHong Zhang /* Set the number of nonzeros in the new matrix */ 11399566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(mbs, x->i, x->j, y->i, y->j, nnz)); 11403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 114152768537SHong Zhang } 114252768537SHong Zhang 1143d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 1144d71ae5a4SJacob Faibussowitsch { 114542ee4b1aSHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data, *y = (Mat_SeqSBAIJ *)Y->data; 114631ce2d13SHong Zhang PetscInt bs = Y->rmap->bs, bs2 = bs * bs; 1147e838b9e7SJed Brown PetscBLASInt one = 1; 114842ee4b1aSHong Zhang 114942ee4b1aSHong Zhang PetscFunctionBegin; 1150134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 1151134adf20SPierre Jolivet PetscBool e = x->nz == y->nz && x->mbs == y->mbs ? PETSC_TRUE : PETSC_FALSE; 1152134adf20SPierre Jolivet if (e) { 11539566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, x->mbs + 1, &e)); 1154134adf20SPierre Jolivet if (e) { 11559566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, x->i[x->mbs], &e)); 1156134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 1157134adf20SPierre Jolivet } 1158134adf20SPierre Jolivet } 115954c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 1160134adf20SPierre Jolivet } 116142ee4b1aSHong Zhang if (str == SAME_NONZERO_PATTERN) { 1162f4df32b1SMatthew Knepley PetscScalar alpha = a; 1163c5df96a5SBarry Smith PetscBLASInt bnz; 11649566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz * bs2, &bnz)); 1165792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, x->a, &one, y->a, &one)); 11669566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 1167ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 11689566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_TRUE)); 11699566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 11709566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_FALSE)); 117142ee4b1aSHong Zhang } else { 117252768537SHong Zhang Mat B; 117352768537SHong Zhang PetscInt *nnz; 117454c59aa7SJacob Faibussowitsch PetscCheck(bs == X->rmap->bs, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Matrices must have same block size"); 11759566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(X)); 11769566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(Y)); 11779566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 11789566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 11799566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 11809566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, Y->rmap->n, Y->cmap->n, Y->rmap->N, Y->cmap->N)); 11819566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, Y, Y)); 11829566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 11839566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqSBAIJ(Y, X, nnz)); 11849566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 118552768537SHong Zhang 11869566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 118752768537SHong Zhang 11889566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 11899566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 11909566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(X)); 11919566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(Y)); 119242ee4b1aSHong Zhang } 11933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119442ee4b1aSHong Zhang } 119542ee4b1aSHong Zhang 1196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1197d71ae5a4SJacob Faibussowitsch { 1198efcf0fc3SBarry Smith PetscFunctionBegin; 1199efcf0fc3SBarry Smith *flg = PETSC_TRUE; 12003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1201efcf0fc3SBarry Smith } 1202efcf0fc3SBarry Smith 1203d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A, PetscBool *flg) 1204d71ae5a4SJacob Faibussowitsch { 1205efcf0fc3SBarry Smith PetscFunctionBegin; 1206efcf0fc3SBarry Smith *flg = PETSC_TRUE; 12073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1208efcf0fc3SBarry Smith } 1209efcf0fc3SBarry Smith 1210d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1211d71ae5a4SJacob Faibussowitsch { 1212efcf0fc3SBarry Smith PetscFunctionBegin; 1213efcf0fc3SBarry Smith *flg = PETSC_FALSE; 12143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1215efcf0fc3SBarry Smith } 1216efcf0fc3SBarry Smith 1217d71ae5a4SJacob Faibussowitsch PetscErrorCode MatConjugate_SeqSBAIJ(Mat A) 1218d71ae5a4SJacob Faibussowitsch { 12192726fb6dSPierre Jolivet #if defined(PETSC_USE_COMPLEX) 12202726fb6dSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 12212726fb6dSPierre Jolivet PetscInt i, nz = a->bs2 * a->i[a->mbs]; 12222726fb6dSPierre Jolivet MatScalar *aa = a->a; 12232726fb6dSPierre Jolivet 12242726fb6dSPierre Jolivet PetscFunctionBegin; 12252726fb6dSPierre Jolivet for (i = 0; i < nz; i++) aa[i] = PetscConj(aa[i]); 12262726fb6dSPierre Jolivet #else 12272726fb6dSPierre Jolivet PetscFunctionBegin; 12282726fb6dSPierre Jolivet #endif 12293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12302726fb6dSPierre Jolivet } 12312726fb6dSPierre Jolivet 1232d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqSBAIJ(Mat A) 1233d71ae5a4SJacob Faibussowitsch { 123499cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 123599cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1236dd6ea824SBarry Smith MatScalar *aa = a->a; 123799cafbc1SBarry Smith 123899cafbc1SBarry Smith PetscFunctionBegin; 123999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 12403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 124199cafbc1SBarry Smith } 124299cafbc1SBarry Smith 1243d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A) 1244d71ae5a4SJacob Faibussowitsch { 124599cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 124699cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1247dd6ea824SBarry Smith MatScalar *aa = a->a; 124899cafbc1SBarry Smith 124999cafbc1SBarry Smith PetscFunctionBegin; 125099cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 12513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 125299cafbc1SBarry Smith } 125399cafbc1SBarry Smith 1254d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A, PetscInt is_n, const PetscInt is_idx[], PetscScalar diag, Vec x, Vec b) 1255d71ae5a4SJacob Faibussowitsch { 12563bededecSBarry Smith Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)A->data; 12573bededecSBarry Smith PetscInt i, j, k, count; 12583bededecSBarry Smith PetscInt bs = A->rmap->bs, bs2 = baij->bs2, row, col; 12593bededecSBarry Smith PetscScalar zero = 0.0; 12603bededecSBarry Smith MatScalar *aa; 12613bededecSBarry Smith const PetscScalar *xx; 12623bededecSBarry Smith PetscScalar *bb; 126356777dd2SBarry Smith PetscBool *zeroed, vecs = PETSC_FALSE; 12643bededecSBarry Smith 12653bededecSBarry Smith PetscFunctionBegin; 12663bededecSBarry Smith /* fix right hand side if needed */ 12673bededecSBarry Smith if (x && b) { 12689566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 12699566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 127056777dd2SBarry Smith vecs = PETSC_TRUE; 12713bededecSBarry Smith } 12723bededecSBarry Smith 12733bededecSBarry Smith /* zero the columns */ 12749566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 12753bededecSBarry Smith for (i = 0; i < is_n; i++) { 1276aed4548fSBarry Smith PetscCheck(is_idx[i] >= 0 && is_idx[i] < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", is_idx[i]); 12773bededecSBarry Smith zeroed[is_idx[i]] = PETSC_TRUE; 12783bededecSBarry Smith } 127956777dd2SBarry Smith if (vecs) { 128056777dd2SBarry Smith for (i = 0; i < A->rmap->N; i++) { 128156777dd2SBarry Smith row = i / bs; 128256777dd2SBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 128356777dd2SBarry Smith for (k = 0; k < bs; k++) { 128456777dd2SBarry Smith col = bs * baij->j[j] + k; 128556777dd2SBarry Smith if (col <= i) continue; 128656777dd2SBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 128726fbe8dcSKarl Rupp if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0] * xx[col]; 128826fbe8dcSKarl Rupp if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0] * xx[i]; 128956777dd2SBarry Smith } 129056777dd2SBarry Smith } 129156777dd2SBarry Smith } 129226fbe8dcSKarl Rupp for (i = 0; i < is_n; i++) bb[is_idx[i]] = diag * xx[is_idx[i]]; 129356777dd2SBarry Smith } 129456777dd2SBarry Smith 12953bededecSBarry Smith for (i = 0; i < A->rmap->N; i++) { 12963bededecSBarry Smith if (!zeroed[i]) { 12973bededecSBarry Smith row = i / bs; 12983bededecSBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 12993bededecSBarry Smith for (k = 0; k < bs; k++) { 13003bededecSBarry Smith col = bs * baij->j[j] + k; 13013bededecSBarry Smith if (zeroed[col]) { 13023bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 13033bededecSBarry Smith aa[0] = 0.0; 13043bededecSBarry Smith } 13053bededecSBarry Smith } 13063bededecSBarry Smith } 13073bededecSBarry Smith } 13083bededecSBarry Smith } 13099566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 131056777dd2SBarry Smith if (vecs) { 13119566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 13129566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 131356777dd2SBarry Smith } 13143bededecSBarry Smith 13153bededecSBarry Smith /* zero the rows */ 13163bededecSBarry Smith for (i = 0; i < is_n; i++) { 13173bededecSBarry Smith row = is_idx[i]; 13183bededecSBarry Smith count = (baij->i[row / bs + 1] - baij->i[row / bs]) * bs; 13193bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + baij->i[row / bs] * bs2 + (row % bs); 13203bededecSBarry Smith for (k = 0; k < count; k++) { 13213bededecSBarry Smith aa[0] = zero; 13223bededecSBarry Smith aa += bs; 13233bededecSBarry Smith } 1324dbbe0bcdSBarry Smith if (diag != 0.0) PetscUseTypeMethod(A, setvalues, 1, &row, 1, &row, &diag, INSERT_VALUES); 13253bededecSBarry Smith } 13269566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqSBAIJ(A, MAT_FINAL_ASSEMBLY)); 13273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13283bededecSBarry Smith } 13293bededecSBarry Smith 1330d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqSBAIJ(Mat Y, PetscScalar a) 1331d71ae5a4SJacob Faibussowitsch { 13327d68702bSBarry Smith Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)Y->data; 13337d68702bSBarry Smith 13347d68702bSBarry Smith PetscFunctionBegin; 133548a46eb9SPierre Jolivet if (!Y->preallocated || !aij->nz) PetscCall(MatSeqSBAIJSetPreallocation(Y, Y->rmap->bs, 1, NULL)); 13369566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(Y, a)); 13373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13387d68702bSBarry Smith } 13397d68702bSBarry Smith 134049b5e25fSSatish Balay /* -------------------------------------------------------------------*/ 13413964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ, 134249b5e25fSSatish Balay MatGetRow_SeqSBAIJ, 134349b5e25fSSatish Balay MatRestoreRow_SeqSBAIJ, 134449b5e25fSSatish Balay MatMult_SeqSBAIJ_N, 134597304618SKris Buschelman /* 4*/ MatMultAdd_SeqSBAIJ_N, 1346431c96f7SBarry Smith MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */ 1347e005ede5SBarry Smith MatMultAdd_SeqSBAIJ_N, 1348f4259b30SLisandro Dalcin NULL, 1349f4259b30SLisandro Dalcin NULL, 1350f4259b30SLisandro Dalcin NULL, 1351f4259b30SLisandro Dalcin /* 10*/ NULL, 1352f4259b30SLisandro Dalcin NULL, 1353c078aec8SLisandro Dalcin MatCholeskyFactor_SeqSBAIJ, 135441f059aeSBarry Smith MatSOR_SeqSBAIJ, 135549b5e25fSSatish Balay MatTranspose_SeqSBAIJ, 135697304618SKris Buschelman /* 15*/ MatGetInfo_SeqSBAIJ, 135749b5e25fSSatish Balay MatEqual_SeqSBAIJ, 135849b5e25fSSatish Balay MatGetDiagonal_SeqSBAIJ, 135949b5e25fSSatish Balay MatDiagonalScale_SeqSBAIJ, 136049b5e25fSSatish Balay MatNorm_SeqSBAIJ, 1361f4259b30SLisandro Dalcin /* 20*/ NULL, 136249b5e25fSSatish Balay MatAssemblyEnd_SeqSBAIJ, 136349b5e25fSSatish Balay MatSetOption_SeqSBAIJ, 136449b5e25fSSatish Balay MatZeroEntries_SeqSBAIJ, 1365f4259b30SLisandro Dalcin /* 24*/ NULL, 1366f4259b30SLisandro Dalcin NULL, 1367f4259b30SLisandro Dalcin NULL, 1368f4259b30SLisandro Dalcin NULL, 1369f4259b30SLisandro Dalcin NULL, 137026cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 1371f4259b30SLisandro Dalcin NULL, 1372f4259b30SLisandro Dalcin NULL, 1373f4259b30SLisandro Dalcin NULL, 1374f4259b30SLisandro Dalcin NULL, 1375d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqSBAIJ, 1376f4259b30SLisandro Dalcin NULL, 1377f4259b30SLisandro Dalcin NULL, 1378f4259b30SLisandro Dalcin NULL, 1379c84f5b01SHong Zhang MatICCFactor_SeqSBAIJ, 1380d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqSBAIJ, 13817dae84e0SHong Zhang MatCreateSubMatrices_SeqSBAIJ, 138249b5e25fSSatish Balay MatIncreaseOverlap_SeqSBAIJ, 138349b5e25fSSatish Balay MatGetValues_SeqSBAIJ, 13843c896bc6SHong Zhang MatCopy_SeqSBAIJ, 1385f4259b30SLisandro Dalcin /* 44*/ NULL, 138649b5e25fSSatish Balay MatScale_SeqSBAIJ, 13877d68702bSBarry Smith MatShift_SeqSBAIJ, 1388f4259b30SLisandro Dalcin NULL, 13893bededecSBarry Smith MatZeroRowsColumns_SeqSBAIJ, 1390f4259b30SLisandro Dalcin /* 49*/ NULL, 139149b5e25fSSatish Balay MatGetRowIJ_SeqSBAIJ, 139249b5e25fSSatish Balay MatRestoreRowIJ_SeqSBAIJ, 1393f4259b30SLisandro Dalcin NULL, 1394f4259b30SLisandro Dalcin NULL, 1395f4259b30SLisandro Dalcin /* 54*/ NULL, 1396f4259b30SLisandro Dalcin NULL, 1397f4259b30SLisandro Dalcin NULL, 1398dc29a518SPierre Jolivet MatPermute_SeqSBAIJ, 139949b5e25fSSatish Balay MatSetValuesBlocked_SeqSBAIJ, 14007dae84e0SHong Zhang /* 59*/ MatCreateSubMatrix_SeqSBAIJ, 1401f4259b30SLisandro Dalcin NULL, 1402f4259b30SLisandro Dalcin NULL, 1403f4259b30SLisandro Dalcin NULL, 1404f4259b30SLisandro Dalcin NULL, 1405f4259b30SLisandro Dalcin /* 64*/ NULL, 1406f4259b30SLisandro Dalcin NULL, 1407f4259b30SLisandro Dalcin NULL, 1408f4259b30SLisandro Dalcin NULL, 1409f4259b30SLisandro Dalcin NULL, 1410d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqSBAIJ, 1411f4259b30SLisandro Dalcin NULL, 141228d58a37SPierre Jolivet MatConvert_MPISBAIJ_Basic, 1413f4259b30SLisandro Dalcin NULL, 1414f4259b30SLisandro Dalcin NULL, 1415f4259b30SLisandro Dalcin /* 74*/ NULL, 1416f4259b30SLisandro Dalcin NULL, 1417f4259b30SLisandro Dalcin NULL, 1418f4259b30SLisandro Dalcin NULL, 1419f4259b30SLisandro Dalcin NULL, 1420f4259b30SLisandro Dalcin /* 79*/ NULL, 1421f4259b30SLisandro Dalcin NULL, 1422f4259b30SLisandro Dalcin NULL, 142397304618SKris Buschelman MatGetInertia_SeqSBAIJ, 14245bba2384SShri Abhyankar MatLoad_SeqSBAIJ, 1425d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqSBAIJ, 1426865e5f61SKris Buschelman MatIsHermitian_SeqSBAIJ, 1427efcf0fc3SBarry Smith MatIsStructurallySymmetric_SeqSBAIJ, 1428f4259b30SLisandro Dalcin NULL, 1429f4259b30SLisandro Dalcin NULL, 1430f4259b30SLisandro Dalcin /* 89*/ NULL, 1431f4259b30SLisandro Dalcin NULL, 1432f4259b30SLisandro Dalcin NULL, 1433f4259b30SLisandro Dalcin NULL, 1434f4259b30SLisandro Dalcin NULL, 1435f4259b30SLisandro Dalcin /* 94*/ NULL, 1436f4259b30SLisandro Dalcin NULL, 1437f4259b30SLisandro Dalcin NULL, 1438f4259b30SLisandro Dalcin NULL, 1439f4259b30SLisandro Dalcin NULL, 1440f4259b30SLisandro Dalcin /* 99*/ NULL, 1441f4259b30SLisandro Dalcin NULL, 1442f4259b30SLisandro Dalcin NULL, 14432726fb6dSPierre Jolivet MatConjugate_SeqSBAIJ, 1444f4259b30SLisandro Dalcin NULL, 1445f4259b30SLisandro Dalcin /*104*/ NULL, 144699cafbc1SBarry Smith MatRealPart_SeqSBAIJ, 1447f5edf698SHong Zhang MatImaginaryPart_SeqSBAIJ, 1448f5edf698SHong Zhang MatGetRowUpperTriangular_SeqSBAIJ, 14492af78befSBarry Smith MatRestoreRowUpperTriangular_SeqSBAIJ, 1450f4259b30SLisandro Dalcin /*109*/ NULL, 1451f4259b30SLisandro Dalcin NULL, 1452f4259b30SLisandro Dalcin NULL, 1453f4259b30SLisandro Dalcin NULL, 1454547795f9SHong Zhang MatMissingDiagonal_SeqSBAIJ, 1455f4259b30SLisandro Dalcin /*114*/ NULL, 1456f4259b30SLisandro Dalcin NULL, 1457f4259b30SLisandro Dalcin NULL, 1458f4259b30SLisandro Dalcin NULL, 1459f4259b30SLisandro Dalcin NULL, 1460f4259b30SLisandro Dalcin /*119*/ NULL, 1461f4259b30SLisandro Dalcin NULL, 1462f4259b30SLisandro Dalcin NULL, 1463f4259b30SLisandro Dalcin NULL, 1464f4259b30SLisandro Dalcin NULL, 1465f4259b30SLisandro Dalcin /*124*/ NULL, 1466f4259b30SLisandro Dalcin NULL, 1467f4259b30SLisandro Dalcin NULL, 1468f4259b30SLisandro Dalcin NULL, 1469f4259b30SLisandro Dalcin NULL, 1470f4259b30SLisandro Dalcin /*129*/ NULL, 1471f4259b30SLisandro Dalcin NULL, 1472f4259b30SLisandro Dalcin NULL, 1473f4259b30SLisandro Dalcin NULL, 1474f4259b30SLisandro Dalcin NULL, 1475f4259b30SLisandro Dalcin /*134*/ NULL, 1476f4259b30SLisandro Dalcin NULL, 1477f4259b30SLisandro Dalcin NULL, 1478f4259b30SLisandro Dalcin NULL, 1479f4259b30SLisandro Dalcin NULL, 148046533700Sstefano_zampini /*139*/ MatSetBlockSizes_Default, 1481f4259b30SLisandro Dalcin NULL, 1482f4259b30SLisandro Dalcin NULL, 1483f4259b30SLisandro Dalcin NULL, 1484f4259b30SLisandro Dalcin NULL, 1485d70f29a3SPierre Jolivet /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ, 1486d70f29a3SPierre Jolivet NULL, 1487d70f29a3SPierre Jolivet NULL, 148899a7f59eSMark Adams NULL, 148999a7f59eSMark Adams NULL, 14907fb60732SBarry Smith NULL, 1491dec0b466SHong Zhang /*150*/ NULL, 1492dec0b466SHong Zhang NULL}; 1493be1d678aSKris Buschelman 1494d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat) 1495d71ae5a4SJacob Faibussowitsch { 14964afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1497d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 149849b5e25fSSatish Balay 149949b5e25fSSatish Balay PetscFunctionBegin; 150008401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 150149b5e25fSSatish Balay 150249b5e25fSSatish Balay /* allocate space for values if not already there */ 150348a46eb9SPierre Jolivet if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); 150449b5e25fSSatish Balay 150549b5e25fSSatish Balay /* copy values over */ 15069566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 15073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 150849b5e25fSSatish Balay } 150949b5e25fSSatish Balay 1510d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat) 1511d71ae5a4SJacob Faibussowitsch { 15124afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1513d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 151449b5e25fSSatish Balay 151549b5e25fSSatish Balay PetscFunctionBegin; 151608401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 151728b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 151849b5e25fSSatish Balay 151949b5e25fSSatish Balay /* copy values over */ 15209566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 15213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152249b5e25fSSatish Balay } 152349b5e25fSSatish Balay 1524d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B, PetscInt bs, PetscInt nz, PetscInt *nnz) 1525d71ae5a4SJacob Faibussowitsch { 1526c464158bSHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 15274dcd73b1SHong Zhang PetscInt i, mbs, nbs, bs2; 15282576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, flg = PETSC_FALSE, realalloc = PETSC_FALSE; 152949b5e25fSSatish Balay 1530ad79cf63SBarry Smith if (B->hash_active) { 1531ad79cf63SBarry Smith PetscInt bs; 1532ad79cf63SBarry Smith PetscCall(PetscMemcpy(&B->ops, &b->cops, sizeof(*(B->ops)))); 1533ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 1534ad79cf63SBarry Smith PetscCall(MatGetBlockSize(B, &bs)); 1535ad79cf63SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&b->bht)); 1536ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 1537ad79cf63SBarry Smith PetscCall(PetscFree(b->bdnz)); 1538ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 1539ad79cf63SBarry Smith } 154049b5e25fSSatish Balay PetscFunctionBegin; 15412576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 1542db4efbfdSBarry Smith 15439566063dSJacob Faibussowitsch PetscCall(MatSetBlockSize(B, PetscAbs(bs))); 15449566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 15459566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 154608401ef6SPierre Jolivet PetscCheck(B->rmap->N <= B->cmap->N, PETSC_COMM_SELF, PETSC_ERR_SUP, "SEQSBAIJ matrix cannot have more rows %" PetscInt_FMT " than columns %" PetscInt_FMT, B->rmap->N, B->cmap->N); 15479566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 1548899cda47SBarry Smith 154921940c7eSstefano_zampini B->preallocated = PETSC_TRUE; 155021940c7eSstefano_zampini 1551d0f46423SBarry Smith mbs = B->rmap->N / bs; 15524dcd73b1SHong Zhang nbs = B->cmap->n / bs; 155349b5e25fSSatish Balay bs2 = bs * bs; 155449b5e25fSSatish Balay 1555aed4548fSBarry Smith PetscCheck(mbs * bs == B->rmap->N && nbs * bs == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Number rows, cols must be divisible by blocksize"); 155649b5e25fSSatish Balay 1557ab93d7beSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 1558ab93d7beSBarry Smith skipallocation = PETSC_TRUE; 1559ab93d7beSBarry Smith nz = 0; 1560ab93d7beSBarry Smith } 1561ab93d7beSBarry Smith 1562435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3; 156308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 156449b5e25fSSatish Balay if (nnz) { 156549b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 156608401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 156708401ef6SPierre Jolivet PetscCheck(nnz[i] <= nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than block row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " block rowlength %" PetscInt_FMT, i, nnz[i], nbs); 156849b5e25fSSatish Balay } 156949b5e25fSSatish Balay } 157049b5e25fSSatish Balay 1571db4efbfdSBarry Smith B->ops->mult = MatMult_SeqSBAIJ_N; 1572db4efbfdSBarry Smith B->ops->multadd = MatMultAdd_SeqSBAIJ_N; 1573db4efbfdSBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_N; 1574db4efbfdSBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N; 157526fbe8dcSKarl Rupp 15769566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 157749b5e25fSSatish Balay if (!flg) { 157849b5e25fSSatish Balay switch (bs) { 157949b5e25fSSatish Balay case 1: 158049b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_1; 158149b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_1; 1582431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_1; 1583431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1; 158449b5e25fSSatish Balay break; 158549b5e25fSSatish Balay case 2: 158649b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_2; 158749b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_2; 1588431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_2; 1589431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2; 159049b5e25fSSatish Balay break; 159149b5e25fSSatish Balay case 3: 159249b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_3; 159349b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_3; 1594431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_3; 1595431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3; 159649b5e25fSSatish Balay break; 159749b5e25fSSatish Balay case 4: 159849b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_4; 159949b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_4; 1600431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_4; 1601431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4; 160249b5e25fSSatish Balay break; 160349b5e25fSSatish Balay case 5: 160449b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_5; 160549b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_5; 1606431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_5; 1607431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5; 160849b5e25fSSatish Balay break; 160949b5e25fSSatish Balay case 6: 161049b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_6; 161149b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_6; 1612431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_6; 1613431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6; 161449b5e25fSSatish Balay break; 161549b5e25fSSatish Balay case 7: 1616de53e5efSHong Zhang B->ops->mult = MatMult_SeqSBAIJ_7; 161749b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_7; 1618431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_7; 1619431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7; 162049b5e25fSSatish Balay break; 162149b5e25fSSatish Balay } 162249b5e25fSSatish Balay } 162349b5e25fSSatish Balay 162449b5e25fSSatish Balay b->mbs = mbs; 16254dcd73b1SHong Zhang b->nbs = nbs; 1626ab93d7beSBarry Smith if (!skipallocation) { 16272ee49352SLisandro Dalcin if (!b->imax) { 16289566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mbs, &b->imax, mbs, &b->ilen)); 162926fbe8dcSKarl Rupp 1630c760cd28SBarry Smith b->free_imax_ilen = PETSC_TRUE; 16312ee49352SLisandro Dalcin } 163249b5e25fSSatish Balay if (!nnz) { 1633435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 163449b5e25fSSatish Balay else if (nz <= 0) nz = 1; 16355d2a9ed1SStefano Zampini nz = PetscMin(nbs, nz); 163626fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->imax[i] = nz; 16379566063dSJacob Faibussowitsch PetscCall(PetscIntMultError(nz, mbs, &nz)); 163849b5e25fSSatish Balay } else { 1639c73702f5SBarry Smith PetscInt64 nz64 = 0; 16409371c9d4SSatish Balay for (i = 0; i < mbs; i++) { 16419371c9d4SSatish Balay b->imax[i] = nnz[i]; 16429371c9d4SSatish Balay nz64 += nnz[i]; 16439371c9d4SSatish Balay } 16449566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 164549b5e25fSSatish Balay } 16462ee49352SLisandro Dalcin /* b->ilen will count nonzeros in each block row so far. */ 164726fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->ilen[i] = 0; 16486c6c5352SBarry Smith /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */ 164949b5e25fSSatish Balay 165049b5e25fSSatish Balay /* allocate the matrix space */ 16519566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 16529566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &b->a, nz, &b->j, B->rmap->N + 1, &b->i)); 16539566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->a, nz * bs2)); 16549566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->j, nz)); 165526fbe8dcSKarl Rupp 165649b5e25fSSatish Balay b->singlemalloc = PETSC_TRUE; 165749b5e25fSSatish Balay 165849b5e25fSSatish Balay /* pointer to beginning of each row */ 1659e60cf9a0SBarry Smith b->i[0] = 0; 166026fbe8dcSKarl Rupp for (i = 1; i < mbs + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 166126fbe8dcSKarl Rupp 1662e6b907acSBarry Smith b->free_a = PETSC_TRUE; 1663e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 1664e811da20SHong Zhang } else { 1665e6b907acSBarry Smith b->free_a = PETSC_FALSE; 1666e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 1667ab93d7beSBarry Smith } 166849b5e25fSSatish Balay 166949b5e25fSSatish Balay b->bs2 = bs2; 16706c6c5352SBarry Smith b->nz = 0; 1671b32cb4a7SJed Brown b->maxnz = nz; 1672f4259b30SLisandro Dalcin b->inew = NULL; 1673f4259b30SLisandro Dalcin b->jnew = NULL; 1674f4259b30SLisandro Dalcin b->anew = NULL; 1675f4259b30SLisandro Dalcin b->a2anew = NULL; 16761a3463dfSHong Zhang b->permute = PETSC_FALSE; 1677cb7b82ddSBarry Smith 1678cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 1679cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 16809566063dSJacob Faibussowitsch if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 16813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1682c464158bSHong Zhang } 1683153ea458SHong Zhang 1684d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B, PetscInt bs, const PetscInt ii[], const PetscInt jj[], const PetscScalar V[]) 1685d71ae5a4SJacob Faibussowitsch { 16860cd7f59aSBarry Smith PetscInt i, j, m, nz, anz, nz_max = 0, *nnz; 1687f4259b30SLisandro Dalcin PetscScalar *values = NULL; 168838f409ebSLisandro Dalcin PetscBool roworiented = ((Mat_SeqSBAIJ *)B->data)->roworiented; 16890cd7f59aSBarry Smith 169038f409ebSLisandro Dalcin PetscFunctionBegin; 169108401ef6SPierre Jolivet PetscCheck(bs >= 1, PetscObjectComm((PetscObject)B), PETSC_ERR_ARG_OUTOFRANGE, "Invalid block size specified, must be positive but it is %" PetscInt_FMT, bs); 16929566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->rmap, bs)); 16939566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->cmap, bs)); 16949566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 16959566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 16969566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 169738f409ebSLisandro Dalcin m = B->rmap->n / bs; 169838f409ebSLisandro Dalcin 1699aed4548fSBarry Smith PetscCheck(!ii[0], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "ii[0] must be 0 but it is %" PetscInt_FMT, ii[0]); 17009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 170138f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 170238f409ebSLisandro Dalcin nz = ii[i + 1] - ii[i]; 170308401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 17040cd7f59aSBarry Smith anz = 0; 17050cd7f59aSBarry Smith for (j = 0; j < nz; j++) { 17060cd7f59aSBarry Smith /* count only values on the diagonal or above */ 17070cd7f59aSBarry Smith if (jj[ii[i] + j] >= i) { 17080cd7f59aSBarry Smith anz = nz - j; 17090cd7f59aSBarry Smith break; 17100cd7f59aSBarry Smith } 17110cd7f59aSBarry Smith } 17120cd7f59aSBarry Smith nz_max = PetscMax(nz_max, anz); 17130cd7f59aSBarry Smith nnz[i] = anz; 171438f409ebSLisandro Dalcin } 17159566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 17169566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 171738f409ebSLisandro Dalcin 171838f409ebSLisandro Dalcin values = (PetscScalar *)V; 171948a46eb9SPierre Jolivet if (!values) PetscCall(PetscCalloc1(bs * bs * nz_max, &values)); 172038f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 172138f409ebSLisandro Dalcin PetscInt ncols = ii[i + 1] - ii[i]; 172238f409ebSLisandro Dalcin const PetscInt *icols = jj + ii[i]; 172338f409ebSLisandro Dalcin if (!roworiented || bs == 1) { 172438f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * ii[i]) : 0); 17259566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, ncols, icols, svals, INSERT_VALUES)); 172638f409ebSLisandro Dalcin } else { 172738f409ebSLisandro Dalcin for (j = 0; j < ncols; j++) { 172838f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * (ii[i] + j)) : 0); 17299566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, 1, &icols[j], svals, INSERT_VALUES)); 173038f409ebSLisandro Dalcin } 173138f409ebSLisandro Dalcin } 173238f409ebSLisandro Dalcin } 17339566063dSJacob Faibussowitsch if (!V) PetscCall(PetscFree(values)); 17349566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 17359566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 17369566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 17373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 173838f409ebSLisandro Dalcin } 173938f409ebSLisandro Dalcin 1740db4efbfdSBarry Smith /* 1741db4efbfdSBarry Smith This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization 1742db4efbfdSBarry Smith */ 1743d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B, PetscBool natural) 1744d71ae5a4SJacob Faibussowitsch { 1745ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 1746db4efbfdSBarry Smith PetscInt bs = B->rmap->bs; 1747db4efbfdSBarry Smith 1748db4efbfdSBarry Smith PetscFunctionBegin; 17499566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 1750db4efbfdSBarry Smith if (flg) bs = 8; 1751db4efbfdSBarry Smith 1752db4efbfdSBarry Smith if (!natural) { 1753db4efbfdSBarry Smith switch (bs) { 1754d71ae5a4SJacob Faibussowitsch case 1: 1755d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace; 1756d71ae5a4SJacob Faibussowitsch break; 1757d71ae5a4SJacob Faibussowitsch case 2: 1758d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2; 1759d71ae5a4SJacob Faibussowitsch break; 1760d71ae5a4SJacob Faibussowitsch case 3: 1761d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3; 1762d71ae5a4SJacob Faibussowitsch break; 1763d71ae5a4SJacob Faibussowitsch case 4: 1764d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4; 1765d71ae5a4SJacob Faibussowitsch break; 1766d71ae5a4SJacob Faibussowitsch case 5: 1767d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5; 1768d71ae5a4SJacob Faibussowitsch break; 1769d71ae5a4SJacob Faibussowitsch case 6: 1770d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6; 1771d71ae5a4SJacob Faibussowitsch break; 1772d71ae5a4SJacob Faibussowitsch case 7: 1773d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7; 1774d71ae5a4SJacob Faibussowitsch break; 1775d71ae5a4SJacob Faibussowitsch default: 1776d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N; 1777d71ae5a4SJacob Faibussowitsch break; 1778db4efbfdSBarry Smith } 1779db4efbfdSBarry Smith } else { 1780db4efbfdSBarry Smith switch (bs) { 1781d71ae5a4SJacob Faibussowitsch case 1: 1782d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace; 1783d71ae5a4SJacob Faibussowitsch break; 1784d71ae5a4SJacob Faibussowitsch case 2: 1785d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering; 1786d71ae5a4SJacob Faibussowitsch break; 1787d71ae5a4SJacob Faibussowitsch case 3: 1788d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering; 1789d71ae5a4SJacob Faibussowitsch break; 1790d71ae5a4SJacob Faibussowitsch case 4: 1791d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering; 1792d71ae5a4SJacob Faibussowitsch break; 1793d71ae5a4SJacob Faibussowitsch case 5: 1794d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering; 1795d71ae5a4SJacob Faibussowitsch break; 1796d71ae5a4SJacob Faibussowitsch case 6: 1797d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering; 1798d71ae5a4SJacob Faibussowitsch break; 1799d71ae5a4SJacob Faibussowitsch case 7: 1800d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering; 1801d71ae5a4SJacob Faibussowitsch break; 1802d71ae5a4SJacob Faibussowitsch default: 1803d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering; 1804d71ae5a4SJacob Faibussowitsch break; 1805db4efbfdSBarry Smith } 1806db4efbfdSBarry Smith } 18073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1808db4efbfdSBarry Smith } 1809db4efbfdSBarry Smith 1810cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType, MatReuse, Mat *); 1811cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType, MatReuse, Mat *); 1812d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatFactorGetSolverType_petsc(Mat A, MatSolverType *type) 1813d71ae5a4SJacob Faibussowitsch { 18144ac6704cSBarry Smith PetscFunctionBegin; 18154ac6704cSBarry Smith *type = MATSOLVERPETSC; 18163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18174ac6704cSBarry Smith } 1818d769727bSBarry Smith 1819d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A, MatFactorType ftype, Mat *B) 1820d71ae5a4SJacob Faibussowitsch { 1821d0f46423SBarry Smith PetscInt n = A->rmap->n; 18225c9eb25fSBarry Smith 18235c9eb25fSBarry Smith PetscFunctionBegin; 18240e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX) 1825b94d7dedSBarry Smith PetscCheck(A->hermitian != PETSC_BOOL3_TRUE || A->symmetric == PETSC_BOOL3_TRUE || (ftype != MAT_FACTOR_CHOLESKY && ftype != MAT_FACTOR_ICC), PETSC_COMM_SELF, PETSC_ERR_SUP, "Hermitian CHOLESKY or ICC Factor is not supported"); 18260e92d65fSHong Zhang #endif 1827eb1ec7c1SStefano Zampini 18289566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 18299566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, n, n, n, n)); 18305c9eb25fSBarry Smith if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) { 18319566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATSEQSBAIJ)); 18329566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*B, A->rmap->bs, MAT_SKIP_ALLOCATION, NULL)); 183326fbe8dcSKarl Rupp 18347b056e98SHong Zhang (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ; 1835c6d0d4f0SHong Zhang (*B)->ops->iccfactorsymbolic = MatICCFactorSymbolic_SeqSBAIJ; 18369566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_CHOLESKY])); 18379566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_ICC])); 1838e32f2f54SBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "Factor type not supported"); 183900c67f3bSHong Zhang 1840d5f3da31SBarry Smith (*B)->factortype = ftype; 1841f73b0415SBarry Smith (*B)->canuseordering = PETSC_TRUE; 18429566063dSJacob Faibussowitsch PetscCall(PetscFree((*B)->solvertype)); 18439566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &(*B)->solvertype)); 18449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)*B, "MatFactorGetSolverType_C", MatFactorGetSolverType_petsc)); 18453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18465c9eb25fSBarry Smith } 18475c9eb25fSBarry Smith 18488397e458SBarry Smith /*@C 184911a5261eSBarry Smith MatSeqSBAIJGetArray - gives access to the array where the data for a `MATSEQSBAIJ` matrix is stored 18508397e458SBarry Smith 18518397e458SBarry Smith Not Collective 18528397e458SBarry Smith 18538397e458SBarry Smith Input Parameter: 185411a5261eSBarry Smith . mat - a `MATSEQSBAIJ` matrix 18558397e458SBarry Smith 18568397e458SBarry Smith Output Parameter: 18578397e458SBarry Smith . array - pointer to the data 18588397e458SBarry Smith 18598397e458SBarry Smith Level: intermediate 18608397e458SBarry Smith 186111a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatSeqSBAIJRestoreArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18628397e458SBarry Smith @*/ 1863d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJGetArray(Mat A, PetscScalar **array) 1864d71ae5a4SJacob Faibussowitsch { 18658397e458SBarry Smith PetscFunctionBegin; 1866cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJGetArray_C", (Mat, PetscScalar **), (A, array)); 18673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18688397e458SBarry Smith } 18698397e458SBarry Smith 18708397e458SBarry Smith /*@C 187111a5261eSBarry Smith MatSeqSBAIJRestoreArray - returns access to the array where the data for a `MATSEQSBAIJ` matrix is stored obtained by `MatSeqSBAIJGetArray()` 18728397e458SBarry Smith 18738397e458SBarry Smith Not Collective 18748397e458SBarry Smith 18758397e458SBarry Smith Input Parameters: 1876a2b725a8SWilliam Gropp + mat - a MATSEQSBAIJ matrix 1877a2b725a8SWilliam Gropp - array - pointer to the data 18788397e458SBarry Smith 18798397e458SBarry Smith Level: intermediate 18808397e458SBarry Smith 188111a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatSeqSBAIJGetArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18828397e458SBarry Smith @*/ 1883d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJRestoreArray(Mat A, PetscScalar **array) 1884d71ae5a4SJacob Faibussowitsch { 18858397e458SBarry Smith PetscFunctionBegin; 1886cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJRestoreArray_C", (Mat, PetscScalar **), (A, array)); 18873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18888397e458SBarry Smith } 18898397e458SBarry Smith 18900bad9183SKris Buschelman /*MC 1891fafad747SKris Buschelman MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices, 18920bad9183SKris Buschelman based on block compressed sparse row format. Only the upper triangular portion of the matrix is stored. 18930bad9183SKris Buschelman 1894828413b8SBarry Smith For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you 189511a5261eSBarry Smith can call `MatSetOption`(`Mat`, `MAT_HERMITIAN`). 1896828413b8SBarry Smith 18970bad9183SKris Buschelman Options Database Keys: 189811a5261eSBarry Smith . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to `MatSetFromOptions()` 18990bad9183SKris Buschelman 190095452b02SPatrick Sanan Notes: 190195452b02SPatrick Sanan By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not 190211a5261eSBarry Smith stored and it is assumed they symmetric to the upper triangular). If you call `MatSetOption`(`Mat`,`MAT_IGNORE_LOWER_TRIANGULAR`,`PETSC_FALSE`) or use 190371dad5bbSBarry Smith the options database -mat_ignore_lower_triangular false it will generate an error if you try to set a value in the lower triangular portion. 190471dad5bbSBarry Smith 1905476417e5SBarry Smith The number of rows in the matrix must be less than or equal to the number of columns 190671dad5bbSBarry Smith 19070bad9183SKris Buschelman Level: beginner 19080bad9183SKris Buschelman 190911a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreateSeqSBAIJ()`, `MatType`, `MATMPISBAIJ` 19100bad9183SKris Buschelman M*/ 1911d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B) 1912d71ae5a4SJacob Faibussowitsch { 1913a23d5eceSKris Buschelman Mat_SeqSBAIJ *b; 191413f74950SBarry Smith PetscMPIInt size; 1915ace3abfcSBarry Smith PetscBool no_unroll = PETSC_FALSE, no_inode = PETSC_FALSE; 1916a23d5eceSKris Buschelman 1917a23d5eceSKris Buschelman PetscFunctionBegin; 19189566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 191908401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Comm must be of size 1"); 1920a23d5eceSKris Buschelman 19214dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 1922a23d5eceSKris Buschelman B->data = (void *)b; 19239566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 192426fbe8dcSKarl Rupp 1925a23d5eceSKris Buschelman B->ops->destroy = MatDestroy_SeqSBAIJ; 1926a23d5eceSKris Buschelman B->ops->view = MatView_SeqSBAIJ; 1927f4259b30SLisandro Dalcin b->row = NULL; 1928f4259b30SLisandro Dalcin b->icol = NULL; 1929a23d5eceSKris Buschelman b->reallocs = 0; 1930f4259b30SLisandro Dalcin b->saved_values = NULL; 19310def2e27SBarry Smith b->inode.limit = 5; 19320def2e27SBarry Smith b->inode.max_limit = 5; 1933a23d5eceSKris Buschelman 1934a23d5eceSKris Buschelman b->roworiented = PETSC_TRUE; 1935a23d5eceSKris Buschelman b->nonew = 0; 1936f4259b30SLisandro Dalcin b->diag = NULL; 1937f4259b30SLisandro Dalcin b->solve_work = NULL; 1938f4259b30SLisandro Dalcin b->mult_work = NULL; 1939f4259b30SLisandro Dalcin B->spptr = NULL; 1940f2cbd3d5SJed Brown B->info.nz_unneeded = (PetscReal)b->maxnz * b->bs2; 1941a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 1942a23d5eceSKris Buschelman 1943f4259b30SLisandro Dalcin b->inew = NULL; 1944f4259b30SLisandro Dalcin b->jnew = NULL; 1945f4259b30SLisandro Dalcin b->anew = NULL; 1946f4259b30SLisandro Dalcin b->a2anew = NULL; 1947a23d5eceSKris Buschelman b->permute = PETSC_FALSE; 1948a23d5eceSKris Buschelman 194971dad5bbSBarry Smith b->ignore_ltriangular = PETSC_TRUE; 195026fbe8dcSKarl Rupp 19519566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_ignore_lower_triangular", &b->ignore_ltriangular, NULL)); 1952941593c8SHong Zhang 1953f5edf698SHong Zhang b->getrow_utriangular = PETSC_FALSE; 195426fbe8dcSKarl Rupp 19559566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_getrow_uppertriangular", &b->getrow_utriangular, NULL)); 1956f5edf698SHong Zhang 19579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJGetArray_C", MatSeqSBAIJGetArray_SeqSBAIJ)); 19589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJRestoreArray_C", MatSeqSBAIJRestoreArray_SeqSBAIJ)); 19599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqSBAIJ)); 19609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqSBAIJ)); 19619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetColumnIndices_C", MatSeqSBAIJSetColumnIndices_SeqSBAIJ)); 19629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqaij_C", MatConvert_SeqSBAIJ_SeqAIJ)); 19639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqbaij_C", MatConvert_SeqSBAIJ_SeqBAIJ)); 19649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocation_C", MatSeqSBAIJSetPreallocation_SeqSBAIJ)); 19659566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocationCSR_C", MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ)); 19666214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 19679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_elemental_C", MatConvert_SeqSBAIJ_Elemental)); 19686214f412SHong Zhang #endif 1969d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 19709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_scalapack_C", MatConvert_SBAIJ_ScaLAPACK)); 1971d24d4204SJose E. Roman #endif 197223ce1328SBarry Smith 1973b94d7dedSBarry Smith B->symmetry_eternal = PETSC_TRUE; 1974b94d7dedSBarry Smith B->structural_symmetry_eternal = PETSC_TRUE; 1975b94d7dedSBarry Smith B->symmetric = PETSC_BOOL3_TRUE; 1976b94d7dedSBarry Smith B->structurally_symmetric = PETSC_BOOL3_TRUE; 1977eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 1978b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_FALSE; 1979eb1ec7c1SStefano Zampini #else 1980b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_TRUE; 1981eb1ec7c1SStefano Zampini #endif 198213647f61SHong Zhang 19839566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQSBAIJ)); 19840def2e27SBarry Smith 1985d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)B), ((PetscObject)B)->prefix, "Options for SEQSBAIJ matrix", "Mat"); 19869566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_unroll", "Do not optimize for inodes (slower)", NULL, no_unroll, &no_unroll, NULL)); 198748a46eb9SPierre Jolivet if (no_unroll) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_unroll\n")); 19889566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_inode", "Do not optimize for inodes (slower)", NULL, no_inode, &no_inode, NULL)); 19899566063dSJacob Faibussowitsch if (no_inode) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_inode\n")); 19909566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-mat_inode_limit", "Do not use inodes larger then this value", NULL, b->inode.limit, &b->inode.limit, NULL)); 1991d0609cedSBarry Smith PetscOptionsEnd(); 1992ace3abfcSBarry Smith b->inode.use = (PetscBool)(!(no_unroll || no_inode)); 19930def2e27SBarry Smith if (b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit; 19943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1995a23d5eceSKris Buschelman } 1996a23d5eceSKris Buschelman 1997a23d5eceSKris Buschelman /*@C 1998a23d5eceSKris Buschelman MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block 199911a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 2000a23d5eceSKris Buschelman user should preallocate the matrix storage by setting the parameter nz 2001a23d5eceSKris Buschelman (or the array nnz). By setting these parameters accurately, performance 2002a23d5eceSKris Buschelman during matrix assembly can be increased by more than a factor of 50. 2003a23d5eceSKris Buschelman 2004c3339decSBarry Smith Collective 2005a23d5eceSKris Buschelman 2006a23d5eceSKris Buschelman Input Parameters: 20071c4f3114SJed Brown + B - the symmetric matrix 200811a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 200911a5261eSBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()` 2010a23d5eceSKris Buschelman . nz - number of block nonzeros per block row (same for all rows) 2011a23d5eceSKris Buschelman - nnz - array containing the number of block nonzeros in the upper triangular plus 20120298fd71SBarry Smith diagonal portion of each block (possibly different for each block row) or NULL 2013a23d5eceSKris Buschelman 2014a23d5eceSKris Buschelman Options Database Keys: 2015a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2016a23d5eceSKris Buschelman block calculations (much slower) 2017a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use (only works if a negative bs is passed in 2018a23d5eceSKris Buschelman 2019a23d5eceSKris Buschelman Level: intermediate 2020a23d5eceSKris Buschelman 2021a23d5eceSKris Buschelman Notes: 2022a23d5eceSKris Buschelman Specify the preallocated storage with either nz or nnz (not both). 202311a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 2024651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2025a23d5eceSKris Buschelman 202611a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 2027aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 2028aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 2029aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 2030aa95bbe8SBarry Smith 203149a6f317SBarry Smith If the nnz parameter is given then the nz parameter is ignored 203249a6f317SBarry Smith 2033651615e1SBarry Smith .seealso: [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2034a23d5eceSKris Buschelman @*/ 2035d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 2036d71ae5a4SJacob Faibussowitsch { 2037a23d5eceSKris Buschelman PetscFunctionBegin; 20386ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 20396ba663aaSJed Brown PetscValidType(B, 1); 20406ba663aaSJed Brown PetscValidLogicalCollectiveInt(B, bs, 2); 2041cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocation_C", (Mat, PetscInt, PetscInt, const PetscInt[]), (B, bs, nz, nnz)); 20423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2043a23d5eceSKris Buschelman } 204449b5e25fSSatish Balay 204538f409ebSLisandro Dalcin /*@C 204611a5261eSBarry Smith MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in `MATSEQSBAIJ` format using the given nonzero structure and (optional) numerical values 204738f409ebSLisandro Dalcin 204838f409ebSLisandro Dalcin Input Parameters: 20491c4f3114SJed Brown + B - the matrix 2050eab78319SHong Zhang . bs - size of block, the blocks are ALWAYS square. 205138f409ebSLisandro Dalcin . i - the indices into j for the start of each local row (starts with zero) 205238f409ebSLisandro Dalcin . j - the column indices for each local row (starts with zero) these must be sorted for each row 205338f409ebSLisandro Dalcin - v - optional values in the matrix 205438f409ebSLisandro Dalcin 2055664954b6SBarry Smith Level: advanced 205638f409ebSLisandro Dalcin 205738f409ebSLisandro Dalcin Notes: 205811a5261eSBarry Smith The order of the entries in values is specified by the `MatOption` `MAT_ROW_ORIENTED`. For example, C programs 205911a5261eSBarry Smith may want to use the default `MAT_ROW_ORIENTED` = `PETSC_TRUE` and use an array v[nnz][bs][bs] where the second index is 206038f409ebSLisandro Dalcin over rows within a block and the last index is over columns within a block row. Fortran programs will likely set 206111a5261eSBarry Smith `MAT_ROW_ORIENTED` = `PETSC_FALSE` and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a 206238f409ebSLisandro Dalcin block column and the second index is over columns within a block. 206338f409ebSLisandro Dalcin 206450c5228eSBarry Smith Any entries below the diagonal are ignored 20650cd7f59aSBarry Smith 20660cd7f59aSBarry Smith Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries 20670cd7f59aSBarry Smith and usually the numerical values as well 2068664954b6SBarry Smith 206911a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqSBAIJ()`, `MatSetValuesBlocked()`, `MatSeqSBAIJSetPreallocation()`, `MATSEQSBAIJ` 207038f409ebSLisandro Dalcin @*/ 2071d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B, PetscInt bs, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 2072d71ae5a4SJacob Faibussowitsch { 207338f409ebSLisandro Dalcin PetscFunctionBegin; 207438f409ebSLisandro Dalcin PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 207538f409ebSLisandro Dalcin PetscValidType(B, 1); 207638f409ebSLisandro Dalcin PetscValidLogicalCollectiveInt(B, bs, 2); 2077cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocationCSR_C", (Mat, PetscInt, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, bs, i, j, v)); 20783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 207938f409ebSLisandro Dalcin } 208038f409ebSLisandro Dalcin 2081c464158bSHong Zhang /*@C 2082c464158bSHong Zhang MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in block AIJ (block 208311a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 2084c464158bSHong Zhang user should preallocate the matrix storage by setting the parameter nz 2085c464158bSHong Zhang (or the array nnz). By setting these parameters accurately, performance 2086c464158bSHong Zhang during matrix assembly can be increased by more than a factor of 50. 208749b5e25fSSatish Balay 2088d083f849SBarry Smith Collective 2089c464158bSHong Zhang 2090c464158bSHong Zhang Input Parameters: 209111a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 209211a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 2093bb7ae925SBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs() 2094c464158bSHong Zhang . m - number of rows, or number of columns 2095c464158bSHong Zhang . nz - number of block nonzeros per block row (same for all rows) 2096744e8345SSatish Balay - nnz - array containing the number of block nonzeros in the upper triangular plus 20970298fd71SBarry Smith diagonal portion of each block (possibly different for each block row) or NULL 2098c464158bSHong Zhang 2099c464158bSHong Zhang Output Parameter: 2100c464158bSHong Zhang . A - the symmetric matrix 2101c464158bSHong Zhang 2102c464158bSHong Zhang Options Database Keys: 2103a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2104c464158bSHong Zhang block calculations (much slower) 2105a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use 2106c464158bSHong Zhang 2107c464158bSHong Zhang Level: intermediate 2108c464158bSHong Zhang 210911a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 2110f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 211111a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 2112175b88e8SBarry Smith 2113c464158bSHong Zhang Notes: 21146d6d819aSHong Zhang The number of rows and columns must be divisible by blocksize. 21156d6d819aSHong Zhang This matrix type does not support complex Hermitian operation. 2116c464158bSHong Zhang 2117c464158bSHong Zhang Specify the preallocated storage with either nz or nnz (not both). 211811a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 2119651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2120c464158bSHong Zhang 212149a6f317SBarry Smith If the nnz parameter is given then the nz parameter is ignored 212249a6f317SBarry Smith 2123651615e1SBarry Smith .seealso: [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2124c464158bSHong Zhang @*/ 2125d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 2126d71ae5a4SJacob Faibussowitsch { 2127c464158bSHong Zhang PetscFunctionBegin; 21289566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 21299566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 21309566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQSBAIJ)); 21319566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*A, bs, nz, (PetscInt *)nnz)); 21323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 213349b5e25fSSatish Balay } 213449b5e25fSSatish Balay 2135d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 2136d71ae5a4SJacob Faibussowitsch { 213749b5e25fSSatish Balay Mat C; 213849b5e25fSSatish Balay Mat_SeqSBAIJ *c, *a = (Mat_SeqSBAIJ *)A->data; 2139b40805acSSatish Balay PetscInt i, mbs = a->mbs, nz = a->nz, bs2 = a->bs2; 214049b5e25fSSatish Balay 214149b5e25fSSatish Balay PetscFunctionBegin; 2142*31fe6a7dSBarry Smith PetscCheck(A->assembled, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 214308401ef6SPierre Jolivet PetscCheck(a->i[mbs] == nz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Corrupt matrix"); 214449b5e25fSSatish Balay 2145f4259b30SLisandro Dalcin *B = NULL; 21469566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 21479566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->rmap->N, A->cmap->n, A->rmap->N, A->cmap->n)); 21489566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, A)); 21499566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATSEQSBAIJ)); 2150692f9cbeSHong Zhang c = (Mat_SeqSBAIJ *)C->data; 2151692f9cbeSHong Zhang 2152273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2153d5f3da31SBarry Smith C->factortype = A->factortype; 2154f4259b30SLisandro Dalcin c->row = NULL; 2155f4259b30SLisandro Dalcin c->icol = NULL; 2156f4259b30SLisandro Dalcin c->saved_values = NULL; 2157a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 215849b5e25fSSatish Balay C->assembled = PETSC_TRUE; 215949b5e25fSSatish Balay 21609566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 21619566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 216249b5e25fSSatish Balay c->bs2 = a->bs2; 216349b5e25fSSatish Balay c->mbs = a->mbs; 216449b5e25fSSatish Balay c->nbs = a->nbs; 216549b5e25fSSatish Balay 2166c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2167c760cd28SBarry Smith c->imax = a->imax; 2168c760cd28SBarry Smith c->ilen = a->ilen; 2169c760cd28SBarry Smith c->free_imax_ilen = PETSC_FALSE; 2170c760cd28SBarry Smith } else { 21719566063dSJacob Faibussowitsch PetscCall(PetscMalloc2((mbs + 1), &c->imax, (mbs + 1), &c->ilen)); 217249b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 217349b5e25fSSatish Balay c->imax[i] = a->imax[i]; 217449b5e25fSSatish Balay c->ilen[i] = a->ilen[i]; 217549b5e25fSSatish Balay } 2176c760cd28SBarry Smith c->free_imax_ilen = PETSC_TRUE; 2177c760cd28SBarry Smith } 217849b5e25fSSatish Balay 217949b5e25fSSatish Balay /* allocate the matrix space */ 21804da8f245SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 21819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2 * nz, &c->a)); 218244e1c64aSLisandro Dalcin c->i = a->i; 218344e1c64aSLisandro Dalcin c->j = a->j; 21844da8f245SBarry Smith c->singlemalloc = PETSC_FALSE; 218544e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21864da8f245SBarry Smith c->free_ij = PETSC_FALSE; 21874da8f245SBarry Smith c->parent = A; 21889566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)A)); 21899566063dSJacob Faibussowitsch PetscCall(MatSetOption(A, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21909566063dSJacob Faibussowitsch PetscCall(MatSetOption(C, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21914da8f245SBarry Smith } else { 21929566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &c->a, nz, &c->j, mbs + 1, &c->i)); 21939566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, mbs + 1)); 21944da8f245SBarry Smith c->singlemalloc = PETSC_TRUE; 219544e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21964da8f245SBarry Smith c->free_ij = PETSC_TRUE; 21974da8f245SBarry Smith } 219849b5e25fSSatish Balay if (mbs > 0) { 219948a46eb9SPierre Jolivet if (cpvalues != MAT_SHARE_NONZERO_PATTERN) PetscCall(PetscArraycpy(c->j, a->j, nz)); 220049b5e25fSSatish Balay if (cpvalues == MAT_COPY_VALUES) { 22019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, a->a, bs2 * nz)); 220249b5e25fSSatish Balay } else { 22039566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, bs2 * nz)); 220449b5e25fSSatish Balay } 2205a1c3900fSBarry Smith if (a->jshort) { 220644e1c64aSLisandro Dalcin /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */ 220744e1c64aSLisandro Dalcin /* if the parent matrix is reassembled, this child matrix will never notice */ 22089566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &c->jshort)); 22099566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->jshort, a->jshort, nz)); 221026fbe8dcSKarl Rupp 22114da8f245SBarry Smith c->free_jshort = PETSC_TRUE; 22124da8f245SBarry Smith } 2213a1c3900fSBarry Smith } 221449b5e25fSSatish Balay 221549b5e25fSSatish Balay c->roworiented = a->roworiented; 221649b5e25fSSatish Balay c->nonew = a->nonew; 221749b5e25fSSatish Balay 221849b5e25fSSatish Balay if (a->diag) { 2219c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2220c760cd28SBarry Smith c->diag = a->diag; 2221c760cd28SBarry Smith c->free_diag = PETSC_FALSE; 2222c760cd28SBarry Smith } else { 22239566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mbs, &c->diag)); 222426fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) c->diag[i] = a->diag[i]; 2225c760cd28SBarry Smith c->free_diag = PETSC_TRUE; 2226c760cd28SBarry Smith } 222744e1c64aSLisandro Dalcin } 22286c6c5352SBarry Smith c->nz = a->nz; 2229f2cbd3d5SJed Brown c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 2230f4259b30SLisandro Dalcin c->solve_work = NULL; 2231f4259b30SLisandro Dalcin c->mult_work = NULL; 223226fbe8dcSKarl Rupp 223349b5e25fSSatish Balay *B = C; 22349566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 22353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 223649b5e25fSSatish Balay } 223749b5e25fSSatish Balay 2238618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */ 2239618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary 2240618cc2edSLisandro Dalcin 2241d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqSBAIJ(Mat mat, PetscViewer viewer) 2242d71ae5a4SJacob Faibussowitsch { 22437f489da9SVaclav Hapla PetscBool isbinary; 22442f480046SShri Abhyankar 22452f480046SShri Abhyankar PetscFunctionBegin; 22469566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 224728b400f6SJacob Faibussowitsch PetscCheck(isbinary, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)mat)->type_name); 22489566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqSBAIJ_Binary(mat, viewer)); 22493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22502f480046SShri Abhyankar } 22512f480046SShri Abhyankar 2252c75a6043SHong Zhang /*@ 225311a5261eSBarry Smith MatCreateSeqSBAIJWithArrays - Creates an sequential `MATSEQSBAIJ` matrix using matrix elements 2254c75a6043SHong Zhang (upper triangular entries in CSR format) provided by the user. 2255c75a6043SHong Zhang 2256d083f849SBarry Smith Collective 2257c75a6043SHong Zhang 2258c75a6043SHong Zhang Input Parameters: 2259c75a6043SHong Zhang + comm - must be an MPI communicator of size 1 2260c75a6043SHong Zhang . bs - size of block 2261c75a6043SHong Zhang . m - number of rows 2262c75a6043SHong Zhang . n - number of columns 2263483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that row block row of the matrix 2264c75a6043SHong Zhang . j - column indices 2265c75a6043SHong Zhang - a - matrix values 2266c75a6043SHong Zhang 2267c75a6043SHong Zhang Output Parameter: 2268c75a6043SHong Zhang . mat - the matrix 2269c75a6043SHong Zhang 2270dfb205c3SBarry Smith Level: advanced 2271c75a6043SHong Zhang 2272c75a6043SHong Zhang Notes: 2273c75a6043SHong Zhang The i, j, and a arrays are not copied by this routine, the user must free these arrays 2274c75a6043SHong Zhang once the matrix is destroyed 2275c75a6043SHong Zhang 2276c75a6043SHong Zhang You cannot set new nonzero locations into this matrix, that will generate an error. 2277c75a6043SHong Zhang 2278c75a6043SHong Zhang The i and j indices are 0 based 2279c75a6043SHong Zhang 228011a5261eSBarry Smith When block size is greater than 1 the matrix values must be stored using the SBAIJ storage format (see the SBAIJ source code to determine this). For block size of 1 2281dfb205c3SBarry Smith it is the regular CSR format excluding the lower triangular elements. 2282dfb205c3SBarry Smith 228311a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSBAIJ()`, `MatCreateSeqSBAIJ()` 2284c75a6043SHong Zhang @*/ 2285d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 2286d71ae5a4SJacob Faibussowitsch { 2287c75a6043SHong Zhang PetscInt ii; 2288c75a6043SHong Zhang Mat_SeqSBAIJ *sbaij; 2289c75a6043SHong Zhang 2290c75a6043SHong Zhang PetscFunctionBegin; 229108401ef6SPierre Jolivet PetscCheck(bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "block size %" PetscInt_FMT " > 1 is not supported yet", bs); 2292aed4548fSBarry Smith PetscCheck(m == 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 2293c75a6043SHong Zhang 22949566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 22959566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 22969566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQSBAIJ)); 22979566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*mat, bs, MAT_SKIP_ALLOCATION, NULL)); 2298c75a6043SHong Zhang sbaij = (Mat_SeqSBAIJ *)(*mat)->data; 22999566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(m, &sbaij->imax, m, &sbaij->ilen)); 2300c75a6043SHong Zhang 2301c75a6043SHong Zhang sbaij->i = i; 2302c75a6043SHong Zhang sbaij->j = j; 2303c75a6043SHong Zhang sbaij->a = a; 230426fbe8dcSKarl Rupp 2305c75a6043SHong Zhang sbaij->singlemalloc = PETSC_FALSE; 2306c75a6043SHong Zhang sbaij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 2307e6b907acSBarry Smith sbaij->free_a = PETSC_FALSE; 2308e6b907acSBarry Smith sbaij->free_ij = PETSC_FALSE; 2309ddf7884eSMatthew Knepley sbaij->free_imax_ilen = PETSC_TRUE; 2310c75a6043SHong Zhang 2311c75a6043SHong Zhang for (ii = 0; ii < m; ii++) { 2312c75a6043SHong Zhang sbaij->ilen[ii] = sbaij->imax[ii] = i[ii + 1] - i[ii]; 23136bdcaf15SBarry Smith PetscCheck(i[ii + 1] >= i[ii], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 2314c75a6043SHong Zhang } 231576bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 2316c75a6043SHong Zhang for (ii = 0; ii < sbaij->i[m]; ii++) { 23176bdcaf15SBarry Smith PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 23186bdcaf15SBarry Smith PetscCheck(j[ii] < n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index too large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 2319c75a6043SHong Zhang } 232076bd3646SJed Brown } 2321c75a6043SHong Zhang 23229566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 23239566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 23243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2325c75a6043SHong Zhang } 2326d06b337dSHong Zhang 2327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 2328d71ae5a4SJacob Faibussowitsch { 232959f5e6ceSHong Zhang PetscFunctionBegin; 23309566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm, inmat, n, scall, outmat)); 23313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 233259f5e6ceSHong Zhang } 2333