149b5e25fSSatish Balay 249b5e25fSSatish Balay /* 3a1373b80SHong Zhang Defines the basic matrix operations for the SBAIJ (compressed row) 449b5e25fSSatish Balay matrix storage format. 549b5e25fSSatish Balay */ 6c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 8c6db04a5SJed Brown #include <petscblaslapack.h> 949b5e25fSSatish Balay 10c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1170dcbbb9SBarry Smith #define USESHORT 12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1370dcbbb9SBarry Smith 1426cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1526cec326SBarry Smith #define TYPE SBAIJ 1626cec326SBarry Smith #define TYPE_SBAIJ 1726cec326SBarry Smith #define TYPE_BS 1826cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1926cec326SBarry Smith #undef TYPE_BS 2026cec326SBarry Smith #define TYPE_BS _BS 2126cec326SBarry Smith #define TYPE_BS_ON 2226cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 2326cec326SBarry Smith #undef TYPE_BS 2426cec326SBarry Smith #undef TYPE_SBAIJ 2526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 2626cec326SBarry Smith #undef TYPE 2726cec326SBarry Smith #undef TYPE_BS_ON 2826cec326SBarry Smith 296214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 30cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 316214f412SHong Zhang #endif 32d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 33d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 34d24d4204SJose E. Roman #endif 3528d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat, MatType, MatReuse, Mat *); 36b5b17502SBarry Smith 3749b5e25fSSatish Balay /* 3849b5e25fSSatish Balay Checks for missing diagonals 3949b5e25fSSatish Balay */ 40d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A, PetscBool *missing, PetscInt *dd) 41d71ae5a4SJacob Faibussowitsch { 42045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 437734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 4449b5e25fSSatish Balay 4549b5e25fSSatish Balay PetscFunctionBegin; 469566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(A)); 472af78befSBarry Smith *missing = PETSC_FALSE; 487734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 49358d2f5dSShri Abhyankar *missing = PETSC_TRUE; 50358d2f5dSShri Abhyankar if (dd) *dd = 0; 519566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 52358d2f5dSShri Abhyankar } else { 53358d2f5dSShri Abhyankar diag = a->diag; 5449b5e25fSSatish Balay for (i = 0; i < a->mbs; i++) { 557734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 562af78befSBarry Smith *missing = PETSC_TRUE; 572af78befSBarry Smith if (dd) *dd = i; 582af78befSBarry Smith break; 592af78befSBarry Smith } 6049b5e25fSSatish Balay } 61358d2f5dSShri Abhyankar } 623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6349b5e25fSSatish Balay } 6449b5e25fSSatish Balay 65d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A) 66d71ae5a4SJacob Faibussowitsch { 67045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 6848dd3d27SHong Zhang PetscInt i, j; 6949b5e25fSSatish Balay 7049b5e25fSSatish Balay PetscFunctionBegin; 7109f38230SBarry Smith if (!a->diag) { 729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->mbs, &a->diag)); 73c760cd28SBarry Smith a->free_diag = PETSC_TRUE; 7409f38230SBarry Smith } 7548dd3d27SHong Zhang for (i = 0; i < a->mbs; i++) { 7648dd3d27SHong Zhang a->diag[i] = a->i[i + 1]; 7748dd3d27SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 7848dd3d27SHong Zhang if (a->j[j] == i) { 7948dd3d27SHong Zhang a->diag[i] = j; 8048dd3d27SHong Zhang break; 8148dd3d27SHong Zhang } 8248dd3d27SHong Zhang } 8348dd3d27SHong Zhang } 843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8549b5e25fSSatish Balay } 8649b5e25fSSatish Balay 87d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *inia[], const PetscInt *inja[], PetscBool *done) 88d71ae5a4SJacob Faibussowitsch { 89a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 902462f5fdSStefano Zampini PetscInt i, j, n = a->mbs, nz = a->i[n], *tia, *tja, bs = A->rmap->bs, k, l, cnt; 912462f5fdSStefano Zampini PetscInt **ia = (PetscInt **)inia, **ja = (PetscInt **)inja; 9249b5e25fSSatish Balay 9349b5e25fSSatish Balay PetscFunctionBegin; 94d3e5a4abSHong Zhang *nn = n; 953ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 962462f5fdSStefano Zampini if (symmetric) { 979566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(n, a->i, a->j, PETSC_FALSE, 0, 0, &tia, &tja)); 982462f5fdSStefano Zampini nz = tia[n]; 992462f5fdSStefano Zampini } else { 1009371c9d4SSatish Balay tia = a->i; 1019371c9d4SSatish Balay tja = a->j; 1022462f5fdSStefano Zampini } 1032462f5fdSStefano Zampini 1042462f5fdSStefano Zampini if (!blockcompressed && bs > 1) { 1052462f5fdSStefano Zampini (*nn) *= bs; 1068f7157efSSatish Balay /* malloc & create the natural set of indices */ 1079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1((n + 1) * bs, ia)); 1082462f5fdSStefano Zampini if (n) { 1092462f5fdSStefano Zampini (*ia)[0] = oshift; 110ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[j] = (tia[1] - tia[0]) * bs + (*ia)[j - 1]; 1112462f5fdSStefano Zampini } 1122462f5fdSStefano Zampini 1132462f5fdSStefano Zampini for (i = 1; i < n; i++) { 1142462f5fdSStefano Zampini (*ia)[i * bs] = (tia[i] - tia[i - 1]) * bs + (*ia)[i * bs - 1]; 115ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[i * bs + j] = (tia[i + 1] - tia[i]) * bs + (*ia)[i * bs + j - 1]; 1162462f5fdSStefano Zampini } 117ad540459SPierre Jolivet if (n) (*ia)[n * bs] = (tia[n] - tia[n - 1]) * bs + (*ia)[n * bs - 1]; 1182462f5fdSStefano Zampini 1192462f5fdSStefano Zampini if (inja) { 1209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz * bs * bs, ja)); 1212462f5fdSStefano Zampini cnt = 0; 1222462f5fdSStefano Zampini for (i = 0; i < n; i++) { 1238f7157efSSatish Balay for (j = 0; j < bs; j++) { 1242462f5fdSStefano Zampini for (k = tia[i]; k < tia[i + 1]; k++) { 125ad540459SPierre Jolivet for (l = 0; l < bs; l++) (*ja)[cnt++] = bs * tja[k] + l; 1268f7157efSSatish Balay } 1278f7157efSSatish Balay } 1288f7157efSSatish Balay } 1298f7157efSSatish Balay } 1302462f5fdSStefano Zampini 1312462f5fdSStefano Zampini if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */ 1329566063dSJacob Faibussowitsch PetscCall(PetscFree(tia)); 1339566063dSJacob Faibussowitsch PetscCall(PetscFree(tja)); 1342462f5fdSStefano Zampini } 1352462f5fdSStefano Zampini } else if (oshift == 1) { 1362462f5fdSStefano Zampini if (symmetric) { 1372462f5fdSStefano Zampini nz = tia[A->rmap->n / bs]; 1382462f5fdSStefano Zampini /* add 1 to i and j indices */ 1392462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) tia[i] = tia[i] + 1; 1402462f5fdSStefano Zampini *ia = tia; 1412462f5fdSStefano Zampini if (ja) { 1422462f5fdSStefano Zampini for (i = 0; i < nz; i++) tja[i] = tja[i] + 1; 1432462f5fdSStefano Zampini *ja = tja; 1442462f5fdSStefano Zampini } 1452462f5fdSStefano Zampini } else { 1462462f5fdSStefano Zampini nz = a->i[A->rmap->n / bs]; 1472462f5fdSStefano Zampini /* malloc space and add 1 to i and j indices */ 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n / bs + 1, ia)); 1492462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) (*ia)[i] = a->i[i] + 1; 1502462f5fdSStefano Zampini if (ja) { 1519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, ja)); 1522462f5fdSStefano Zampini for (i = 0; i < nz; i++) (*ja)[i] = a->j[i] + 1; 1532462f5fdSStefano Zampini } 1542462f5fdSStefano Zampini } 1552462f5fdSStefano Zampini } else { 1562462f5fdSStefano Zampini *ia = tia; 1572462f5fdSStefano Zampini if (ja) *ja = tja; 158a6ece127SHong Zhang } 1593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16049b5e25fSSatish Balay } 16149b5e25fSSatish Balay 162d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 163d71ae5a4SJacob Faibussowitsch { 16449b5e25fSSatish Balay PetscFunctionBegin; 1653ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 1662462f5fdSStefano Zampini if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) { 1679566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 1689566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 169a6ece127SHong Zhang } 1703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17149b5e25fSSatish Balay } 17249b5e25fSSatish Balay 173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqSBAIJ(Mat A) 174d71ae5a4SJacob Faibussowitsch { 17549b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 17649b5e25fSSatish Balay 17749b5e25fSSatish Balay PetscFunctionBegin; 178a9f03627SSatish Balay #if defined(PETSC_USE_LOG) 1793ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->N, a->nz)); 180a9f03627SSatish Balay #endif 1819566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 1829566063dSJacob Faibussowitsch if (a->free_diag) PetscCall(PetscFree(a->diag)); 1839566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1849566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1859566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 1869566063dSJacob Faibussowitsch PetscCall(PetscFree(a->idiag)); 1879566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inode.size)); 1889566063dSJacob Faibussowitsch if (a->free_imax_ilen) PetscCall(PetscFree2(a->imax, a->ilen)); 1899566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 1909566063dSJacob Faibussowitsch PetscCall(PetscFree(a->sor_work)); 1919566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solves_work)); 1929566063dSJacob Faibussowitsch PetscCall(PetscFree(a->mult_work)); 1939566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 1949566063dSJacob Faibussowitsch if (a->free_jshort) PetscCall(PetscFree(a->jshort)); 1959566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inew)); 1969566063dSJacob Faibussowitsch PetscCall(MatDestroy(&a->parent)); 1979566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 198901853e0SKris Buschelman 1999566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 2002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJGetArray_C", NULL)); 2012e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJRestoreArray_C", NULL)); 2029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 2039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 2049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetColumnIndices_C", NULL)); 2059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqaij_C", NULL)); 2069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqbaij_C", NULL)); 2079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocation_C", NULL)); 2089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocationCSR_C", NULL)); 2096214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_elemental_C", NULL)); 2116214f412SHong Zhang #endif 212d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 2139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_scalapack_C", NULL)); 214d24d4204SJose E. Roman #endif 2152e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 2163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 21749b5e25fSSatish Balay } 21849b5e25fSSatish Balay 219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqSBAIJ(Mat A, MatOption op, PetscBool flg) 220d71ae5a4SJacob Faibussowitsch { 221045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 222eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 223eb1ec7c1SStefano Zampini PetscInt bs; 224eb1ec7c1SStefano Zampini #endif 22549b5e25fSSatish Balay 22649b5e25fSSatish Balay PetscFunctionBegin; 227eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 2289566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 229eb1ec7c1SStefano Zampini #endif 2304d9d31abSKris Buschelman switch (op) { 231d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 232d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 233d71ae5a4SJacob Faibussowitsch break; 234d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 235d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 236d71ae5a4SJacob Faibussowitsch break; 237d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 238d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 239d71ae5a4SJacob Faibussowitsch break; 240d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 241d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 242d71ae5a4SJacob Faibussowitsch break; 243d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 244d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 245d71ae5a4SJacob Faibussowitsch break; 246d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 247d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 248d71ae5a4SJacob Faibussowitsch break; 2498c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 2504d9d31abSKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 2514d9d31abSKris Buschelman case MAT_USE_HASH_TABLE: 252d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 253d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 254d71ae5a4SJacob Faibussowitsch break; 2559a4540c5SBarry Smith case MAT_HERMITIAN: 256eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 257eb1ec7c1SStefano Zampini if (flg) { /* disable transpose ops */ 25808401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for Hermitian with block size greater than 1"); 259eb1ec7c1SStefano Zampini A->ops->multtranspose = NULL; 260eb1ec7c1SStefano Zampini A->ops->multtransposeadd = NULL; 261b94d7dedSBarry Smith A->symmetric = PETSC_BOOL3_FALSE; 262eb1ec7c1SStefano Zampini } 2630f2140c7SStefano Zampini #endif 264eeffb40dSHong Zhang break; 26577e54ba9SKris Buschelman case MAT_SYMMETRIC: 266eb1ec7c1SStefano Zampini case MAT_SPD: 267eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 268eb1ec7c1SStefano Zampini if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */ 269eb1ec7c1SStefano Zampini A->ops->multtranspose = A->ops->mult; 270eb1ec7c1SStefano Zampini A->ops->multtransposeadd = A->ops->multadd; 271eb1ec7c1SStefano Zampini } 272eb1ec7c1SStefano Zampini #endif 273eb1ec7c1SStefano Zampini break; 274eb1ec7c1SStefano Zampini /* These options are handled directly by MatSetOption() */ 27577e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 2769a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 277b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 278672ba085SHong Zhang case MAT_STRUCTURE_ONLY: 279b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 2804dcd73b1SHong Zhang /* These options are handled directly by MatSetOption() */ 281290bbb0aSBarry Smith break; 282d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_LOWER_TRIANGULAR: 283d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 284d71ae5a4SJacob Faibussowitsch break; 285d71ae5a4SJacob Faibussowitsch case MAT_ERROR_LOWER_TRIANGULAR: 286d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 287d71ae5a4SJacob Faibussowitsch break; 288d71ae5a4SJacob Faibussowitsch case MAT_GETROW_UPPERTRIANGULAR: 289d71ae5a4SJacob Faibussowitsch a->getrow_utriangular = flg; 290d71ae5a4SJacob Faibussowitsch break; 291d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 292d71ae5a4SJacob Faibussowitsch break; 293d71ae5a4SJacob Faibussowitsch default: 294d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 29549b5e25fSSatish Balay } 2963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29749b5e25fSSatish Balay } 29849b5e25fSSatish Balay 299d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 300d71ae5a4SJacob Faibussowitsch { 30149b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 30249b5e25fSSatish Balay 30349b5e25fSSatish Balay PetscFunctionBegin; 30408401ef6SPierre Jolivet PetscCheck(!A || a->getrow_utriangular, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatGetRow is not supported for SBAIJ matrix format. Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()"); 30552768537SHong Zhang 306f5edf698SHong Zhang /* Get the upper triangular part of the row */ 3079566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqBAIJ_private(A, row, nz, idx, v, a->i, a->j, a->a)); 3083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 30949b5e25fSSatish Balay } 31049b5e25fSSatish Balay 311d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 312d71ae5a4SJacob Faibussowitsch { 31349b5e25fSSatish Balay PetscFunctionBegin; 314cb4a9cd9SHong Zhang if (nz) *nz = 0; 3159566063dSJacob Faibussowitsch if (idx) PetscCall(PetscFree(*idx)); 3169566063dSJacob Faibussowitsch if (v) PetscCall(PetscFree(*v)); 3173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 31849b5e25fSSatish Balay } 31949b5e25fSSatish Balay 320d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A) 321d71ae5a4SJacob Faibussowitsch { 322f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 323f5edf698SHong Zhang 324f5edf698SHong Zhang PetscFunctionBegin; 325f5edf698SHong Zhang a->getrow_utriangular = PETSC_TRUE; 3263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 327f5edf698SHong Zhang } 328a323099bSStefano Zampini 329d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A) 330d71ae5a4SJacob Faibussowitsch { 331f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 332f5edf698SHong Zhang 333f5edf698SHong Zhang PetscFunctionBegin; 334f5edf698SHong Zhang a->getrow_utriangular = PETSC_FALSE; 3353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 336f5edf698SHong Zhang } 337f5edf698SHong Zhang 338d71ae5a4SJacob Faibussowitsch PetscErrorCode MatTranspose_SeqSBAIJ(Mat A, MatReuse reuse, Mat *B) 339d71ae5a4SJacob Faibussowitsch { 34049b5e25fSSatish Balay PetscFunctionBegin; 3417fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 342cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 3439566063dSJacob Faibussowitsch PetscCall(MatDuplicate(A, MAT_COPY_VALUES, B)); 344cf37664fSBarry Smith } else if (reuse == MAT_REUSE_MATRIX) { 3459566063dSJacob Faibussowitsch PetscCall(MatCopy(A, *B, SAME_NONZERO_PATTERN)); 346fc4dec0aSBarry Smith } 3473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 34849b5e25fSSatish Balay } 34949b5e25fSSatish Balay 350d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A, PetscViewer viewer) 351d71ae5a4SJacob Faibussowitsch { 35249b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 353d0f46423SBarry Smith PetscInt i, j, bs = A->rmap->bs, k, l, bs2 = a->bs2; 354f3ef73ceSBarry Smith PetscViewerFormat format; 355121deb67SSatish Balay PetscInt *diag; 356b3a0534dSBarry Smith const char *matname; 35749b5e25fSSatish Balay 35849b5e25fSSatish Balay PetscFunctionBegin; 3599566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 360456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 3619566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " block size is %" PetscInt_FMT "\n", bs)); 362fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_MATLAB) { 363d2507d54SMatthew Knepley Mat aij; 364ade3a672SBarry Smith 365d5f3da31SBarry Smith if (A->factortype && bs > 1) { 3669566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "Warning: matrix is factored with bs>1. MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n")); 3673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 36870d5e725SHong Zhang } 3699566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &aij)); 37023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 37123a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)aij, matname)); 37223a3927dSBarry Smith PetscCall(MatView_SeqAIJ(aij, viewer)); 3739566063dSJacob Faibussowitsch PetscCall(MatDestroy(&aij)); 374fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 375b3a0534dSBarry Smith Mat B; 376b3a0534dSBarry Smith 377b3a0534dSBarry Smith PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 378b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 379b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 380b3a0534dSBarry Smith PetscCall(MatView_SeqAIJ(B, viewer)); 381b3a0534dSBarry Smith PetscCall(MatDestroy(&B)); 382c1490034SHong Zhang } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) { 3833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 38449b5e25fSSatish Balay } else { 3859566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 3862c990fa1SHong Zhang if (A->factortype) { /* for factored matrix */ 38708401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "matrix is factored with bs>1. Not implemented yet"); 3882c990fa1SHong Zhang 389121deb67SSatish Balay diag = a->diag; 390121deb67SSatish Balay for (i = 0; i < a->mbs; i++) { /* for row block i */ 3919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 3922c990fa1SHong Zhang /* diagonal entry */ 3932c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 3942c990fa1SHong Zhang if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) { 3959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), (double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 3962c990fa1SHong Zhang } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) { 3979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), -(double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 3982c990fa1SHong Zhang } else { 3999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]))); 4002c990fa1SHong Zhang } 4012c990fa1SHong Zhang #else 4029566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)(1.0 / a->a[diag[i]]))); 4032c990fa1SHong Zhang #endif 4042c990fa1SHong Zhang /* off-diagonal entries */ 4052c990fa1SHong Zhang for (k = a->i[i]; k < a->i[i + 1] - 1; k++) { 4062c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 407ca0704adSBarry Smith if (PetscImaginaryPart(a->a[k]) > 0.0) { 4089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), (double)PetscImaginaryPart(a->a[k]))); 409ca0704adSBarry Smith } else if (PetscImaginaryPart(a->a[k]) < 0.0) { 4109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), -(double)PetscImaginaryPart(a->a[k]))); 4112c990fa1SHong Zhang } else { 4129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k], (double)PetscRealPart(a->a[k]))); 4132c990fa1SHong Zhang } 4142c990fa1SHong Zhang #else 4159566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[k], (double)a->a[k])); 4162c990fa1SHong Zhang #endif 4172c990fa1SHong Zhang } 4189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 4192c990fa1SHong Zhang } 4202c990fa1SHong Zhang 4212c990fa1SHong Zhang } else { /* for non-factored matrix */ 4220c74a584SJed Brown for (i = 0; i < a->mbs; i++) { /* for row block i */ 4230c74a584SJed Brown for (j = 0; j < bs; j++) { /* for row bs*i + j */ 4249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i * bs + j)); 4250c74a584SJed Brown for (k = a->i[i]; k < a->i[i + 1]; k++) { /* for column block */ 4260c74a584SJed Brown for (l = 0; l < bs; l++) { /* for column */ 42749b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 42849b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) > 0.0) { 4299371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), (double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 43049b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) < 0.0) { 4319371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), -(double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 43249b5e25fSSatish Balay } else { 4339566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]))); 43449b5e25fSSatish Balay } 43549b5e25fSSatish Balay #else 4369566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)a->a[bs2 * k + l * bs + j])); 43749b5e25fSSatish Balay #endif 43849b5e25fSSatish Balay } 43949b5e25fSSatish Balay } 4409566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 44149b5e25fSSatish Balay } 44249b5e25fSSatish Balay } 4432c990fa1SHong Zhang } 4449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 44549b5e25fSSatish Balay } 4469566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 4473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 44849b5e25fSSatish Balay } 44949b5e25fSSatish Balay 4509804daf3SBarry Smith #include <petscdraw.h> 451d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 452d71ae5a4SJacob Faibussowitsch { 45349b5e25fSSatish Balay Mat A = (Mat)Aa; 45449b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 455d0f46423SBarry Smith PetscInt row, i, j, k, l, mbs = a->mbs, color, bs = A->rmap->bs, bs2 = a->bs2; 45649b5e25fSSatish Balay PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 45749b5e25fSSatish Balay MatScalar *aa; 458b0a32e0cSBarry Smith PetscViewer viewer; 45949b5e25fSSatish Balay 46049b5e25fSSatish Balay PetscFunctionBegin; 4619566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 4629566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 46349b5e25fSSatish Balay 46449b5e25fSSatish Balay /* loop over matrix elements drawing boxes */ 465383922c3SLisandro Dalcin 466d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 4679566063dSJacob Faibussowitsch PetscCall(PetscDrawString(draw, .3 * (xl + xr), .3 * (yl + yr), PETSC_DRAW_BLACK, "symmetric")); 468383922c3SLisandro Dalcin /* Blue for negative, Cyan for zero and Red for positive */ 469b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 47049b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 47149b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4729371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4739371c9d4SSatish Balay y_r = y_l + 1.0; 4749371c9d4SSatish Balay x_l = a->j[j] * bs; 4759371c9d4SSatish Balay x_r = x_l + 1.0; 47649b5e25fSSatish Balay aa = a->a + j * bs2; 47749b5e25fSSatish Balay for (k = 0; k < bs; k++) { 47849b5e25fSSatish Balay for (l = 0; l < bs; l++) { 47949b5e25fSSatish Balay if (PetscRealPart(*aa++) >= 0.) continue; 4809566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 48149b5e25fSSatish Balay } 48249b5e25fSSatish Balay } 48349b5e25fSSatish Balay } 48449b5e25fSSatish Balay } 485b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 48649b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 48749b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4889371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4899371c9d4SSatish Balay y_r = y_l + 1.0; 4909371c9d4SSatish Balay x_l = a->j[j] * bs; 4919371c9d4SSatish Balay x_r = x_l + 1.0; 49249b5e25fSSatish Balay aa = a->a + j * bs2; 49349b5e25fSSatish Balay for (k = 0; k < bs; k++) { 49449b5e25fSSatish Balay for (l = 0; l < bs; l++) { 49549b5e25fSSatish Balay if (PetscRealPart(*aa++) != 0.) continue; 4969566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 49749b5e25fSSatish Balay } 49849b5e25fSSatish Balay } 49949b5e25fSSatish Balay } 50049b5e25fSSatish Balay } 501b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 50249b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 50349b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 5049371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 5059371c9d4SSatish Balay y_r = y_l + 1.0; 5069371c9d4SSatish Balay x_l = a->j[j] * bs; 5079371c9d4SSatish Balay x_r = x_l + 1.0; 50849b5e25fSSatish Balay aa = a->a + j * bs2; 50949b5e25fSSatish Balay for (k = 0; k < bs; k++) { 51049b5e25fSSatish Balay for (l = 0; l < bs; l++) { 51149b5e25fSSatish Balay if (PetscRealPart(*aa++) <= 0.) continue; 5129566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 51349b5e25fSSatish Balay } 51449b5e25fSSatish Balay } 51549b5e25fSSatish Balay } 51649b5e25fSSatish Balay } 517d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 5183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 51949b5e25fSSatish Balay } 52049b5e25fSSatish Balay 521d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A, PetscViewer viewer) 522d71ae5a4SJacob Faibussowitsch { 52349b5e25fSSatish Balay PetscReal xl, yl, xr, yr, w, h; 524b0a32e0cSBarry Smith PetscDraw draw; 525ace3abfcSBarry Smith PetscBool isnull; 52649b5e25fSSatish Balay 52749b5e25fSSatish Balay PetscFunctionBegin; 5289566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 5299566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 5303ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 53149b5e25fSSatish Balay 5329371c9d4SSatish Balay xr = A->rmap->N; 5339371c9d4SSatish Balay yr = A->rmap->N; 5349371c9d4SSatish Balay h = yr / 10.0; 5359371c9d4SSatish Balay w = xr / 10.0; 5369371c9d4SSatish Balay xr += w; 5379371c9d4SSatish Balay yr += h; 5389371c9d4SSatish Balay xl = -w; 5399371c9d4SSatish Balay yl = -h; 5409566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 5419566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 5429566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqSBAIJ_Draw_Zoom, A)); 5439566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 5449566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 5453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 54649b5e25fSSatish Balay } 54749b5e25fSSatish Balay 548618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */ 549618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary 550618cc2edSLisandro Dalcin 551d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ(Mat A, PetscViewer viewer) 552d71ae5a4SJacob Faibussowitsch { 553618cc2edSLisandro Dalcin PetscBool iascii, isbinary, isdraw; 55449b5e25fSSatish Balay 55549b5e25fSSatish Balay PetscFunctionBegin; 5569566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 5579566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 5589566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 55932077d6dSBarry Smith if (iascii) { 5609566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_ASCII(A, viewer)); 561618cc2edSLisandro Dalcin } else if (isbinary) { 5629566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Binary(A, viewer)); 56349b5e25fSSatish Balay } else if (isdraw) { 5649566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Draw(A, viewer)); 56549b5e25fSSatish Balay } else { 566a5e6ed63SBarry Smith Mat B; 567ade3a672SBarry Smith const char *matname; 5689566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 56923a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 57023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 5719566063dSJacob Faibussowitsch PetscCall(MatView(B, viewer)); 5729566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 57349b5e25fSSatish Balay } 5743ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 57549b5e25fSSatish Balay } 57649b5e25fSSatish Balay 577d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 578d71ae5a4SJacob Faibussowitsch { 579045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 58013f74950SBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 58113f74950SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 582d0f46423SBarry Smith PetscInt brow, bcol, ridx, cidx, bs = A->rmap->bs, bs2 = a->bs2; 58397e567efSBarry Smith MatScalar *ap, *aa = a->a; 58449b5e25fSSatish Balay 58549b5e25fSSatish Balay PetscFunctionBegin; 58649b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over rows */ 5879371c9d4SSatish Balay row = im[k]; 5889371c9d4SSatish Balay brow = row / bs; 5899371c9d4SSatish Balay if (row < 0) { 5909371c9d4SSatish Balay v += n; 5919371c9d4SSatish Balay continue; 5929371c9d4SSatish Balay } /* negative row */ 59354c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 5949371c9d4SSatish Balay rp = aj + ai[brow]; 5959371c9d4SSatish Balay ap = aa + bs2 * ai[brow]; 59649b5e25fSSatish Balay nrow = ailen[brow]; 59749b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over columns */ 5989371c9d4SSatish Balay if (in[l] < 0) { 5999371c9d4SSatish Balay v++; 6009371c9d4SSatish Balay continue; 6019371c9d4SSatish Balay } /* negative column */ 60254c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 60349b5e25fSSatish Balay col = in[l]; 60449b5e25fSSatish Balay bcol = col / bs; 60549b5e25fSSatish Balay cidx = col % bs; 60649b5e25fSSatish Balay ridx = row % bs; 60749b5e25fSSatish Balay high = nrow; 60849b5e25fSSatish Balay low = 0; /* assume unsorted */ 60949b5e25fSSatish Balay while (high - low > 5) { 61049b5e25fSSatish Balay t = (low + high) / 2; 61149b5e25fSSatish Balay if (rp[t] > bcol) high = t; 61249b5e25fSSatish Balay else low = t; 61349b5e25fSSatish Balay } 61449b5e25fSSatish Balay for (i = low; i < high; i++) { 61549b5e25fSSatish Balay if (rp[i] > bcol) break; 61649b5e25fSSatish Balay if (rp[i] == bcol) { 61749b5e25fSSatish Balay *v++ = ap[bs2 * i + bs * cidx + ridx]; 61849b5e25fSSatish Balay goto finished; 61949b5e25fSSatish Balay } 62049b5e25fSSatish Balay } 62197e567efSBarry Smith *v++ = 0.0; 62249b5e25fSSatish Balay finished:; 62349b5e25fSSatish Balay } 62449b5e25fSSatish Balay } 6253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 62649b5e25fSSatish Balay } 62749b5e25fSSatish Balay 628d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqSBAIJ(Mat A, IS rowp, IS colp, Mat *B) 629d71ae5a4SJacob Faibussowitsch { 630dc29a518SPierre Jolivet Mat C; 631dc29a518SPierre Jolivet 632dc29a518SPierre Jolivet PetscFunctionBegin; 6339566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQBAIJ, MAT_INITIAL_MATRIX, &C)); 6349566063dSJacob Faibussowitsch PetscCall(MatPermute(C, rowp, colp, B)); 6359566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 63648a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatConvert(*B, MATSEQSBAIJ, MAT_INPLACE_MATRIX, B)); 6373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 638dc29a518SPierre Jolivet } 63949b5e25fSSatish Balay 640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 641d71ae5a4SJacob Faibussowitsch { 6420880e062SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 643e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, jj, row, nrow, i, col, l, rmax, N, lastcol = -1; 64413f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 645d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs2 = a->bs2, bs = A->rmap->bs, stepval; 646ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 647dd6ea824SBarry Smith const PetscScalar *value = v; 648f15d580aSBarry Smith MatScalar *ap, *aa = a->a, *bap; 6490880e062SHong Zhang 65049b5e25fSSatish Balay PetscFunctionBegin; 65126fbe8dcSKarl Rupp if (roworiented) stepval = (n - 1) * bs; 65226fbe8dcSKarl Rupp else stepval = (m - 1) * bs; 65326fbe8dcSKarl Rupp 6540880e062SHong Zhang for (k = 0; k < m; k++) { /* loop over added rows */ 6550880e062SHong Zhang row = im[k]; 6560880e062SHong Zhang if (row < 0) continue; 6576bdcaf15SBarry Smith PetscCheck(row < a->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index row too large %" PetscInt_FMT " max %" PetscInt_FMT, row, a->mbs - 1); 6580880e062SHong Zhang rp = aj + ai[row]; 6590880e062SHong Zhang ap = aa + bs2 * ai[row]; 6600880e062SHong Zhang rmax = imax[row]; 6610880e062SHong Zhang nrow = ailen[row]; 6620880e062SHong Zhang low = 0; 663818f2c47SBarry Smith high = nrow; 6640880e062SHong Zhang for (l = 0; l < n; l++) { /* loop over added columns */ 6650880e062SHong Zhang if (in[l] < 0) continue; 6660880e062SHong Zhang col = in[l]; 6676bdcaf15SBarry Smith PetscCheck(col < a->nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index column too large %" PetscInt_FMT " max %" PetscInt_FMT, col, a->nbs - 1); 668b98bf0e1SJed Brown if (col < row) { 66926fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular block */ 67026fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 671b98bf0e1SJed Brown } 67226fbe8dcSKarl Rupp if (roworiented) value = v + k * (stepval + bs) * bs + l * bs; 67326fbe8dcSKarl Rupp else value = v + l * (stepval + bs) * bs + k * bs; 67426fbe8dcSKarl Rupp 67526fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 67626fbe8dcSKarl Rupp else high = nrow; 67726fbe8dcSKarl Rupp 678e2ee6c50SBarry Smith lastcol = col; 6790880e062SHong Zhang while (high - low > 7) { 6800880e062SHong Zhang t = (low + high) / 2; 6810880e062SHong Zhang if (rp[t] > col) high = t; 6820880e062SHong Zhang else low = t; 6830880e062SHong Zhang } 6840880e062SHong Zhang for (i = low; i < high; i++) { 6850880e062SHong Zhang if (rp[i] > col) break; 6860880e062SHong Zhang if (rp[i] == col) { 6870880e062SHong Zhang bap = ap + bs2 * i; 6880880e062SHong Zhang if (roworiented) { 6890880e062SHong Zhang if (is == ADD_VALUES) { 6900880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 691ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] += *value++; 6920880e062SHong Zhang } 6930880e062SHong Zhang } else { 6940880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 695ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 6960880e062SHong Zhang } 6970880e062SHong Zhang } 6980880e062SHong Zhang } else { 6990880e062SHong Zhang if (is == ADD_VALUES) { 7000880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 701ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ += *value++; 7020880e062SHong Zhang } 7030880e062SHong Zhang } else { 7040880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 705ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7060880e062SHong Zhang } 7070880e062SHong Zhang } 7080880e062SHong Zhang } 7090880e062SHong Zhang goto noinsert2; 7100880e062SHong Zhang } 7110880e062SHong Zhang } 7120880e062SHong Zhang if (nonew == 1) goto noinsert2; 71308401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new block index nonzero block (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 714fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 7159371c9d4SSatish Balay N = nrow++ - 1; 7169371c9d4SSatish Balay high++; 7170880e062SHong Zhang /* shift up all the later entries in this row */ 7189566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 7199566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 7209566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 7210880e062SHong Zhang rp[i] = col; 7220880e062SHong Zhang bap = ap + bs2 * i; 7230880e062SHong Zhang if (roworiented) { 7240880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 725ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7260880e062SHong Zhang } 7270880e062SHong Zhang } else { 7280880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 729ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7300880e062SHong Zhang } 7310880e062SHong Zhang } 7320880e062SHong Zhang noinsert2:; 7330880e062SHong Zhang low = i; 7340880e062SHong Zhang } 7350880e062SHong Zhang ailen[row] = nrow; 7360880e062SHong Zhang } 7373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 73849b5e25fSSatish Balay } 73949b5e25fSSatish Balay 74064831d72SBarry Smith /* 74164831d72SBarry Smith This is not yet used 74264831d72SBarry Smith */ 743d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ_SeqAIJ_Inode(Mat A) 744d71ae5a4SJacob Faibussowitsch { 7450def2e27SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 7460def2e27SBarry Smith const PetscInt *ai = a->i, *aj = a->j, *cols; 7470def2e27SBarry Smith PetscInt i = 0, j, blk_size, m = A->rmap->n, node_count = 0, nzx, nzy, *ns, row, nz, cnt, cnt2, *counts; 748ace3abfcSBarry Smith PetscBool flag; 7490def2e27SBarry Smith 7500def2e27SBarry Smith PetscFunctionBegin; 7519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &ns)); 7520def2e27SBarry Smith while (i < m) { 7530def2e27SBarry Smith nzx = ai[i + 1] - ai[i]; /* Number of nonzeros */ 7540def2e27SBarry Smith /* Limits the number of elements in a node to 'a->inode.limit' */ 7550def2e27SBarry Smith for (j = i + 1, blk_size = 1; j < m && blk_size < a->inode.limit; ++j, ++blk_size) { 7560def2e27SBarry Smith nzy = ai[j + 1] - ai[j]; 7570def2e27SBarry Smith if (nzy != (nzx - j + i)) break; 7589566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aj + ai[i] + j - i, aj + ai[j], nzy, &flag)); 7590def2e27SBarry Smith if (!flag) break; 7600def2e27SBarry Smith } 7610def2e27SBarry Smith ns[node_count++] = blk_size; 76226fbe8dcSKarl Rupp 7630def2e27SBarry Smith i = j; 7640def2e27SBarry Smith } 7650def2e27SBarry Smith if (!a->inode.size && m && node_count > .9 * m) { 7669566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7679566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes out of %" PetscInt_FMT " rows. Not using Inode routines\n", node_count, m)); 7680def2e27SBarry Smith } else { 7690def2e27SBarry Smith a->inode.node_count = node_count; 77026fbe8dcSKarl Rupp 7719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(node_count, &a->inode.size)); 7729566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->inode.size, ns, node_count)); 7739566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7749566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes of %" PetscInt_FMT ". Limit used: %" PetscInt_FMT ". Using Inode routines\n", node_count, m, a->inode.limit)); 7750def2e27SBarry Smith 7760def2e27SBarry Smith /* count collections of adjacent columns in each inode */ 7770def2e27SBarry Smith row = 0; 7780def2e27SBarry Smith cnt = 0; 7790def2e27SBarry Smith for (i = 0; i < node_count; i++) { 7800def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7810def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 7820def2e27SBarry Smith for (j = 1; j < nz; j++) { 78326fbe8dcSKarl Rupp if (cols[j] != cols[j - 1] + 1) cnt++; 7840def2e27SBarry Smith } 7850def2e27SBarry Smith cnt++; 7860def2e27SBarry Smith row += a->inode.size[i]; 7870def2e27SBarry Smith } 7889566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(2 * cnt, &counts)); 7890def2e27SBarry Smith cnt = 0; 7900def2e27SBarry Smith row = 0; 7910def2e27SBarry Smith for (i = 0; i < node_count; i++) { 7920def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7930def2e27SBarry Smith counts[2 * cnt] = cols[0]; 7940def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 7950def2e27SBarry Smith cnt2 = 1; 7960def2e27SBarry Smith for (j = 1; j < nz; j++) { 7970def2e27SBarry Smith if (cols[j] != cols[j - 1] + 1) { 7980def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 7990def2e27SBarry Smith counts[2 * cnt] = cols[j]; 8000def2e27SBarry Smith cnt2 = 1; 8010def2e27SBarry Smith } else cnt2++; 8020def2e27SBarry Smith } 8030def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 8040def2e27SBarry Smith row += a->inode.size[i]; 8050def2e27SBarry Smith } 8069566063dSJacob Faibussowitsch PetscCall(PetscIntView(2 * cnt, counts, NULL)); 8070def2e27SBarry Smith } 8083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 80938702af4SBarry Smith } 81038702af4SBarry Smith 811d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A, MatAssemblyType mode) 812d71ae5a4SJacob Faibussowitsch { 81349b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 8148f8f2f0dSBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 815d0f46423SBarry Smith PetscInt m = A->rmap->N, *ip, N, *ailen = a->ilen; 81613f74950SBarry Smith PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 81749b5e25fSSatish Balay MatScalar *aa = a->a, *ap; 81849b5e25fSSatish Balay 81949b5e25fSSatish Balay PetscFunctionBegin; 8203ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 82149b5e25fSSatish Balay 82249b5e25fSSatish Balay if (m) rmax = ailen[0]; 82349b5e25fSSatish Balay for (i = 1; i < mbs; i++) { 82449b5e25fSSatish Balay /* move each row back by the amount of empty slots (fshift) before it*/ 82549b5e25fSSatish Balay fshift += imax[i - 1] - ailen[i - 1]; 82649b5e25fSSatish Balay rmax = PetscMax(rmax, ailen[i]); 82749b5e25fSSatish Balay if (fshift) { 828580bdb30SBarry Smith ip = aj + ai[i]; 829580bdb30SBarry Smith ap = aa + bs2 * ai[i]; 83049b5e25fSSatish Balay N = ailen[i]; 8319566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 8329566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2 * N)); 83349b5e25fSSatish Balay } 83449b5e25fSSatish Balay ai[i] = ai[i - 1] + ailen[i - 1]; 83549b5e25fSSatish Balay } 83649b5e25fSSatish Balay if (mbs) { 83749b5e25fSSatish Balay fshift += imax[mbs - 1] - ailen[mbs - 1]; 83849b5e25fSSatish Balay ai[mbs] = ai[mbs - 1] + ailen[mbs - 1]; 83949b5e25fSSatish Balay } 84049b5e25fSSatish Balay /* reset ilen and imax for each row */ 841ad540459SPierre Jolivet for (i = 0; i < mbs; i++) ailen[i] = imax[i] = ai[i + 1] - ai[i]; 8426c6c5352SBarry Smith a->nz = ai[mbs]; 84349b5e25fSSatish Balay 844b424e231SHong Zhang /* diagonals may have moved, reset it */ 8451baa6e33SBarry Smith if (a->diag) PetscCall(PetscArraycpy(a->diag, ai, mbs)); 846aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT " block size %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, A->rmap->bs, fshift * bs2); 84726fbe8dcSKarl Rupp 8489566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT ", block size %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->rmap->N, A->rmap->bs, fshift * bs2, a->nz * bs2)); 8499566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues is %" PetscInt_FMT "\n", a->reallocs)); 8509566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Most nonzeros blocks in any row is %" PetscInt_FMT "\n", rmax)); 85126fbe8dcSKarl Rupp 8528e58a170SBarry Smith A->info.mallocs += a->reallocs; 85349b5e25fSSatish Balay a->reallocs = 0; 85449b5e25fSSatish Balay A->info.nz_unneeded = (PetscReal)fshift * bs2; 855061b2667SBarry Smith a->idiagvalid = PETSC_FALSE; 8564dcd73b1SHong Zhang a->rmax = rmax; 85738702af4SBarry Smith 85838702af4SBarry Smith if (A->cmap->n < 65536 && A->cmap->bs == 1) { 85944e1c64aSLisandro Dalcin if (a->jshort && a->free_jshort) { 86017803ae8SHong Zhang /* when matrix data structure is changed, previous jshort must be replaced */ 8619566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jshort)); 86217803ae8SHong Zhang } 8639566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->i[A->rmap->n], &a->jshort)); 86438702af4SBarry Smith for (i = 0; i < a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i]; 86538702af4SBarry Smith A->ops->mult = MatMult_SeqSBAIJ_1_ushort; 86641f059aeSBarry Smith A->ops->sor = MatSOR_SeqSBAIJ_ushort; 8674da8f245SBarry Smith a->free_jshort = PETSC_TRUE; 86838702af4SBarry Smith } 8693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 87049b5e25fSSatish Balay } 87149b5e25fSSatish Balay 87249b5e25fSSatish Balay /* 87349b5e25fSSatish Balay This function returns an array of flags which indicate the locations of contiguous 87449b5e25fSSatish Balay blocks that should be zeroed. for eg: if bs = 3 and is = [0,1,2,3,5,6,7,8,9] 875a5b23f4aSJose E. Roman then the resulting sizes = [3,1,1,3,1] corresponding to sets [(0,1,2),(3),(5),(6,7,8),(9)] 87649b5e25fSSatish Balay Assume: sizes should be long enough to hold all the values. 87749b5e25fSSatish Balay */ 878d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqSBAIJ_Check_Blocks(PetscInt idx[], PetscInt n, PetscInt bs, PetscInt sizes[], PetscInt *bs_max) 879d71ae5a4SJacob Faibussowitsch { 88013f74950SBarry Smith PetscInt i, j, k, row; 881ace3abfcSBarry Smith PetscBool flg; 88249b5e25fSSatish Balay 88349b5e25fSSatish Balay PetscFunctionBegin; 88449b5e25fSSatish Balay for (i = 0, j = 0; i < n; j++) { 88549b5e25fSSatish Balay row = idx[i]; 886a5b23f4aSJose E. Roman if (row % bs != 0) { /* Not the beginning of a block */ 88749b5e25fSSatish Balay sizes[j] = 1; 88849b5e25fSSatish Balay i++; 88949b5e25fSSatish Balay } else if (i + bs > n) { /* Beginning of a block, but complete block doesn't exist (at idx end) */ 89049b5e25fSSatish Balay sizes[j] = 1; /* Also makes sure at least 'bs' values exist for next else */ 89149b5e25fSSatish Balay i++; 8926aad120cSJose E. Roman } else { /* Beginning of the block, so check if the complete block exists */ 89349b5e25fSSatish Balay flg = PETSC_TRUE; 89449b5e25fSSatish Balay for (k = 1; k < bs; k++) { 89549b5e25fSSatish Balay if (row + k != idx[i + k]) { /* break in the block */ 89649b5e25fSSatish Balay flg = PETSC_FALSE; 89749b5e25fSSatish Balay break; 89849b5e25fSSatish Balay } 89949b5e25fSSatish Balay } 900abc0a331SBarry Smith if (flg) { /* No break in the bs */ 90149b5e25fSSatish Balay sizes[j] = bs; 90249b5e25fSSatish Balay i += bs; 90349b5e25fSSatish Balay } else { 90449b5e25fSSatish Balay sizes[j] = 1; 90549b5e25fSSatish Balay i++; 90649b5e25fSSatish Balay } 90749b5e25fSSatish Balay } 90849b5e25fSSatish Balay } 90949b5e25fSSatish Balay *bs_max = j; 9103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 91149b5e25fSSatish Balay } 91249b5e25fSSatish Balay 91349b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks). 914da81f932SPierre Jolivet Any a(i,j) with i>j input by user is ignored. 91549b5e25fSSatish Balay */ 91649b5e25fSSatish Balay 917d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 918d71ae5a4SJacob Faibussowitsch { 91949b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 920e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N, lastcol = -1; 92113f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen, roworiented = a->roworiented; 922d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs = A->rmap->bs, brow, bcol; 92313f74950SBarry Smith PetscInt ridx, cidx, bs2 = a->bs2; 92449b5e25fSSatish Balay MatScalar *ap, value, *aa = a->a, *bap; 92549b5e25fSSatish Balay 92649b5e25fSSatish Balay PetscFunctionBegin; 92749b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over added rows */ 92849b5e25fSSatish Balay row = im[k]; /* row number */ 92949b5e25fSSatish Balay brow = row / bs; /* block row number */ 93049b5e25fSSatish Balay if (row < 0) continue; 9316bdcaf15SBarry Smith PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 93249b5e25fSSatish Balay rp = aj + ai[brow]; /*ptr to beginning of column value of the row block*/ 93349b5e25fSSatish Balay ap = aa + bs2 * ai[brow]; /*ptr to beginning of element value of the row block*/ 93449b5e25fSSatish Balay rmax = imax[brow]; /* maximum space allocated for this row */ 93549b5e25fSSatish Balay nrow = ailen[brow]; /* actual length of this row */ 93649b5e25fSSatish Balay low = 0; 9378509e838SStefano Zampini high = nrow; 93849b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over added columns */ 93949b5e25fSSatish Balay if (in[l] < 0) continue; 9406bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->N - 1); 94149b5e25fSSatish Balay col = in[l]; 94249b5e25fSSatish Balay bcol = col / bs; /* block col number */ 94349b5e25fSSatish Balay 944941593c8SHong Zhang if (brow > bcol) { 94526fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular values */ 94626fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 947941593c8SHong Zhang } 948f4989cb3SHong Zhang 9499371c9d4SSatish Balay ridx = row % bs; 9509371c9d4SSatish Balay cidx = col % bs; /*row and col index inside the block */ 9518549e402SHong Zhang if ((brow == bcol && ridx <= cidx) || (brow < bcol)) { 95249b5e25fSSatish Balay /* element value a(k,l) */ 95326fbe8dcSKarl Rupp if (roworiented) value = v[l + k * n]; 95426fbe8dcSKarl Rupp else value = v[k + l * m]; 95549b5e25fSSatish Balay 95649b5e25fSSatish Balay /* move pointer bap to a(k,l) quickly and add/insert value */ 95726fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 9588509e838SStefano Zampini else high = nrow; 9598509e838SStefano Zampini 960e2ee6c50SBarry Smith lastcol = col; 96149b5e25fSSatish Balay while (high - low > 7) { 96249b5e25fSSatish Balay t = (low + high) / 2; 96349b5e25fSSatish Balay if (rp[t] > bcol) high = t; 96449b5e25fSSatish Balay else low = t; 96549b5e25fSSatish Balay } 96649b5e25fSSatish Balay for (i = low; i < high; i++) { 96749b5e25fSSatish Balay if (rp[i] > bcol) break; 96849b5e25fSSatish Balay if (rp[i] == bcol) { 96949b5e25fSSatish Balay bap = ap + bs2 * i + bs * cidx + ridx; 97049b5e25fSSatish Balay if (is == ADD_VALUES) *bap += value; 97149b5e25fSSatish Balay else *bap = value; 9728549e402SHong Zhang /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 9738549e402SHong Zhang if (brow == bcol && ridx < cidx) { 9748549e402SHong Zhang bap = ap + bs2 * i + bs * ridx + cidx; 9758549e402SHong Zhang if (is == ADD_VALUES) *bap += value; 9768549e402SHong Zhang else *bap = value; 9778549e402SHong Zhang } 97849b5e25fSSatish Balay goto noinsert1; 97949b5e25fSSatish Balay } 98049b5e25fSSatish Balay } 98149b5e25fSSatish Balay 98249b5e25fSSatish Balay if (nonew == 1) goto noinsert1; 98308401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 984fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, brow, bcol, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 98549b5e25fSSatish Balay 9869371c9d4SSatish Balay N = nrow++ - 1; 9879371c9d4SSatish Balay high++; 98849b5e25fSSatish Balay /* shift up all the later entries in this row */ 9899566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 9909566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 9919566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 99249b5e25fSSatish Balay rp[i] = bcol; 99349b5e25fSSatish Balay ap[bs2 * i + bs * cidx + ridx] = value; 9948509e838SStefano Zampini /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 995ad540459SPierre Jolivet if (brow == bcol && ridx < cidx) ap[bs2 * i + bs * ridx + cidx] = value; 996e56f5c9eSBarry Smith A->nonzerostate++; 99749b5e25fSSatish Balay noinsert1:; 99849b5e25fSSatish Balay low = i; 9998549e402SHong Zhang } 100049b5e25fSSatish Balay } /* end of loop over added columns */ 100149b5e25fSSatish Balay ailen[brow] = nrow; 100249b5e25fSSatish Balay } /* end of loop over added rows */ 10033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 100449b5e25fSSatish Balay } 100549b5e25fSSatish Balay 1006d71ae5a4SJacob Faibussowitsch PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA, IS row, const MatFactorInfo *info) 1007d71ae5a4SJacob Faibussowitsch { 10084ccecd49SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)inA->data; 100949b5e25fSSatish Balay Mat outA; 1010ace3abfcSBarry Smith PetscBool row_identity; 101149b5e25fSSatish Balay 101249b5e25fSSatish Balay PetscFunctionBegin; 101308401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 is supported for in-place icc"); 10149566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 101528b400f6SJacob Faibussowitsch PetscCheck(row_identity, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix reordering is not supported"); 101608401ef6SPierre Jolivet PetscCheck(inA->rmap->bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix block size %" PetscInt_FMT " is not supported", inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! */ 1017c84f5b01SHong Zhang 101849b5e25fSSatish Balay outA = inA; 1019d5f3da31SBarry Smith inA->factortype = MAT_FACTOR_ICC; 10209566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 10219566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 102249b5e25fSSatish Balay 10239566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(inA)); 10249566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetNumericFactorization_inplace(inA, row_identity)); 102549b5e25fSSatish Balay 10269566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10279566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1028c84f5b01SHong Zhang a->row = row; 10299566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10309566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1031c84f5b01SHong Zhang a->col = row; 1032c84f5b01SHong Zhang 1033c84f5b01SHong Zhang /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */ 10349566063dSJacob Faibussowitsch if (a->icol) PetscCall(ISInvertPermutation(row, PETSC_DECIDE, &a->icol)); 103549b5e25fSSatish Balay 1036aa624791SPierre Jolivet if (!a->solve_work) PetscCall(PetscMalloc1(inA->rmap->N + inA->rmap->bs, &a->solve_work)); 103749b5e25fSSatish Balay 10389566063dSJacob Faibussowitsch PetscCall(MatCholeskyFactorNumeric(outA, inA, info)); 10393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 104049b5e25fSSatish Balay } 1041950f1e5bSHong Zhang 1042d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat, PetscInt *indices) 1043d71ae5a4SJacob Faibussowitsch { 1044045c9aa0SHong Zhang Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)mat->data; 104513f74950SBarry Smith PetscInt i, nz, n; 104649b5e25fSSatish Balay 104749b5e25fSSatish Balay PetscFunctionBegin; 10486c6c5352SBarry Smith nz = baij->maxnz; 1049d0f46423SBarry Smith n = mat->cmap->n; 105026fbe8dcSKarl Rupp for (i = 0; i < nz; i++) baij->j[i] = indices[i]; 105126fbe8dcSKarl Rupp 10526c6c5352SBarry Smith baij->nz = nz; 105326fbe8dcSKarl Rupp for (i = 0; i < n; i++) baij->ilen[i] = baij->imax[i]; 105426fbe8dcSKarl Rupp 10559566063dSJacob Faibussowitsch PetscCall(MatSetOption(mat, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 10563ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 105749b5e25fSSatish Balay } 105849b5e25fSSatish Balay 105949b5e25fSSatish Balay /*@ 106019585528SSatish Balay MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows 106111a5261eSBarry Smith in a `MATSEQSBAIJ` matrix. 106249b5e25fSSatish Balay 106349b5e25fSSatish Balay Input Parameters: 106411a5261eSBarry Smith + mat - the `MATSEQSBAIJ` matrix 106549b5e25fSSatish Balay - indices - the column indices 106649b5e25fSSatish Balay 106749b5e25fSSatish Balay Level: advanced 106849b5e25fSSatish Balay 106949b5e25fSSatish Balay Notes: 107049b5e25fSSatish Balay This can be called if you have precomputed the nonzero structure of the 107149b5e25fSSatish Balay matrix and want to provide it to the matrix object to improve the performance 107211a5261eSBarry Smith of the `MatSetValues()` operation. 107349b5e25fSSatish Balay 107449b5e25fSSatish Balay You MUST have set the correct numbers of nonzeros per row in the call to 107511a5261eSBarry Smith `MatCreateSeqSBAIJ()`, and the columns indices MUST be sorted. 107649b5e25fSSatish Balay 10772ef1f0ffSBarry Smith MUST be called before any calls to `MatSetValues()` 107849b5e25fSSatish Balay 1079*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ` 108049b5e25fSSatish Balay @*/ 1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat, PetscInt *indices) 1082d71ae5a4SJacob Faibussowitsch { 108349b5e25fSSatish Balay PetscFunctionBegin; 10840700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 1085dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 1086cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqSBAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 10873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 108849b5e25fSSatish Balay } 108949b5e25fSSatish Balay 1090d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqSBAIJ(Mat A, Mat B, MatStructure str) 1091d71ae5a4SJacob Faibussowitsch { 10924c7a3774SStefano Zampini PetscBool isbaij; 10933c896bc6SHong Zhang 10943c896bc6SHong Zhang PetscFunctionBegin; 10959566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &isbaij, MATSEQSBAIJ, MATMPISBAIJ, "")); 109628b400f6SJacob Faibussowitsch PetscCheck(isbaij, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Not for matrix type %s", ((PetscObject)B)->type_name); 10974c7a3774SStefano Zampini /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. */ 10984c7a3774SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 10993c896bc6SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11003c896bc6SHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 11013c896bc6SHong Zhang 110208401ef6SPierre Jolivet PetscCheck(a->i[a->mbs] == b->i[b->mbs], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different"); 110308401ef6SPierre Jolivet PetscCheck(a->mbs == b->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of rows in two matrices are different"); 110408401ef6SPierre Jolivet PetscCheck(a->bs2 == b->bs2, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different block size"); 11059566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, a->a, a->bs2 * a->i[a->mbs])); 11069566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 11073c896bc6SHong Zhang } else { 11089566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(A)); 11099566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 11109566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(A)); 11113c896bc6SHong Zhang } 11123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11133c896bc6SHong Zhang } 11143c896bc6SHong Zhang 1115d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1116d71ae5a4SJacob Faibussowitsch { 1117a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11185fd66863SKarl Rupp 1119a6ece127SHong Zhang PetscFunctionBegin; 1120a6ece127SHong Zhang *array = a->a; 11213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1122a6ece127SHong Zhang } 1123a6ece127SHong Zhang 1124d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1125d71ae5a4SJacob Faibussowitsch { 1126a6ece127SHong Zhang PetscFunctionBegin; 1127cda14afcSprj- *array = NULL; 11283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1129a6ece127SHong Zhang } 1130a6ece127SHong Zhang 1131d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y, Mat X, PetscInt *nnz) 1132d71ae5a4SJacob Faibussowitsch { 1133b264fe52SHong Zhang PetscInt bs = Y->rmap->bs, mbs = Y->rmap->N / bs; 113452768537SHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data; 113552768537SHong Zhang Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ *)Y->data; 113652768537SHong Zhang 113752768537SHong Zhang PetscFunctionBegin; 113852768537SHong Zhang /* Set the number of nonzeros in the new matrix */ 11399566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(mbs, x->i, x->j, y->i, y->j, nnz)); 11403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 114152768537SHong Zhang } 114252768537SHong Zhang 1143d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 1144d71ae5a4SJacob Faibussowitsch { 114542ee4b1aSHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data, *y = (Mat_SeqSBAIJ *)Y->data; 114631ce2d13SHong Zhang PetscInt bs = Y->rmap->bs, bs2 = bs * bs; 1147e838b9e7SJed Brown PetscBLASInt one = 1; 114842ee4b1aSHong Zhang 114942ee4b1aSHong Zhang PetscFunctionBegin; 1150134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 1151134adf20SPierre Jolivet PetscBool e = x->nz == y->nz && x->mbs == y->mbs ? PETSC_TRUE : PETSC_FALSE; 1152134adf20SPierre Jolivet if (e) { 11539566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, x->mbs + 1, &e)); 1154134adf20SPierre Jolivet if (e) { 11559566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, x->i[x->mbs], &e)); 1156134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 1157134adf20SPierre Jolivet } 1158134adf20SPierre Jolivet } 115954c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 1160134adf20SPierre Jolivet } 116142ee4b1aSHong Zhang if (str == SAME_NONZERO_PATTERN) { 1162f4df32b1SMatthew Knepley PetscScalar alpha = a; 1163c5df96a5SBarry Smith PetscBLASInt bnz; 11649566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz * bs2, &bnz)); 1165792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, x->a, &one, y->a, &one)); 11669566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 1167ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 11689566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_TRUE)); 11699566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 11709566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_FALSE)); 117142ee4b1aSHong Zhang } else { 117252768537SHong Zhang Mat B; 117352768537SHong Zhang PetscInt *nnz; 117454c59aa7SJacob Faibussowitsch PetscCheck(bs == X->rmap->bs, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Matrices must have same block size"); 11759566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(X)); 11769566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(Y)); 11779566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 11789566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 11799566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 11809566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, Y->rmap->n, Y->cmap->n, Y->rmap->N, Y->cmap->N)); 11819566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, Y, Y)); 11829566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 11839566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqSBAIJ(Y, X, nnz)); 11849566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 118552768537SHong Zhang 11869566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 118752768537SHong Zhang 11889566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 11899566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 11909566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(X)); 11919566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(Y)); 119242ee4b1aSHong Zhang } 11933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119442ee4b1aSHong Zhang } 119542ee4b1aSHong Zhang 1196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1197d71ae5a4SJacob Faibussowitsch { 1198efcf0fc3SBarry Smith PetscFunctionBegin; 1199efcf0fc3SBarry Smith *flg = PETSC_TRUE; 12003ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1201efcf0fc3SBarry Smith } 1202efcf0fc3SBarry Smith 1203d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A, PetscBool *flg) 1204d71ae5a4SJacob Faibussowitsch { 1205efcf0fc3SBarry Smith PetscFunctionBegin; 1206efcf0fc3SBarry Smith *flg = PETSC_TRUE; 12073ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1208efcf0fc3SBarry Smith } 1209efcf0fc3SBarry Smith 1210d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1211d71ae5a4SJacob Faibussowitsch { 1212efcf0fc3SBarry Smith PetscFunctionBegin; 1213efcf0fc3SBarry Smith *flg = PETSC_FALSE; 12143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1215efcf0fc3SBarry Smith } 1216efcf0fc3SBarry Smith 1217d71ae5a4SJacob Faibussowitsch PetscErrorCode MatConjugate_SeqSBAIJ(Mat A) 1218d71ae5a4SJacob Faibussowitsch { 12192726fb6dSPierre Jolivet #if defined(PETSC_USE_COMPLEX) 12202726fb6dSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 12212726fb6dSPierre Jolivet PetscInt i, nz = a->bs2 * a->i[a->mbs]; 12222726fb6dSPierre Jolivet MatScalar *aa = a->a; 12232726fb6dSPierre Jolivet 12242726fb6dSPierre Jolivet PetscFunctionBegin; 12252726fb6dSPierre Jolivet for (i = 0; i < nz; i++) aa[i] = PetscConj(aa[i]); 12262726fb6dSPierre Jolivet #else 12272726fb6dSPierre Jolivet PetscFunctionBegin; 12282726fb6dSPierre Jolivet #endif 12293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12302726fb6dSPierre Jolivet } 12312726fb6dSPierre Jolivet 1232d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqSBAIJ(Mat A) 1233d71ae5a4SJacob Faibussowitsch { 123499cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 123599cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1236dd6ea824SBarry Smith MatScalar *aa = a->a; 123799cafbc1SBarry Smith 123899cafbc1SBarry Smith PetscFunctionBegin; 123999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 12403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 124199cafbc1SBarry Smith } 124299cafbc1SBarry Smith 1243d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A) 1244d71ae5a4SJacob Faibussowitsch { 124599cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 124699cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1247dd6ea824SBarry Smith MatScalar *aa = a->a; 124899cafbc1SBarry Smith 124999cafbc1SBarry Smith PetscFunctionBegin; 125099cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 12513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 125299cafbc1SBarry Smith } 125399cafbc1SBarry Smith 1254d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A, PetscInt is_n, const PetscInt is_idx[], PetscScalar diag, Vec x, Vec b) 1255d71ae5a4SJacob Faibussowitsch { 12563bededecSBarry Smith Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)A->data; 12573bededecSBarry Smith PetscInt i, j, k, count; 12583bededecSBarry Smith PetscInt bs = A->rmap->bs, bs2 = baij->bs2, row, col; 12593bededecSBarry Smith PetscScalar zero = 0.0; 12603bededecSBarry Smith MatScalar *aa; 12613bededecSBarry Smith const PetscScalar *xx; 12623bededecSBarry Smith PetscScalar *bb; 126356777dd2SBarry Smith PetscBool *zeroed, vecs = PETSC_FALSE; 12643bededecSBarry Smith 12653bededecSBarry Smith PetscFunctionBegin; 12663bededecSBarry Smith /* fix right hand side if needed */ 12673bededecSBarry Smith if (x && b) { 12689566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 12699566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 127056777dd2SBarry Smith vecs = PETSC_TRUE; 12713bededecSBarry Smith } 12723bededecSBarry Smith 12733bededecSBarry Smith /* zero the columns */ 12749566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 12753bededecSBarry Smith for (i = 0; i < is_n; i++) { 1276aed4548fSBarry Smith PetscCheck(is_idx[i] >= 0 && is_idx[i] < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", is_idx[i]); 12773bededecSBarry Smith zeroed[is_idx[i]] = PETSC_TRUE; 12783bededecSBarry Smith } 127956777dd2SBarry Smith if (vecs) { 128056777dd2SBarry Smith for (i = 0; i < A->rmap->N; i++) { 128156777dd2SBarry Smith row = i / bs; 128256777dd2SBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 128356777dd2SBarry Smith for (k = 0; k < bs; k++) { 128456777dd2SBarry Smith col = bs * baij->j[j] + k; 128556777dd2SBarry Smith if (col <= i) continue; 128656777dd2SBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 128726fbe8dcSKarl Rupp if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0] * xx[col]; 128826fbe8dcSKarl Rupp if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0] * xx[i]; 128956777dd2SBarry Smith } 129056777dd2SBarry Smith } 129156777dd2SBarry Smith } 129226fbe8dcSKarl Rupp for (i = 0; i < is_n; i++) bb[is_idx[i]] = diag * xx[is_idx[i]]; 129356777dd2SBarry Smith } 129456777dd2SBarry Smith 12953bededecSBarry Smith for (i = 0; i < A->rmap->N; i++) { 12963bededecSBarry Smith if (!zeroed[i]) { 12973bededecSBarry Smith row = i / bs; 12983bededecSBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 12993bededecSBarry Smith for (k = 0; k < bs; k++) { 13003bededecSBarry Smith col = bs * baij->j[j] + k; 13013bededecSBarry Smith if (zeroed[col]) { 13023bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 13033bededecSBarry Smith aa[0] = 0.0; 13043bededecSBarry Smith } 13053bededecSBarry Smith } 13063bededecSBarry Smith } 13073bededecSBarry Smith } 13083bededecSBarry Smith } 13099566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 131056777dd2SBarry Smith if (vecs) { 13119566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 13129566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 131356777dd2SBarry Smith } 13143bededecSBarry Smith 13153bededecSBarry Smith /* zero the rows */ 13163bededecSBarry Smith for (i = 0; i < is_n; i++) { 13173bededecSBarry Smith row = is_idx[i]; 13183bededecSBarry Smith count = (baij->i[row / bs + 1] - baij->i[row / bs]) * bs; 13193bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + baij->i[row / bs] * bs2 + (row % bs); 13203bededecSBarry Smith for (k = 0; k < count; k++) { 13213bededecSBarry Smith aa[0] = zero; 13223bededecSBarry Smith aa += bs; 13233bededecSBarry Smith } 1324dbbe0bcdSBarry Smith if (diag != 0.0) PetscUseTypeMethod(A, setvalues, 1, &row, 1, &row, &diag, INSERT_VALUES); 13253bededecSBarry Smith } 13269566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqSBAIJ(A, MAT_FINAL_ASSEMBLY)); 13273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13283bededecSBarry Smith } 13293bededecSBarry Smith 1330d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqSBAIJ(Mat Y, PetscScalar a) 1331d71ae5a4SJacob Faibussowitsch { 13327d68702bSBarry Smith Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)Y->data; 13337d68702bSBarry Smith 13347d68702bSBarry Smith PetscFunctionBegin; 133548a46eb9SPierre Jolivet if (!Y->preallocated || !aij->nz) PetscCall(MatSeqSBAIJSetPreallocation(Y, Y->rmap->bs, 1, NULL)); 13369566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(Y, a)); 13373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13387d68702bSBarry Smith } 13397d68702bSBarry Smith 13403964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ, 134149b5e25fSSatish Balay MatGetRow_SeqSBAIJ, 134249b5e25fSSatish Balay MatRestoreRow_SeqSBAIJ, 134349b5e25fSSatish Balay MatMult_SeqSBAIJ_N, 134497304618SKris Buschelman /* 4*/ MatMultAdd_SeqSBAIJ_N, 1345431c96f7SBarry Smith MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */ 1346e005ede5SBarry Smith MatMultAdd_SeqSBAIJ_N, 1347f4259b30SLisandro Dalcin NULL, 1348f4259b30SLisandro Dalcin NULL, 1349f4259b30SLisandro Dalcin NULL, 1350f4259b30SLisandro Dalcin /* 10*/ NULL, 1351f4259b30SLisandro Dalcin NULL, 1352c078aec8SLisandro Dalcin MatCholeskyFactor_SeqSBAIJ, 135341f059aeSBarry Smith MatSOR_SeqSBAIJ, 135449b5e25fSSatish Balay MatTranspose_SeqSBAIJ, 135597304618SKris Buschelman /* 15*/ MatGetInfo_SeqSBAIJ, 135649b5e25fSSatish Balay MatEqual_SeqSBAIJ, 135749b5e25fSSatish Balay MatGetDiagonal_SeqSBAIJ, 135849b5e25fSSatish Balay MatDiagonalScale_SeqSBAIJ, 135949b5e25fSSatish Balay MatNorm_SeqSBAIJ, 1360f4259b30SLisandro Dalcin /* 20*/ NULL, 136149b5e25fSSatish Balay MatAssemblyEnd_SeqSBAIJ, 136249b5e25fSSatish Balay MatSetOption_SeqSBAIJ, 136349b5e25fSSatish Balay MatZeroEntries_SeqSBAIJ, 1364f4259b30SLisandro Dalcin /* 24*/ NULL, 1365f4259b30SLisandro Dalcin NULL, 1366f4259b30SLisandro Dalcin NULL, 1367f4259b30SLisandro Dalcin NULL, 1368f4259b30SLisandro Dalcin NULL, 136926cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 1370f4259b30SLisandro Dalcin NULL, 1371f4259b30SLisandro Dalcin NULL, 1372f4259b30SLisandro Dalcin NULL, 1373f4259b30SLisandro Dalcin NULL, 1374d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqSBAIJ, 1375f4259b30SLisandro Dalcin NULL, 1376f4259b30SLisandro Dalcin NULL, 1377f4259b30SLisandro Dalcin NULL, 1378c84f5b01SHong Zhang MatICCFactor_SeqSBAIJ, 1379d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqSBAIJ, 13807dae84e0SHong Zhang MatCreateSubMatrices_SeqSBAIJ, 138149b5e25fSSatish Balay MatIncreaseOverlap_SeqSBAIJ, 138249b5e25fSSatish Balay MatGetValues_SeqSBAIJ, 13833c896bc6SHong Zhang MatCopy_SeqSBAIJ, 1384f4259b30SLisandro Dalcin /* 44*/ NULL, 138549b5e25fSSatish Balay MatScale_SeqSBAIJ, 13867d68702bSBarry Smith MatShift_SeqSBAIJ, 1387f4259b30SLisandro Dalcin NULL, 13883bededecSBarry Smith MatZeroRowsColumns_SeqSBAIJ, 1389f4259b30SLisandro Dalcin /* 49*/ NULL, 139049b5e25fSSatish Balay MatGetRowIJ_SeqSBAIJ, 139149b5e25fSSatish Balay MatRestoreRowIJ_SeqSBAIJ, 1392f4259b30SLisandro Dalcin NULL, 1393f4259b30SLisandro Dalcin NULL, 1394f4259b30SLisandro Dalcin /* 54*/ NULL, 1395f4259b30SLisandro Dalcin NULL, 1396f4259b30SLisandro Dalcin NULL, 1397dc29a518SPierre Jolivet MatPermute_SeqSBAIJ, 139849b5e25fSSatish Balay MatSetValuesBlocked_SeqSBAIJ, 13997dae84e0SHong Zhang /* 59*/ MatCreateSubMatrix_SeqSBAIJ, 1400f4259b30SLisandro Dalcin NULL, 1401f4259b30SLisandro Dalcin NULL, 1402f4259b30SLisandro Dalcin NULL, 1403f4259b30SLisandro Dalcin NULL, 1404f4259b30SLisandro Dalcin /* 64*/ NULL, 1405f4259b30SLisandro Dalcin NULL, 1406f4259b30SLisandro Dalcin NULL, 1407f4259b30SLisandro Dalcin NULL, 1408f4259b30SLisandro Dalcin NULL, 1409d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqSBAIJ, 1410f4259b30SLisandro Dalcin NULL, 141128d58a37SPierre Jolivet MatConvert_MPISBAIJ_Basic, 1412f4259b30SLisandro Dalcin NULL, 1413f4259b30SLisandro Dalcin NULL, 1414f4259b30SLisandro Dalcin /* 74*/ NULL, 1415f4259b30SLisandro Dalcin NULL, 1416f4259b30SLisandro Dalcin NULL, 1417f4259b30SLisandro Dalcin NULL, 1418f4259b30SLisandro Dalcin NULL, 1419f4259b30SLisandro Dalcin /* 79*/ NULL, 1420f4259b30SLisandro Dalcin NULL, 1421f4259b30SLisandro Dalcin NULL, 142297304618SKris Buschelman MatGetInertia_SeqSBAIJ, 14235bba2384SShri Abhyankar MatLoad_SeqSBAIJ, 1424d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqSBAIJ, 1425865e5f61SKris Buschelman MatIsHermitian_SeqSBAIJ, 1426efcf0fc3SBarry Smith MatIsStructurallySymmetric_SeqSBAIJ, 1427f4259b30SLisandro Dalcin NULL, 1428f4259b30SLisandro Dalcin NULL, 1429f4259b30SLisandro Dalcin /* 89*/ NULL, 1430f4259b30SLisandro Dalcin NULL, 1431f4259b30SLisandro Dalcin NULL, 1432f4259b30SLisandro Dalcin NULL, 1433f4259b30SLisandro Dalcin NULL, 1434f4259b30SLisandro Dalcin /* 94*/ NULL, 1435f4259b30SLisandro Dalcin NULL, 1436f4259b30SLisandro Dalcin NULL, 1437f4259b30SLisandro Dalcin NULL, 1438f4259b30SLisandro Dalcin NULL, 1439f4259b30SLisandro Dalcin /* 99*/ NULL, 1440f4259b30SLisandro Dalcin NULL, 1441f4259b30SLisandro Dalcin NULL, 14422726fb6dSPierre Jolivet MatConjugate_SeqSBAIJ, 1443f4259b30SLisandro Dalcin NULL, 1444f4259b30SLisandro Dalcin /*104*/ NULL, 144599cafbc1SBarry Smith MatRealPart_SeqSBAIJ, 1446f5edf698SHong Zhang MatImaginaryPart_SeqSBAIJ, 1447f5edf698SHong Zhang MatGetRowUpperTriangular_SeqSBAIJ, 14482af78befSBarry Smith MatRestoreRowUpperTriangular_SeqSBAIJ, 1449f4259b30SLisandro Dalcin /*109*/ NULL, 1450f4259b30SLisandro Dalcin NULL, 1451f4259b30SLisandro Dalcin NULL, 1452f4259b30SLisandro Dalcin NULL, 1453547795f9SHong Zhang MatMissingDiagonal_SeqSBAIJ, 1454f4259b30SLisandro Dalcin /*114*/ NULL, 1455f4259b30SLisandro Dalcin NULL, 1456f4259b30SLisandro Dalcin NULL, 1457f4259b30SLisandro Dalcin NULL, 1458f4259b30SLisandro Dalcin NULL, 1459f4259b30SLisandro Dalcin /*119*/ NULL, 1460f4259b30SLisandro Dalcin NULL, 1461f4259b30SLisandro Dalcin NULL, 1462f4259b30SLisandro Dalcin NULL, 1463f4259b30SLisandro Dalcin NULL, 1464f4259b30SLisandro Dalcin /*124*/ NULL, 1465f4259b30SLisandro Dalcin NULL, 1466f4259b30SLisandro Dalcin NULL, 1467f4259b30SLisandro Dalcin NULL, 1468f4259b30SLisandro Dalcin NULL, 1469f4259b30SLisandro Dalcin /*129*/ NULL, 1470f4259b30SLisandro Dalcin NULL, 1471f4259b30SLisandro Dalcin NULL, 1472f4259b30SLisandro Dalcin NULL, 1473f4259b30SLisandro Dalcin NULL, 1474f4259b30SLisandro Dalcin /*134*/ NULL, 1475f4259b30SLisandro Dalcin NULL, 1476f4259b30SLisandro Dalcin NULL, 1477f4259b30SLisandro Dalcin NULL, 1478f4259b30SLisandro Dalcin NULL, 147946533700Sstefano_zampini /*139*/ MatSetBlockSizes_Default, 1480f4259b30SLisandro Dalcin NULL, 1481f4259b30SLisandro Dalcin NULL, 1482f4259b30SLisandro Dalcin NULL, 1483f4259b30SLisandro Dalcin NULL, 1484d70f29a3SPierre Jolivet /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ, 1485d70f29a3SPierre Jolivet NULL, 1486d70f29a3SPierre Jolivet NULL, 148799a7f59eSMark Adams NULL, 148899a7f59eSMark Adams NULL, 14897fb60732SBarry Smith NULL, 1490dec0b466SHong Zhang /*150*/ NULL, 1491dec0b466SHong Zhang NULL}; 1492be1d678aSKris Buschelman 1493d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat) 1494d71ae5a4SJacob Faibussowitsch { 14954afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1496d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 149749b5e25fSSatish Balay 149849b5e25fSSatish Balay PetscFunctionBegin; 149908401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 150049b5e25fSSatish Balay 150149b5e25fSSatish Balay /* allocate space for values if not already there */ 150248a46eb9SPierre Jolivet if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); 150349b5e25fSSatish Balay 150449b5e25fSSatish Balay /* copy values over */ 15059566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 15063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 150749b5e25fSSatish Balay } 150849b5e25fSSatish Balay 1509d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat) 1510d71ae5a4SJacob Faibussowitsch { 15114afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1512d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 151349b5e25fSSatish Balay 151449b5e25fSSatish Balay PetscFunctionBegin; 151508401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 151628b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 151749b5e25fSSatish Balay 151849b5e25fSSatish Balay /* copy values over */ 15199566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 15203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 152149b5e25fSSatish Balay } 152249b5e25fSSatish Balay 1523d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B, PetscInt bs, PetscInt nz, PetscInt *nnz) 1524d71ae5a4SJacob Faibussowitsch { 1525c464158bSHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 15264dcd73b1SHong Zhang PetscInt i, mbs, nbs, bs2; 15272576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, flg = PETSC_FALSE, realalloc = PETSC_FALSE; 152849b5e25fSSatish Balay 1529ad79cf63SBarry Smith if (B->hash_active) { 1530ad79cf63SBarry Smith PetscInt bs; 1531ad79cf63SBarry Smith PetscCall(PetscMemcpy(&B->ops, &b->cops, sizeof(*(B->ops)))); 1532ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 1533ad79cf63SBarry Smith PetscCall(MatGetBlockSize(B, &bs)); 1534ad79cf63SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&b->bht)); 1535ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 1536ad79cf63SBarry Smith PetscCall(PetscFree(b->bdnz)); 1537ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 1538ad79cf63SBarry Smith } 153949b5e25fSSatish Balay PetscFunctionBegin; 15402576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 1541db4efbfdSBarry Smith 15429566063dSJacob Faibussowitsch PetscCall(MatSetBlockSize(B, PetscAbs(bs))); 15439566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 15449566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 154508401ef6SPierre Jolivet PetscCheck(B->rmap->N <= B->cmap->N, PETSC_COMM_SELF, PETSC_ERR_SUP, "SEQSBAIJ matrix cannot have more rows %" PetscInt_FMT " than columns %" PetscInt_FMT, B->rmap->N, B->cmap->N); 15469566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 1547899cda47SBarry Smith 154821940c7eSstefano_zampini B->preallocated = PETSC_TRUE; 154921940c7eSstefano_zampini 1550d0f46423SBarry Smith mbs = B->rmap->N / bs; 15514dcd73b1SHong Zhang nbs = B->cmap->n / bs; 155249b5e25fSSatish Balay bs2 = bs * bs; 155349b5e25fSSatish Balay 1554aed4548fSBarry Smith PetscCheck(mbs * bs == B->rmap->N && nbs * bs == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Number rows, cols must be divisible by blocksize"); 155549b5e25fSSatish Balay 1556ab93d7beSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 1557ab93d7beSBarry Smith skipallocation = PETSC_TRUE; 1558ab93d7beSBarry Smith nz = 0; 1559ab93d7beSBarry Smith } 1560ab93d7beSBarry Smith 1561435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3; 156208401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 156349b5e25fSSatish Balay if (nnz) { 156449b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 156508401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 156608401ef6SPierre Jolivet PetscCheck(nnz[i] <= nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than block row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " block rowlength %" PetscInt_FMT, i, nnz[i], nbs); 156749b5e25fSSatish Balay } 156849b5e25fSSatish Balay } 156949b5e25fSSatish Balay 1570db4efbfdSBarry Smith B->ops->mult = MatMult_SeqSBAIJ_N; 1571db4efbfdSBarry Smith B->ops->multadd = MatMultAdd_SeqSBAIJ_N; 1572db4efbfdSBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_N; 1573db4efbfdSBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N; 157426fbe8dcSKarl Rupp 15759566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 157649b5e25fSSatish Balay if (!flg) { 157749b5e25fSSatish Balay switch (bs) { 157849b5e25fSSatish Balay case 1: 157949b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_1; 158049b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_1; 1581431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_1; 1582431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1; 158349b5e25fSSatish Balay break; 158449b5e25fSSatish Balay case 2: 158549b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_2; 158649b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_2; 1587431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_2; 1588431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2; 158949b5e25fSSatish Balay break; 159049b5e25fSSatish Balay case 3: 159149b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_3; 159249b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_3; 1593431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_3; 1594431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3; 159549b5e25fSSatish Balay break; 159649b5e25fSSatish Balay case 4: 159749b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_4; 159849b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_4; 1599431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_4; 1600431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4; 160149b5e25fSSatish Balay break; 160249b5e25fSSatish Balay case 5: 160349b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_5; 160449b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_5; 1605431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_5; 1606431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5; 160749b5e25fSSatish Balay break; 160849b5e25fSSatish Balay case 6: 160949b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_6; 161049b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_6; 1611431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_6; 1612431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6; 161349b5e25fSSatish Balay break; 161449b5e25fSSatish Balay case 7: 1615de53e5efSHong Zhang B->ops->mult = MatMult_SeqSBAIJ_7; 161649b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_7; 1617431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_7; 1618431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7; 161949b5e25fSSatish Balay break; 162049b5e25fSSatish Balay } 162149b5e25fSSatish Balay } 162249b5e25fSSatish Balay 162349b5e25fSSatish Balay b->mbs = mbs; 16244dcd73b1SHong Zhang b->nbs = nbs; 1625ab93d7beSBarry Smith if (!skipallocation) { 16262ee49352SLisandro Dalcin if (!b->imax) { 16279566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mbs, &b->imax, mbs, &b->ilen)); 162826fbe8dcSKarl Rupp 1629c760cd28SBarry Smith b->free_imax_ilen = PETSC_TRUE; 16302ee49352SLisandro Dalcin } 163149b5e25fSSatish Balay if (!nnz) { 1632435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 163349b5e25fSSatish Balay else if (nz <= 0) nz = 1; 16345d2a9ed1SStefano Zampini nz = PetscMin(nbs, nz); 163526fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->imax[i] = nz; 16369566063dSJacob Faibussowitsch PetscCall(PetscIntMultError(nz, mbs, &nz)); 163749b5e25fSSatish Balay } else { 1638c73702f5SBarry Smith PetscInt64 nz64 = 0; 16399371c9d4SSatish Balay for (i = 0; i < mbs; i++) { 16409371c9d4SSatish Balay b->imax[i] = nnz[i]; 16419371c9d4SSatish Balay nz64 += nnz[i]; 16429371c9d4SSatish Balay } 16439566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 164449b5e25fSSatish Balay } 16452ee49352SLisandro Dalcin /* b->ilen will count nonzeros in each block row so far. */ 164626fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->ilen[i] = 0; 16476c6c5352SBarry Smith /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */ 164849b5e25fSSatish Balay 164949b5e25fSSatish Balay /* allocate the matrix space */ 16509566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 16519566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &b->a, nz, &b->j, B->rmap->N + 1, &b->i)); 16529566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->a, nz * bs2)); 16539566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->j, nz)); 165426fbe8dcSKarl Rupp 165549b5e25fSSatish Balay b->singlemalloc = PETSC_TRUE; 165649b5e25fSSatish Balay 165749b5e25fSSatish Balay /* pointer to beginning of each row */ 1658e60cf9a0SBarry Smith b->i[0] = 0; 165926fbe8dcSKarl Rupp for (i = 1; i < mbs + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 166026fbe8dcSKarl Rupp 1661e6b907acSBarry Smith b->free_a = PETSC_TRUE; 1662e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 1663e811da20SHong Zhang } else { 1664e6b907acSBarry Smith b->free_a = PETSC_FALSE; 1665e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 1666ab93d7beSBarry Smith } 166749b5e25fSSatish Balay 166849b5e25fSSatish Balay b->bs2 = bs2; 16696c6c5352SBarry Smith b->nz = 0; 1670b32cb4a7SJed Brown b->maxnz = nz; 1671f4259b30SLisandro Dalcin b->inew = NULL; 1672f4259b30SLisandro Dalcin b->jnew = NULL; 1673f4259b30SLisandro Dalcin b->anew = NULL; 1674f4259b30SLisandro Dalcin b->a2anew = NULL; 16751a3463dfSHong Zhang b->permute = PETSC_FALSE; 1676cb7b82ddSBarry Smith 1677cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 1678cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 16799566063dSJacob Faibussowitsch if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 16803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1681c464158bSHong Zhang } 1682153ea458SHong Zhang 1683d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B, PetscInt bs, const PetscInt ii[], const PetscInt jj[], const PetscScalar V[]) 1684d71ae5a4SJacob Faibussowitsch { 16850cd7f59aSBarry Smith PetscInt i, j, m, nz, anz, nz_max = 0, *nnz; 1686f4259b30SLisandro Dalcin PetscScalar *values = NULL; 168738f409ebSLisandro Dalcin PetscBool roworiented = ((Mat_SeqSBAIJ *)B->data)->roworiented; 16880cd7f59aSBarry Smith 168938f409ebSLisandro Dalcin PetscFunctionBegin; 169008401ef6SPierre Jolivet PetscCheck(bs >= 1, PetscObjectComm((PetscObject)B), PETSC_ERR_ARG_OUTOFRANGE, "Invalid block size specified, must be positive but it is %" PetscInt_FMT, bs); 16919566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->rmap, bs)); 16929566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->cmap, bs)); 16939566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 16949566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 16959566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 169638f409ebSLisandro Dalcin m = B->rmap->n / bs; 169738f409ebSLisandro Dalcin 1698aed4548fSBarry Smith PetscCheck(!ii[0], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "ii[0] must be 0 but it is %" PetscInt_FMT, ii[0]); 16999566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 170038f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 170138f409ebSLisandro Dalcin nz = ii[i + 1] - ii[i]; 170208401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 17030cd7f59aSBarry Smith anz = 0; 17040cd7f59aSBarry Smith for (j = 0; j < nz; j++) { 17050cd7f59aSBarry Smith /* count only values on the diagonal or above */ 17060cd7f59aSBarry Smith if (jj[ii[i] + j] >= i) { 17070cd7f59aSBarry Smith anz = nz - j; 17080cd7f59aSBarry Smith break; 17090cd7f59aSBarry Smith } 17100cd7f59aSBarry Smith } 17110cd7f59aSBarry Smith nz_max = PetscMax(nz_max, anz); 17120cd7f59aSBarry Smith nnz[i] = anz; 171338f409ebSLisandro Dalcin } 17149566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 17159566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 171638f409ebSLisandro Dalcin 171738f409ebSLisandro Dalcin values = (PetscScalar *)V; 171848a46eb9SPierre Jolivet if (!values) PetscCall(PetscCalloc1(bs * bs * nz_max, &values)); 171938f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 172038f409ebSLisandro Dalcin PetscInt ncols = ii[i + 1] - ii[i]; 172138f409ebSLisandro Dalcin const PetscInt *icols = jj + ii[i]; 172238f409ebSLisandro Dalcin if (!roworiented || bs == 1) { 172338f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * ii[i]) : 0); 17249566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, ncols, icols, svals, INSERT_VALUES)); 172538f409ebSLisandro Dalcin } else { 172638f409ebSLisandro Dalcin for (j = 0; j < ncols; j++) { 172738f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * (ii[i] + j)) : 0); 17289566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, 1, &icols[j], svals, INSERT_VALUES)); 172938f409ebSLisandro Dalcin } 173038f409ebSLisandro Dalcin } 173138f409ebSLisandro Dalcin } 17329566063dSJacob Faibussowitsch if (!V) PetscCall(PetscFree(values)); 17339566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 17349566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 17359566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 17363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 173738f409ebSLisandro Dalcin } 173838f409ebSLisandro Dalcin 1739db4efbfdSBarry Smith /* 1740db4efbfdSBarry Smith This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization 1741db4efbfdSBarry Smith */ 1742d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B, PetscBool natural) 1743d71ae5a4SJacob Faibussowitsch { 1744ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 1745db4efbfdSBarry Smith PetscInt bs = B->rmap->bs; 1746db4efbfdSBarry Smith 1747db4efbfdSBarry Smith PetscFunctionBegin; 17489566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 1749db4efbfdSBarry Smith if (flg) bs = 8; 1750db4efbfdSBarry Smith 1751db4efbfdSBarry Smith if (!natural) { 1752db4efbfdSBarry Smith switch (bs) { 1753d71ae5a4SJacob Faibussowitsch case 1: 1754d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace; 1755d71ae5a4SJacob Faibussowitsch break; 1756d71ae5a4SJacob Faibussowitsch case 2: 1757d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2; 1758d71ae5a4SJacob Faibussowitsch break; 1759d71ae5a4SJacob Faibussowitsch case 3: 1760d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3; 1761d71ae5a4SJacob Faibussowitsch break; 1762d71ae5a4SJacob Faibussowitsch case 4: 1763d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4; 1764d71ae5a4SJacob Faibussowitsch break; 1765d71ae5a4SJacob Faibussowitsch case 5: 1766d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5; 1767d71ae5a4SJacob Faibussowitsch break; 1768d71ae5a4SJacob Faibussowitsch case 6: 1769d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6; 1770d71ae5a4SJacob Faibussowitsch break; 1771d71ae5a4SJacob Faibussowitsch case 7: 1772d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7; 1773d71ae5a4SJacob Faibussowitsch break; 1774d71ae5a4SJacob Faibussowitsch default: 1775d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N; 1776d71ae5a4SJacob Faibussowitsch break; 1777db4efbfdSBarry Smith } 1778db4efbfdSBarry Smith } else { 1779db4efbfdSBarry Smith switch (bs) { 1780d71ae5a4SJacob Faibussowitsch case 1: 1781d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace; 1782d71ae5a4SJacob Faibussowitsch break; 1783d71ae5a4SJacob Faibussowitsch case 2: 1784d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering; 1785d71ae5a4SJacob Faibussowitsch break; 1786d71ae5a4SJacob Faibussowitsch case 3: 1787d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering; 1788d71ae5a4SJacob Faibussowitsch break; 1789d71ae5a4SJacob Faibussowitsch case 4: 1790d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering; 1791d71ae5a4SJacob Faibussowitsch break; 1792d71ae5a4SJacob Faibussowitsch case 5: 1793d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering; 1794d71ae5a4SJacob Faibussowitsch break; 1795d71ae5a4SJacob Faibussowitsch case 6: 1796d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering; 1797d71ae5a4SJacob Faibussowitsch break; 1798d71ae5a4SJacob Faibussowitsch case 7: 1799d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering; 1800d71ae5a4SJacob Faibussowitsch break; 1801d71ae5a4SJacob Faibussowitsch default: 1802d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering; 1803d71ae5a4SJacob Faibussowitsch break; 1804db4efbfdSBarry Smith } 1805db4efbfdSBarry Smith } 18063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1807db4efbfdSBarry Smith } 1808db4efbfdSBarry Smith 1809cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType, MatReuse, Mat *); 1810cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType, MatReuse, Mat *); 1811d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatFactorGetSolverType_petsc(Mat A, MatSolverType *type) 1812d71ae5a4SJacob Faibussowitsch { 18134ac6704cSBarry Smith PetscFunctionBegin; 18144ac6704cSBarry Smith *type = MATSOLVERPETSC; 18153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18164ac6704cSBarry Smith } 1817d769727bSBarry Smith 1818d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A, MatFactorType ftype, Mat *B) 1819d71ae5a4SJacob Faibussowitsch { 1820d0f46423SBarry Smith PetscInt n = A->rmap->n; 18215c9eb25fSBarry Smith 18225c9eb25fSBarry Smith PetscFunctionBegin; 18230e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX) 1824b94d7dedSBarry Smith PetscCheck(A->hermitian != PETSC_BOOL3_TRUE || A->symmetric == PETSC_BOOL3_TRUE || (ftype != MAT_FACTOR_CHOLESKY && ftype != MAT_FACTOR_ICC), PETSC_COMM_SELF, PETSC_ERR_SUP, "Hermitian CHOLESKY or ICC Factor is not supported"); 18250e92d65fSHong Zhang #endif 1826eb1ec7c1SStefano Zampini 18279566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 18289566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, n, n, n, n)); 18295c9eb25fSBarry Smith if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) { 18309566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATSEQSBAIJ)); 18319566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*B, A->rmap->bs, MAT_SKIP_ALLOCATION, NULL)); 183226fbe8dcSKarl Rupp 18337b056e98SHong Zhang (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ; 1834c6d0d4f0SHong Zhang (*B)->ops->iccfactorsymbolic = MatICCFactorSymbolic_SeqSBAIJ; 18359566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_CHOLESKY])); 18369566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_ICC])); 1837e32f2f54SBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "Factor type not supported"); 183800c67f3bSHong Zhang 1839d5f3da31SBarry Smith (*B)->factortype = ftype; 1840f73b0415SBarry Smith (*B)->canuseordering = PETSC_TRUE; 18419566063dSJacob Faibussowitsch PetscCall(PetscFree((*B)->solvertype)); 18429566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &(*B)->solvertype)); 18439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)*B, "MatFactorGetSolverType_C", MatFactorGetSolverType_petsc)); 18443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18455c9eb25fSBarry Smith } 18465c9eb25fSBarry Smith 18478397e458SBarry Smith /*@C 18482ef1f0ffSBarry Smith MatSeqSBAIJGetArray - gives access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored 18498397e458SBarry Smith 18508397e458SBarry Smith Not Collective 18518397e458SBarry Smith 18528397e458SBarry Smith Input Parameter: 185311a5261eSBarry Smith . mat - a `MATSEQSBAIJ` matrix 18548397e458SBarry Smith 18558397e458SBarry Smith Output Parameter: 18568397e458SBarry Smith . array - pointer to the data 18578397e458SBarry Smith 18588397e458SBarry Smith Level: intermediate 18598397e458SBarry Smith 1860*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJRestoreArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18618397e458SBarry Smith @*/ 1862d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJGetArray(Mat A, PetscScalar **array) 1863d71ae5a4SJacob Faibussowitsch { 18648397e458SBarry Smith PetscFunctionBegin; 1865cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJGetArray_C", (Mat, PetscScalar **), (A, array)); 18663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18678397e458SBarry Smith } 18688397e458SBarry Smith 18698397e458SBarry Smith /*@C 18702ef1f0ffSBarry Smith MatSeqSBAIJRestoreArray - returns access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored obtained by `MatSeqSBAIJGetArray()` 18718397e458SBarry Smith 18728397e458SBarry Smith Not Collective 18738397e458SBarry Smith 18748397e458SBarry Smith Input Parameters: 18752ef1f0ffSBarry Smith + mat - a `MATSEQSBAIJ` matrix 1876a2b725a8SWilliam Gropp - array - pointer to the data 18778397e458SBarry Smith 18788397e458SBarry Smith Level: intermediate 18798397e458SBarry Smith 1880*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJGetArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18818397e458SBarry Smith @*/ 1882d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJRestoreArray(Mat A, PetscScalar **array) 1883d71ae5a4SJacob Faibussowitsch { 18848397e458SBarry Smith PetscFunctionBegin; 1885cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJRestoreArray_C", (Mat, PetscScalar **), (A, array)); 18863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18878397e458SBarry Smith } 18888397e458SBarry Smith 18890bad9183SKris Buschelman /*MC 1890fafad747SKris Buschelman MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices, 18910bad9183SKris Buschelman based on block compressed sparse row format. Only the upper triangular portion of the matrix is stored. 18920bad9183SKris Buschelman 1893828413b8SBarry Smith For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you 189411a5261eSBarry Smith can call `MatSetOption`(`Mat`, `MAT_HERMITIAN`). 1895828413b8SBarry Smith 18962ef1f0ffSBarry Smith Options Database Key: 189711a5261eSBarry Smith . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to `MatSetFromOptions()` 18980bad9183SKris Buschelman 18992ef1f0ffSBarry Smith Level: beginner 19002ef1f0ffSBarry Smith 190195452b02SPatrick Sanan Notes: 190295452b02SPatrick Sanan By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not 190311a5261eSBarry Smith stored and it is assumed they symmetric to the upper triangular). If you call `MatSetOption`(`Mat`,`MAT_IGNORE_LOWER_TRIANGULAR`,`PETSC_FALSE`) or use 19042ef1f0ffSBarry Smith the options database `-mat_ignore_lower_triangular` false it will generate an error if you try to set a value in the lower triangular portion. 190571dad5bbSBarry Smith 1906476417e5SBarry Smith The number of rows in the matrix must be less than or equal to the number of columns 190771dad5bbSBarry Smith 1908*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ()`, `MatType`, `MATMPISBAIJ` 19090bad9183SKris Buschelman M*/ 1910d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B) 1911d71ae5a4SJacob Faibussowitsch { 1912a23d5eceSKris Buschelman Mat_SeqSBAIJ *b; 191313f74950SBarry Smith PetscMPIInt size; 1914ace3abfcSBarry Smith PetscBool no_unroll = PETSC_FALSE, no_inode = PETSC_FALSE; 1915a23d5eceSKris Buschelman 1916a23d5eceSKris Buschelman PetscFunctionBegin; 19179566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 191808401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Comm must be of size 1"); 1919a23d5eceSKris Buschelman 19204dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 1921a23d5eceSKris Buschelman B->data = (void *)b; 19229566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 192326fbe8dcSKarl Rupp 1924a23d5eceSKris Buschelman B->ops->destroy = MatDestroy_SeqSBAIJ; 1925a23d5eceSKris Buschelman B->ops->view = MatView_SeqSBAIJ; 1926f4259b30SLisandro Dalcin b->row = NULL; 1927f4259b30SLisandro Dalcin b->icol = NULL; 1928a23d5eceSKris Buschelman b->reallocs = 0; 1929f4259b30SLisandro Dalcin b->saved_values = NULL; 19300def2e27SBarry Smith b->inode.limit = 5; 19310def2e27SBarry Smith b->inode.max_limit = 5; 1932a23d5eceSKris Buschelman 1933a23d5eceSKris Buschelman b->roworiented = PETSC_TRUE; 1934a23d5eceSKris Buschelman b->nonew = 0; 1935f4259b30SLisandro Dalcin b->diag = NULL; 1936f4259b30SLisandro Dalcin b->solve_work = NULL; 1937f4259b30SLisandro Dalcin b->mult_work = NULL; 1938f4259b30SLisandro Dalcin B->spptr = NULL; 1939f2cbd3d5SJed Brown B->info.nz_unneeded = (PetscReal)b->maxnz * b->bs2; 1940a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 1941a23d5eceSKris Buschelman 1942f4259b30SLisandro Dalcin b->inew = NULL; 1943f4259b30SLisandro Dalcin b->jnew = NULL; 1944f4259b30SLisandro Dalcin b->anew = NULL; 1945f4259b30SLisandro Dalcin b->a2anew = NULL; 1946a23d5eceSKris Buschelman b->permute = PETSC_FALSE; 1947a23d5eceSKris Buschelman 194871dad5bbSBarry Smith b->ignore_ltriangular = PETSC_TRUE; 194926fbe8dcSKarl Rupp 19509566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_ignore_lower_triangular", &b->ignore_ltriangular, NULL)); 1951941593c8SHong Zhang 1952f5edf698SHong Zhang b->getrow_utriangular = PETSC_FALSE; 195326fbe8dcSKarl Rupp 19549566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_getrow_uppertriangular", &b->getrow_utriangular, NULL)); 1955f5edf698SHong Zhang 19569566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJGetArray_C", MatSeqSBAIJGetArray_SeqSBAIJ)); 19579566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJRestoreArray_C", MatSeqSBAIJRestoreArray_SeqSBAIJ)); 19589566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqSBAIJ)); 19599566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqSBAIJ)); 19609566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetColumnIndices_C", MatSeqSBAIJSetColumnIndices_SeqSBAIJ)); 19619566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqaij_C", MatConvert_SeqSBAIJ_SeqAIJ)); 19629566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqbaij_C", MatConvert_SeqSBAIJ_SeqBAIJ)); 19639566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocation_C", MatSeqSBAIJSetPreallocation_SeqSBAIJ)); 19649566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocationCSR_C", MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ)); 19656214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 19669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_elemental_C", MatConvert_SeqSBAIJ_Elemental)); 19676214f412SHong Zhang #endif 1968d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 19699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_scalapack_C", MatConvert_SBAIJ_ScaLAPACK)); 1970d24d4204SJose E. Roman #endif 197123ce1328SBarry Smith 1972b94d7dedSBarry Smith B->symmetry_eternal = PETSC_TRUE; 1973b94d7dedSBarry Smith B->structural_symmetry_eternal = PETSC_TRUE; 1974b94d7dedSBarry Smith B->symmetric = PETSC_BOOL3_TRUE; 1975b94d7dedSBarry Smith B->structurally_symmetric = PETSC_BOOL3_TRUE; 1976eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 1977b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_FALSE; 1978eb1ec7c1SStefano Zampini #else 1979b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_TRUE; 1980eb1ec7c1SStefano Zampini #endif 198113647f61SHong Zhang 19829566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQSBAIJ)); 19830def2e27SBarry Smith 1984d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)B), ((PetscObject)B)->prefix, "Options for SEQSBAIJ matrix", "Mat"); 19859566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_unroll", "Do not optimize for inodes (slower)", NULL, no_unroll, &no_unroll, NULL)); 198648a46eb9SPierre Jolivet if (no_unroll) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_unroll\n")); 19879566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_inode", "Do not optimize for inodes (slower)", NULL, no_inode, &no_inode, NULL)); 19889566063dSJacob Faibussowitsch if (no_inode) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_inode\n")); 19899566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-mat_inode_limit", "Do not use inodes larger then this value", NULL, b->inode.limit, &b->inode.limit, NULL)); 1990d0609cedSBarry Smith PetscOptionsEnd(); 1991ace3abfcSBarry Smith b->inode.use = (PetscBool)(!(no_unroll || no_inode)); 19920def2e27SBarry Smith if (b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit; 19933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1994a23d5eceSKris Buschelman } 1995a23d5eceSKris Buschelman 1996a23d5eceSKris Buschelman /*@C 1997a23d5eceSKris Buschelman MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block 199811a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 199920f4b53cSBarry Smith user should preallocate the matrix storage by setting the parameter `nz` 200020f4b53cSBarry Smith (or the array `nnz`). 2001a23d5eceSKris Buschelman 2002c3339decSBarry Smith Collective 2003a23d5eceSKris Buschelman 2004a23d5eceSKris Buschelman Input Parameters: 20051c4f3114SJed Brown + B - the symmetric matrix 200611a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 200711a5261eSBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()` 2008a23d5eceSKris Buschelman . nz - number of block nonzeros per block row (same for all rows) 2009a23d5eceSKris Buschelman - nnz - array containing the number of block nonzeros in the upper triangular plus 20102ef1f0ffSBarry Smith diagonal portion of each block (possibly different for each block row) or `NULL` 2011a23d5eceSKris Buschelman 2012a23d5eceSKris Buschelman Options Database Keys: 2013a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2014a23d5eceSKris Buschelman block calculations (much slower) 2015a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use (only works if a negative bs is passed in 2016a23d5eceSKris Buschelman 2017a23d5eceSKris Buschelman Level: intermediate 2018a23d5eceSKris Buschelman 2019a23d5eceSKris Buschelman Notes: 202020f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 20212ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 2022651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2023a23d5eceSKris Buschelman 202411a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 2025aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 20262ef1f0ffSBarry Smith You can also run with the option `-info` and look for messages with the string 2027aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 2028aa95bbe8SBarry Smith 20292ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 203049a6f317SBarry Smith 2031*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2032a23d5eceSKris Buschelman @*/ 2033d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 2034d71ae5a4SJacob Faibussowitsch { 2035a23d5eceSKris Buschelman PetscFunctionBegin; 20366ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 20376ba663aaSJed Brown PetscValidType(B, 1); 20386ba663aaSJed Brown PetscValidLogicalCollectiveInt(B, bs, 2); 2039cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocation_C", (Mat, PetscInt, PetscInt, const PetscInt[]), (B, bs, nz, nnz)); 20403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2041a23d5eceSKris Buschelman } 204249b5e25fSSatish Balay 204338f409ebSLisandro Dalcin /*@C 204411a5261eSBarry Smith MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in `MATSEQSBAIJ` format using the given nonzero structure and (optional) numerical values 204538f409ebSLisandro Dalcin 204638f409ebSLisandro Dalcin Input Parameters: 20471c4f3114SJed Brown + B - the matrix 2048eab78319SHong Zhang . bs - size of block, the blocks are ALWAYS square. 204938f409ebSLisandro Dalcin . i - the indices into j for the start of each local row (starts with zero) 205038f409ebSLisandro Dalcin . j - the column indices for each local row (starts with zero) these must be sorted for each row 205138f409ebSLisandro Dalcin - v - optional values in the matrix 205238f409ebSLisandro Dalcin 2053664954b6SBarry Smith Level: advanced 205438f409ebSLisandro Dalcin 205538f409ebSLisandro Dalcin Notes: 205611a5261eSBarry Smith The order of the entries in values is specified by the `MatOption` `MAT_ROW_ORIENTED`. For example, C programs 205711a5261eSBarry Smith may want to use the default `MAT_ROW_ORIENTED` = `PETSC_TRUE` and use an array v[nnz][bs][bs] where the second index is 205838f409ebSLisandro Dalcin over rows within a block and the last index is over columns within a block row. Fortran programs will likely set 205911a5261eSBarry Smith `MAT_ROW_ORIENTED` = `PETSC_FALSE` and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a 206038f409ebSLisandro Dalcin block column and the second index is over columns within a block. 206138f409ebSLisandro Dalcin 206250c5228eSBarry Smith Any entries below the diagonal are ignored 20630cd7f59aSBarry Smith 20640cd7f59aSBarry Smith Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries 20650cd7f59aSBarry Smith and usually the numerical values as well 2066664954b6SBarry Smith 2067*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqSBAIJ()`, `MatSetValuesBlocked()`, `MatSeqSBAIJSetPreallocation()`, `MATSEQSBAIJ` 206838f409ebSLisandro Dalcin @*/ 2069d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B, PetscInt bs, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 2070d71ae5a4SJacob Faibussowitsch { 207138f409ebSLisandro Dalcin PetscFunctionBegin; 207238f409ebSLisandro Dalcin PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 207338f409ebSLisandro Dalcin PetscValidType(B, 1); 207438f409ebSLisandro Dalcin PetscValidLogicalCollectiveInt(B, bs, 2); 2075cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocationCSR_C", (Mat, PetscInt, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, bs, i, j, v)); 20763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 207738f409ebSLisandro Dalcin } 207838f409ebSLisandro Dalcin 2079c464158bSHong Zhang /*@C 20802ef1f0ffSBarry Smith MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in (block 208111a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 20822ef1f0ffSBarry Smith user should preallocate the matrix storage by setting the parameter `nz` 20832ef1f0ffSBarry Smith (or the array `nnz`). 208449b5e25fSSatish Balay 2085d083f849SBarry Smith Collective 2086c464158bSHong Zhang 2087c464158bSHong Zhang Input Parameters: 208811a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 208911a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 2090bb7ae925SBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs() 209120f4b53cSBarry Smith . m - number of rows 209220f4b53cSBarry Smith . n - number of columns 2093c464158bSHong Zhang . nz - number of block nonzeros per block row (same for all rows) 2094744e8345SSatish Balay - nnz - array containing the number of block nonzeros in the upper triangular plus 20952ef1f0ffSBarry Smith diagonal portion of each block (possibly different for each block row) or `NULL` 2096c464158bSHong Zhang 2097c464158bSHong Zhang Output Parameter: 2098c464158bSHong Zhang . A - the symmetric matrix 2099c464158bSHong Zhang 2100c464158bSHong Zhang Options Database Keys: 2101a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2102c464158bSHong Zhang block calculations (much slower) 2103a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use 2104c464158bSHong Zhang 2105c464158bSHong Zhang Level: intermediate 2106c464158bSHong Zhang 21072ef1f0ffSBarry Smith Notes: 210811a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 2109f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 211011a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 2111175b88e8SBarry Smith 21126d6d819aSHong Zhang The number of rows and columns must be divisible by blocksize. 21136d6d819aSHong Zhang This matrix type does not support complex Hermitian operation. 2114c464158bSHong Zhang 21152ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 21162ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 2117651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2118c464158bSHong Zhang 21192ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 212049a6f317SBarry Smith 2121*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2122c464158bSHong Zhang @*/ 2123d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 2124d71ae5a4SJacob Faibussowitsch { 2125c464158bSHong Zhang PetscFunctionBegin; 21269566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 21279566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 21289566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQSBAIJ)); 21299566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*A, bs, nz, (PetscInt *)nnz)); 21303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 213149b5e25fSSatish Balay } 213249b5e25fSSatish Balay 2133d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 2134d71ae5a4SJacob Faibussowitsch { 213549b5e25fSSatish Balay Mat C; 213649b5e25fSSatish Balay Mat_SeqSBAIJ *c, *a = (Mat_SeqSBAIJ *)A->data; 2137b40805acSSatish Balay PetscInt i, mbs = a->mbs, nz = a->nz, bs2 = a->bs2; 213849b5e25fSSatish Balay 213949b5e25fSSatish Balay PetscFunctionBegin; 214031fe6a7dSBarry Smith PetscCheck(A->assembled, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 214108401ef6SPierre Jolivet PetscCheck(a->i[mbs] == nz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Corrupt matrix"); 214249b5e25fSSatish Balay 2143f4259b30SLisandro Dalcin *B = NULL; 21449566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 21459566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->rmap->N, A->cmap->n, A->rmap->N, A->cmap->n)); 21469566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, A)); 21479566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATSEQSBAIJ)); 2148692f9cbeSHong Zhang c = (Mat_SeqSBAIJ *)C->data; 2149692f9cbeSHong Zhang 2150273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2151d5f3da31SBarry Smith C->factortype = A->factortype; 2152f4259b30SLisandro Dalcin c->row = NULL; 2153f4259b30SLisandro Dalcin c->icol = NULL; 2154f4259b30SLisandro Dalcin c->saved_values = NULL; 2155a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 215649b5e25fSSatish Balay C->assembled = PETSC_TRUE; 215749b5e25fSSatish Balay 21589566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 21599566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 216049b5e25fSSatish Balay c->bs2 = a->bs2; 216149b5e25fSSatish Balay c->mbs = a->mbs; 216249b5e25fSSatish Balay c->nbs = a->nbs; 216349b5e25fSSatish Balay 2164c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2165c760cd28SBarry Smith c->imax = a->imax; 2166c760cd28SBarry Smith c->ilen = a->ilen; 2167c760cd28SBarry Smith c->free_imax_ilen = PETSC_FALSE; 2168c760cd28SBarry Smith } else { 21699566063dSJacob Faibussowitsch PetscCall(PetscMalloc2((mbs + 1), &c->imax, (mbs + 1), &c->ilen)); 217049b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 217149b5e25fSSatish Balay c->imax[i] = a->imax[i]; 217249b5e25fSSatish Balay c->ilen[i] = a->ilen[i]; 217349b5e25fSSatish Balay } 2174c760cd28SBarry Smith c->free_imax_ilen = PETSC_TRUE; 2175c760cd28SBarry Smith } 217649b5e25fSSatish Balay 217749b5e25fSSatish Balay /* allocate the matrix space */ 21784da8f245SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 21799566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2 * nz, &c->a)); 218044e1c64aSLisandro Dalcin c->i = a->i; 218144e1c64aSLisandro Dalcin c->j = a->j; 21824da8f245SBarry Smith c->singlemalloc = PETSC_FALSE; 218344e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21844da8f245SBarry Smith c->free_ij = PETSC_FALSE; 21854da8f245SBarry Smith c->parent = A; 21869566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)A)); 21879566063dSJacob Faibussowitsch PetscCall(MatSetOption(A, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21889566063dSJacob Faibussowitsch PetscCall(MatSetOption(C, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21894da8f245SBarry Smith } else { 21909566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &c->a, nz, &c->j, mbs + 1, &c->i)); 21919566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, mbs + 1)); 21924da8f245SBarry Smith c->singlemalloc = PETSC_TRUE; 219344e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21944da8f245SBarry Smith c->free_ij = PETSC_TRUE; 21954da8f245SBarry Smith } 219649b5e25fSSatish Balay if (mbs > 0) { 219748a46eb9SPierre Jolivet if (cpvalues != MAT_SHARE_NONZERO_PATTERN) PetscCall(PetscArraycpy(c->j, a->j, nz)); 219849b5e25fSSatish Balay if (cpvalues == MAT_COPY_VALUES) { 21999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, a->a, bs2 * nz)); 220049b5e25fSSatish Balay } else { 22019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, bs2 * nz)); 220249b5e25fSSatish Balay } 2203a1c3900fSBarry Smith if (a->jshort) { 220444e1c64aSLisandro Dalcin /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */ 220544e1c64aSLisandro Dalcin /* if the parent matrix is reassembled, this child matrix will never notice */ 22069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &c->jshort)); 22079566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->jshort, a->jshort, nz)); 220826fbe8dcSKarl Rupp 22094da8f245SBarry Smith c->free_jshort = PETSC_TRUE; 22104da8f245SBarry Smith } 2211a1c3900fSBarry Smith } 221249b5e25fSSatish Balay 221349b5e25fSSatish Balay c->roworiented = a->roworiented; 221449b5e25fSSatish Balay c->nonew = a->nonew; 221549b5e25fSSatish Balay 221649b5e25fSSatish Balay if (a->diag) { 2217c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2218c760cd28SBarry Smith c->diag = a->diag; 2219c760cd28SBarry Smith c->free_diag = PETSC_FALSE; 2220c760cd28SBarry Smith } else { 22219566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mbs, &c->diag)); 222226fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) c->diag[i] = a->diag[i]; 2223c760cd28SBarry Smith c->free_diag = PETSC_TRUE; 2224c760cd28SBarry Smith } 222544e1c64aSLisandro Dalcin } 22266c6c5352SBarry Smith c->nz = a->nz; 2227f2cbd3d5SJed Brown c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 2228f4259b30SLisandro Dalcin c->solve_work = NULL; 2229f4259b30SLisandro Dalcin c->mult_work = NULL; 223026fbe8dcSKarl Rupp 223149b5e25fSSatish Balay *B = C; 22329566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 22333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 223449b5e25fSSatish Balay } 223549b5e25fSSatish Balay 2236618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */ 2237618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary 2238618cc2edSLisandro Dalcin 2239d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqSBAIJ(Mat mat, PetscViewer viewer) 2240d71ae5a4SJacob Faibussowitsch { 22417f489da9SVaclav Hapla PetscBool isbinary; 22422f480046SShri Abhyankar 22432f480046SShri Abhyankar PetscFunctionBegin; 22449566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 224528b400f6SJacob Faibussowitsch PetscCheck(isbinary, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)mat)->type_name); 22469566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqSBAIJ_Binary(mat, viewer)); 22473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22482f480046SShri Abhyankar } 22492f480046SShri Abhyankar 2250c75a6043SHong Zhang /*@ 225111a5261eSBarry Smith MatCreateSeqSBAIJWithArrays - Creates an sequential `MATSEQSBAIJ` matrix using matrix elements 2252c75a6043SHong Zhang (upper triangular entries in CSR format) provided by the user. 2253c75a6043SHong Zhang 2254d083f849SBarry Smith Collective 2255c75a6043SHong Zhang 2256c75a6043SHong Zhang Input Parameters: 2257c75a6043SHong Zhang + comm - must be an MPI communicator of size 1 2258c75a6043SHong Zhang . bs - size of block 2259c75a6043SHong Zhang . m - number of rows 2260c75a6043SHong Zhang . n - number of columns 2261483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that row block row of the matrix 2262c75a6043SHong Zhang . j - column indices 2263c75a6043SHong Zhang - a - matrix values 2264c75a6043SHong Zhang 2265c75a6043SHong Zhang Output Parameter: 2266c75a6043SHong Zhang . mat - the matrix 2267c75a6043SHong Zhang 2268dfb205c3SBarry Smith Level: advanced 2269c75a6043SHong Zhang 2270c75a6043SHong Zhang Notes: 22712ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 2272c75a6043SHong Zhang once the matrix is destroyed 2273c75a6043SHong Zhang 2274c75a6043SHong Zhang You cannot set new nonzero locations into this matrix, that will generate an error. 2275c75a6043SHong Zhang 22762ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 2277c75a6043SHong Zhang 22782ef1f0ffSBarry Smith When block size is greater than 1 the matrix values must be stored using the `MATSBAIJ` storage format. For block size of 1 2279dfb205c3SBarry Smith it is the regular CSR format excluding the lower triangular elements. 2280dfb205c3SBarry Smith 2281*1cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSBAIJ()`, `MatCreateSeqSBAIJ()` 2282c75a6043SHong Zhang @*/ 2283d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 2284d71ae5a4SJacob Faibussowitsch { 2285c75a6043SHong Zhang PetscInt ii; 2286c75a6043SHong Zhang Mat_SeqSBAIJ *sbaij; 2287c75a6043SHong Zhang 2288c75a6043SHong Zhang PetscFunctionBegin; 228908401ef6SPierre Jolivet PetscCheck(bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "block size %" PetscInt_FMT " > 1 is not supported yet", bs); 2290aed4548fSBarry Smith PetscCheck(m == 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 2291c75a6043SHong Zhang 22929566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 22939566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 22949566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQSBAIJ)); 22959566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*mat, bs, MAT_SKIP_ALLOCATION, NULL)); 2296c75a6043SHong Zhang sbaij = (Mat_SeqSBAIJ *)(*mat)->data; 22979566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(m, &sbaij->imax, m, &sbaij->ilen)); 2298c75a6043SHong Zhang 2299c75a6043SHong Zhang sbaij->i = i; 2300c75a6043SHong Zhang sbaij->j = j; 2301c75a6043SHong Zhang sbaij->a = a; 230226fbe8dcSKarl Rupp 2303c75a6043SHong Zhang sbaij->singlemalloc = PETSC_FALSE; 2304c75a6043SHong Zhang sbaij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 2305e6b907acSBarry Smith sbaij->free_a = PETSC_FALSE; 2306e6b907acSBarry Smith sbaij->free_ij = PETSC_FALSE; 2307ddf7884eSMatthew Knepley sbaij->free_imax_ilen = PETSC_TRUE; 2308c75a6043SHong Zhang 2309c75a6043SHong Zhang for (ii = 0; ii < m; ii++) { 2310c75a6043SHong Zhang sbaij->ilen[ii] = sbaij->imax[ii] = i[ii + 1] - i[ii]; 23116bdcaf15SBarry Smith PetscCheck(i[ii + 1] >= i[ii], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 2312c75a6043SHong Zhang } 231376bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 2314c75a6043SHong Zhang for (ii = 0; ii < sbaij->i[m]; ii++) { 23156bdcaf15SBarry Smith PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 23166bdcaf15SBarry Smith PetscCheck(j[ii] < n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index too large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 2317c75a6043SHong Zhang } 231876bd3646SJed Brown } 2319c75a6043SHong Zhang 23209566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 23219566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 23223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2323c75a6043SHong Zhang } 2324d06b337dSHong Zhang 2325d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 2326d71ae5a4SJacob Faibussowitsch { 232759f5e6ceSHong Zhang PetscFunctionBegin; 23289566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm, inmat, n, scall, outmat)); 23293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 233059f5e6ceSHong Zhang } 2331