149b5e25fSSatish Balay 249b5e25fSSatish Balay /* 3a1373b80SHong Zhang Defines the basic matrix operations for the SBAIJ (compressed row) 449b5e25fSSatish Balay matrix storage format. 549b5e25fSSatish Balay */ 6c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 8c6db04a5SJed Brown #include <petscblaslapack.h> 949b5e25fSSatish Balay 10c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1170dcbbb9SBarry Smith #define USESHORT 12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1370dcbbb9SBarry Smith 1426cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1526cec326SBarry Smith #define TYPE SBAIJ 1626cec326SBarry Smith #define TYPE_SBAIJ 1726cec326SBarry Smith #define TYPE_BS 1826cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1926cec326SBarry Smith #undef TYPE_BS 2026cec326SBarry Smith #define TYPE_BS _BS 2126cec326SBarry Smith #define TYPE_BS_ON 2226cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 2326cec326SBarry Smith #undef TYPE_BS 2426cec326SBarry Smith #undef TYPE_SBAIJ 2526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 2626cec326SBarry Smith #undef TYPE 2726cec326SBarry Smith #undef TYPE_BS_ON 2826cec326SBarry Smith 296214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 30cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 316214f412SHong Zhang #endif 32d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 33d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 34d24d4204SJose E. Roman #endif 3528d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat, MatType, MatReuse, Mat *); 36b5b17502SBarry Smith 3749b5e25fSSatish Balay /* 3849b5e25fSSatish Balay Checks for missing diagonals 3949b5e25fSSatish Balay */ 40d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A, PetscBool *missing, PetscInt *dd) 41d71ae5a4SJacob Faibussowitsch { 42045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 437734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 4449b5e25fSSatish Balay 4549b5e25fSSatish Balay PetscFunctionBegin; 469566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(A)); 472af78befSBarry Smith *missing = PETSC_FALSE; 487734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 49358d2f5dSShri Abhyankar *missing = PETSC_TRUE; 50358d2f5dSShri Abhyankar if (dd) *dd = 0; 519566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 52358d2f5dSShri Abhyankar } else { 53358d2f5dSShri Abhyankar diag = a->diag; 5449b5e25fSSatish Balay for (i = 0; i < a->mbs; i++) { 557734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 562af78befSBarry Smith *missing = PETSC_TRUE; 572af78befSBarry Smith if (dd) *dd = i; 582af78befSBarry Smith break; 592af78befSBarry Smith } 6049b5e25fSSatish Balay } 61358d2f5dSShri Abhyankar } 623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6349b5e25fSSatish Balay } 6449b5e25fSSatish Balay 65d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A) 66d71ae5a4SJacob Faibussowitsch { 67045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 6848dd3d27SHong Zhang PetscInt i, j; 6949b5e25fSSatish Balay 7049b5e25fSSatish Balay PetscFunctionBegin; 7109f38230SBarry Smith if (!a->diag) { 729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->mbs, &a->diag)); 73c760cd28SBarry Smith a->free_diag = PETSC_TRUE; 7409f38230SBarry Smith } 7548dd3d27SHong Zhang for (i = 0; i < a->mbs; i++) { 7648dd3d27SHong Zhang a->diag[i] = a->i[i + 1]; 7748dd3d27SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 7848dd3d27SHong Zhang if (a->j[j] == i) { 7948dd3d27SHong Zhang a->diag[i] = j; 8048dd3d27SHong Zhang break; 8148dd3d27SHong Zhang } 8248dd3d27SHong Zhang } 8348dd3d27SHong Zhang } 843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8549b5e25fSSatish Balay } 8649b5e25fSSatish Balay 87d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *inia[], const PetscInt *inja[], PetscBool *done) 88d71ae5a4SJacob Faibussowitsch { 89a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 902462f5fdSStefano Zampini PetscInt i, j, n = a->mbs, nz = a->i[n], *tia, *tja, bs = A->rmap->bs, k, l, cnt; 912462f5fdSStefano Zampini PetscInt **ia = (PetscInt **)inia, **ja = (PetscInt **)inja; 9249b5e25fSSatish Balay 9349b5e25fSSatish Balay PetscFunctionBegin; 94d3e5a4abSHong Zhang *nn = n; 953ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 962462f5fdSStefano Zampini if (symmetric) { 979566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(n, a->i, a->j, PETSC_FALSE, 0, 0, &tia, &tja)); 982462f5fdSStefano Zampini nz = tia[n]; 992462f5fdSStefano Zampini } else { 1009371c9d4SSatish Balay tia = a->i; 1019371c9d4SSatish Balay tja = a->j; 1022462f5fdSStefano Zampini } 1032462f5fdSStefano Zampini 1042462f5fdSStefano Zampini if (!blockcompressed && bs > 1) { 1052462f5fdSStefano Zampini (*nn) *= bs; 1068f7157efSSatish Balay /* malloc & create the natural set of indices */ 1079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1((n + 1) * bs, ia)); 1082462f5fdSStefano Zampini if (n) { 1092462f5fdSStefano Zampini (*ia)[0] = oshift; 110ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[j] = (tia[1] - tia[0]) * bs + (*ia)[j - 1]; 1112462f5fdSStefano Zampini } 1122462f5fdSStefano Zampini 1132462f5fdSStefano Zampini for (i = 1; i < n; i++) { 1142462f5fdSStefano Zampini (*ia)[i * bs] = (tia[i] - tia[i - 1]) * bs + (*ia)[i * bs - 1]; 115ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[i * bs + j] = (tia[i + 1] - tia[i]) * bs + (*ia)[i * bs + j - 1]; 1162462f5fdSStefano Zampini } 117ad540459SPierre Jolivet if (n) (*ia)[n * bs] = (tia[n] - tia[n - 1]) * bs + (*ia)[n * bs - 1]; 1182462f5fdSStefano Zampini 1192462f5fdSStefano Zampini if (inja) { 1209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz * bs * bs, ja)); 1212462f5fdSStefano Zampini cnt = 0; 1222462f5fdSStefano Zampini for (i = 0; i < n; i++) { 1238f7157efSSatish Balay for (j = 0; j < bs; j++) { 1242462f5fdSStefano Zampini for (k = tia[i]; k < tia[i + 1]; k++) { 125ad540459SPierre Jolivet for (l = 0; l < bs; l++) (*ja)[cnt++] = bs * tja[k] + l; 1268f7157efSSatish Balay } 1278f7157efSSatish Balay } 1288f7157efSSatish Balay } 1298f7157efSSatish Balay } 1302462f5fdSStefano Zampini 1312462f5fdSStefano Zampini if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */ 1329566063dSJacob Faibussowitsch PetscCall(PetscFree(tia)); 1339566063dSJacob Faibussowitsch PetscCall(PetscFree(tja)); 1342462f5fdSStefano Zampini } 1352462f5fdSStefano Zampini } else if (oshift == 1) { 1362462f5fdSStefano Zampini if (symmetric) { 1372462f5fdSStefano Zampini nz = tia[A->rmap->n / bs]; 1382462f5fdSStefano Zampini /* add 1 to i and j indices */ 1392462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) tia[i] = tia[i] + 1; 1402462f5fdSStefano Zampini *ia = tia; 1412462f5fdSStefano Zampini if (ja) { 1422462f5fdSStefano Zampini for (i = 0; i < nz; i++) tja[i] = tja[i] + 1; 1432462f5fdSStefano Zampini *ja = tja; 1442462f5fdSStefano Zampini } 1452462f5fdSStefano Zampini } else { 1462462f5fdSStefano Zampini nz = a->i[A->rmap->n / bs]; 1472462f5fdSStefano Zampini /* malloc space and add 1 to i and j indices */ 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n / bs + 1, ia)); 1492462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) (*ia)[i] = a->i[i] + 1; 1502462f5fdSStefano Zampini if (ja) { 1519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, ja)); 1522462f5fdSStefano Zampini for (i = 0; i < nz; i++) (*ja)[i] = a->j[i] + 1; 1532462f5fdSStefano Zampini } 1542462f5fdSStefano Zampini } 1552462f5fdSStefano Zampini } else { 1562462f5fdSStefano Zampini *ia = tia; 1572462f5fdSStefano Zampini if (ja) *ja = tja; 158a6ece127SHong Zhang } 1593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16049b5e25fSSatish Balay } 16149b5e25fSSatish Balay 162d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 163d71ae5a4SJacob Faibussowitsch { 16449b5e25fSSatish Balay PetscFunctionBegin; 1653ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 1662462f5fdSStefano Zampini if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) { 1679566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 1689566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 169a6ece127SHong Zhang } 1703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17149b5e25fSSatish Balay } 17249b5e25fSSatish Balay 173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqSBAIJ(Mat A) 174d71ae5a4SJacob Faibussowitsch { 17549b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 17649b5e25fSSatish Balay 17749b5e25fSSatish Balay PetscFunctionBegin; 178*b4e2f619SBarry Smith if (A->hash_active) { 179*b4e2f619SBarry Smith PetscInt bs; 180*b4e2f619SBarry Smith PetscCall(PetscMemcpy(&A->ops, &a->cops, sizeof(*(A->ops)))); 181*b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 182*b4e2f619SBarry Smith PetscCall(MatGetBlockSize(A, &bs)); 183*b4e2f619SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&a->bht)); 184*b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 185*b4e2f619SBarry Smith PetscCall(PetscFree(a->bdnz)); 186*b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 187*b4e2f619SBarry Smith } 188a9f03627SSatish Balay #if defined(PETSC_USE_LOG) 1893ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->N, a->nz)); 190a9f03627SSatish Balay #endif 1919566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 1929566063dSJacob Faibussowitsch if (a->free_diag) PetscCall(PetscFree(a->diag)); 1939566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1949566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1959566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 1969566063dSJacob Faibussowitsch PetscCall(PetscFree(a->idiag)); 1979566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inode.size)); 1989566063dSJacob Faibussowitsch if (a->free_imax_ilen) PetscCall(PetscFree2(a->imax, a->ilen)); 1999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 2009566063dSJacob Faibussowitsch PetscCall(PetscFree(a->sor_work)); 2019566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solves_work)); 2029566063dSJacob Faibussowitsch PetscCall(PetscFree(a->mult_work)); 2039566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 2049566063dSJacob Faibussowitsch if (a->free_jshort) PetscCall(PetscFree(a->jshort)); 2059566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inew)); 2069566063dSJacob Faibussowitsch PetscCall(MatDestroy(&a->parent)); 2079566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 208901853e0SKris Buschelman 2099566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 2102e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJGetArray_C", NULL)); 2112e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJRestoreArray_C", NULL)); 2129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 2139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 2149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetColumnIndices_C", NULL)); 2159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqaij_C", NULL)); 2169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqbaij_C", NULL)); 2179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocation_C", NULL)); 2189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocationCSR_C", NULL)); 2196214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_elemental_C", NULL)); 2216214f412SHong Zhang #endif 222d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 2239566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_scalapack_C", NULL)); 224d24d4204SJose E. Roman #endif 2252e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 2263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22749b5e25fSSatish Balay } 22849b5e25fSSatish Balay 229d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqSBAIJ(Mat A, MatOption op, PetscBool flg) 230d71ae5a4SJacob Faibussowitsch { 231045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 232eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 233eb1ec7c1SStefano Zampini PetscInt bs; 234eb1ec7c1SStefano Zampini #endif 23549b5e25fSSatish Balay 23649b5e25fSSatish Balay PetscFunctionBegin; 237eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 2389566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 239eb1ec7c1SStefano Zampini #endif 2404d9d31abSKris Buschelman switch (op) { 241d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 242d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 243d71ae5a4SJacob Faibussowitsch break; 244d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 245d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 246d71ae5a4SJacob Faibussowitsch break; 247d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 248d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 249d71ae5a4SJacob Faibussowitsch break; 250d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 251d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 252d71ae5a4SJacob Faibussowitsch break; 253d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 254d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 255d71ae5a4SJacob Faibussowitsch break; 256d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 257d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 258d71ae5a4SJacob Faibussowitsch break; 2598c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 2604d9d31abSKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 2614d9d31abSKris Buschelman case MAT_USE_HASH_TABLE: 262d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 263d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 264d71ae5a4SJacob Faibussowitsch break; 2659a4540c5SBarry Smith case MAT_HERMITIAN: 266eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 267eb1ec7c1SStefano Zampini if (flg) { /* disable transpose ops */ 26808401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for Hermitian with block size greater than 1"); 269eb1ec7c1SStefano Zampini A->ops->multtranspose = NULL; 270eb1ec7c1SStefano Zampini A->ops->multtransposeadd = NULL; 271b94d7dedSBarry Smith A->symmetric = PETSC_BOOL3_FALSE; 272eb1ec7c1SStefano Zampini } 2730f2140c7SStefano Zampini #endif 274eeffb40dSHong Zhang break; 27577e54ba9SKris Buschelman case MAT_SYMMETRIC: 276eb1ec7c1SStefano Zampini case MAT_SPD: 277eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 278eb1ec7c1SStefano Zampini if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */ 279eb1ec7c1SStefano Zampini A->ops->multtranspose = A->ops->mult; 280eb1ec7c1SStefano Zampini A->ops->multtransposeadd = A->ops->multadd; 281eb1ec7c1SStefano Zampini } 282eb1ec7c1SStefano Zampini #endif 283eb1ec7c1SStefano Zampini break; 284eb1ec7c1SStefano Zampini /* These options are handled directly by MatSetOption() */ 28577e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 2869a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 287b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 288672ba085SHong Zhang case MAT_STRUCTURE_ONLY: 289b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 2904dcd73b1SHong Zhang /* These options are handled directly by MatSetOption() */ 291290bbb0aSBarry Smith break; 292d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_LOWER_TRIANGULAR: 293d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 294d71ae5a4SJacob Faibussowitsch break; 295d71ae5a4SJacob Faibussowitsch case MAT_ERROR_LOWER_TRIANGULAR: 296d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 297d71ae5a4SJacob Faibussowitsch break; 298d71ae5a4SJacob Faibussowitsch case MAT_GETROW_UPPERTRIANGULAR: 299d71ae5a4SJacob Faibussowitsch a->getrow_utriangular = flg; 300d71ae5a4SJacob Faibussowitsch break; 301d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 302d71ae5a4SJacob Faibussowitsch break; 303d71ae5a4SJacob Faibussowitsch default: 304d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 30549b5e25fSSatish Balay } 3063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 30749b5e25fSSatish Balay } 30849b5e25fSSatish Balay 309d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 310d71ae5a4SJacob Faibussowitsch { 31149b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 31249b5e25fSSatish Balay 31349b5e25fSSatish Balay PetscFunctionBegin; 31408401ef6SPierre Jolivet PetscCheck(!A || a->getrow_utriangular, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatGetRow is not supported for SBAIJ matrix format. Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()"); 31552768537SHong Zhang 316f5edf698SHong Zhang /* Get the upper triangular part of the row */ 3179566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqBAIJ_private(A, row, nz, idx, v, a->i, a->j, a->a)); 3183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 31949b5e25fSSatish Balay } 32049b5e25fSSatish Balay 321d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 322d71ae5a4SJacob Faibussowitsch { 32349b5e25fSSatish Balay PetscFunctionBegin; 324cb4a9cd9SHong Zhang if (nz) *nz = 0; 3259566063dSJacob Faibussowitsch if (idx) PetscCall(PetscFree(*idx)); 3269566063dSJacob Faibussowitsch if (v) PetscCall(PetscFree(*v)); 3273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 32849b5e25fSSatish Balay } 32949b5e25fSSatish Balay 330d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A) 331d71ae5a4SJacob Faibussowitsch { 332f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 333f5edf698SHong Zhang 334f5edf698SHong Zhang PetscFunctionBegin; 335f5edf698SHong Zhang a->getrow_utriangular = PETSC_TRUE; 3363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 337f5edf698SHong Zhang } 338a323099bSStefano Zampini 339d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A) 340d71ae5a4SJacob Faibussowitsch { 341f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 342f5edf698SHong Zhang 343f5edf698SHong Zhang PetscFunctionBegin; 344f5edf698SHong Zhang a->getrow_utriangular = PETSC_FALSE; 3453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 346f5edf698SHong Zhang } 347f5edf698SHong Zhang 348d71ae5a4SJacob Faibussowitsch PetscErrorCode MatTranspose_SeqSBAIJ(Mat A, MatReuse reuse, Mat *B) 349d71ae5a4SJacob Faibussowitsch { 35049b5e25fSSatish Balay PetscFunctionBegin; 3517fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 352cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 3539566063dSJacob Faibussowitsch PetscCall(MatDuplicate(A, MAT_COPY_VALUES, B)); 354cf37664fSBarry Smith } else if (reuse == MAT_REUSE_MATRIX) { 3559566063dSJacob Faibussowitsch PetscCall(MatCopy(A, *B, SAME_NONZERO_PATTERN)); 356fc4dec0aSBarry Smith } 3573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 35849b5e25fSSatish Balay } 35949b5e25fSSatish Balay 360d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A, PetscViewer viewer) 361d71ae5a4SJacob Faibussowitsch { 36249b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 363d0f46423SBarry Smith PetscInt i, j, bs = A->rmap->bs, k, l, bs2 = a->bs2; 364f3ef73ceSBarry Smith PetscViewerFormat format; 365121deb67SSatish Balay PetscInt *diag; 366b3a0534dSBarry Smith const char *matname; 36749b5e25fSSatish Balay 36849b5e25fSSatish Balay PetscFunctionBegin; 3699566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 370456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 3719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " block size is %" PetscInt_FMT "\n", bs)); 372fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_MATLAB) { 373d2507d54SMatthew Knepley Mat aij; 374ade3a672SBarry Smith 375d5f3da31SBarry Smith if (A->factortype && bs > 1) { 3769566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "Warning: matrix is factored with bs>1. MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n")); 3773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 37870d5e725SHong Zhang } 3799566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &aij)); 38023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 38123a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)aij, matname)); 38223a3927dSBarry Smith PetscCall(MatView_SeqAIJ(aij, viewer)); 3839566063dSJacob Faibussowitsch PetscCall(MatDestroy(&aij)); 384fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 385b3a0534dSBarry Smith Mat B; 386b3a0534dSBarry Smith 387b3a0534dSBarry Smith PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 388b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 389b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 390b3a0534dSBarry Smith PetscCall(MatView_SeqAIJ(B, viewer)); 391b3a0534dSBarry Smith PetscCall(MatDestroy(&B)); 392c1490034SHong Zhang } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) { 3933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 39449b5e25fSSatish Balay } else { 3959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 3962c990fa1SHong Zhang if (A->factortype) { /* for factored matrix */ 39708401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "matrix is factored with bs>1. Not implemented yet"); 3982c990fa1SHong Zhang 399121deb67SSatish Balay diag = a->diag; 400121deb67SSatish Balay for (i = 0; i < a->mbs; i++) { /* for row block i */ 4019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 4022c990fa1SHong Zhang /* diagonal entry */ 4032c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 4042c990fa1SHong Zhang if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) { 4059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), (double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 4062c990fa1SHong Zhang } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) { 4079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), -(double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 4082c990fa1SHong Zhang } else { 4099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]))); 4102c990fa1SHong Zhang } 4112c990fa1SHong Zhang #else 4129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)(1.0 / a->a[diag[i]]))); 4132c990fa1SHong Zhang #endif 4142c990fa1SHong Zhang /* off-diagonal entries */ 4152c990fa1SHong Zhang for (k = a->i[i]; k < a->i[i + 1] - 1; k++) { 4162c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 417ca0704adSBarry Smith if (PetscImaginaryPart(a->a[k]) > 0.0) { 4189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), (double)PetscImaginaryPart(a->a[k]))); 419ca0704adSBarry Smith } else if (PetscImaginaryPart(a->a[k]) < 0.0) { 4209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), -(double)PetscImaginaryPart(a->a[k]))); 4212c990fa1SHong Zhang } else { 4229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k], (double)PetscRealPart(a->a[k]))); 4232c990fa1SHong Zhang } 4242c990fa1SHong Zhang #else 4259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[k], (double)a->a[k])); 4262c990fa1SHong Zhang #endif 4272c990fa1SHong Zhang } 4289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 4292c990fa1SHong Zhang } 4302c990fa1SHong Zhang 4312c990fa1SHong Zhang } else { /* for non-factored matrix */ 4320c74a584SJed Brown for (i = 0; i < a->mbs; i++) { /* for row block i */ 4330c74a584SJed Brown for (j = 0; j < bs; j++) { /* for row bs*i + j */ 4349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i * bs + j)); 4350c74a584SJed Brown for (k = a->i[i]; k < a->i[i + 1]; k++) { /* for column block */ 4360c74a584SJed Brown for (l = 0; l < bs; l++) { /* for column */ 43749b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 43849b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) > 0.0) { 4399371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), (double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 44049b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) < 0.0) { 4419371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), -(double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 44249b5e25fSSatish Balay } else { 4439566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]))); 44449b5e25fSSatish Balay } 44549b5e25fSSatish Balay #else 4469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)a->a[bs2 * k + l * bs + j])); 44749b5e25fSSatish Balay #endif 44849b5e25fSSatish Balay } 44949b5e25fSSatish Balay } 4509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 45149b5e25fSSatish Balay } 45249b5e25fSSatish Balay } 4532c990fa1SHong Zhang } 4549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 45549b5e25fSSatish Balay } 4569566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 4573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45849b5e25fSSatish Balay } 45949b5e25fSSatish Balay 4609804daf3SBarry Smith #include <petscdraw.h> 461d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 462d71ae5a4SJacob Faibussowitsch { 46349b5e25fSSatish Balay Mat A = (Mat)Aa; 46449b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 465d0f46423SBarry Smith PetscInt row, i, j, k, l, mbs = a->mbs, color, bs = A->rmap->bs, bs2 = a->bs2; 46649b5e25fSSatish Balay PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 46749b5e25fSSatish Balay MatScalar *aa; 468b0a32e0cSBarry Smith PetscViewer viewer; 46949b5e25fSSatish Balay 47049b5e25fSSatish Balay PetscFunctionBegin; 4719566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 4729566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 47349b5e25fSSatish Balay 47449b5e25fSSatish Balay /* loop over matrix elements drawing boxes */ 475383922c3SLisandro Dalcin 476d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 4779566063dSJacob Faibussowitsch PetscCall(PetscDrawString(draw, .3 * (xl + xr), .3 * (yl + yr), PETSC_DRAW_BLACK, "symmetric")); 478383922c3SLisandro Dalcin /* Blue for negative, Cyan for zero and Red for positive */ 479b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 48049b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 48149b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4829371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4839371c9d4SSatish Balay y_r = y_l + 1.0; 4849371c9d4SSatish Balay x_l = a->j[j] * bs; 4859371c9d4SSatish Balay x_r = x_l + 1.0; 48649b5e25fSSatish Balay aa = a->a + j * bs2; 48749b5e25fSSatish Balay for (k = 0; k < bs; k++) { 48849b5e25fSSatish Balay for (l = 0; l < bs; l++) { 48949b5e25fSSatish Balay if (PetscRealPart(*aa++) >= 0.) continue; 4909566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 49149b5e25fSSatish Balay } 49249b5e25fSSatish Balay } 49349b5e25fSSatish Balay } 49449b5e25fSSatish Balay } 495b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 49649b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 49749b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4989371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4999371c9d4SSatish Balay y_r = y_l + 1.0; 5009371c9d4SSatish Balay x_l = a->j[j] * bs; 5019371c9d4SSatish Balay x_r = x_l + 1.0; 50249b5e25fSSatish Balay aa = a->a + j * bs2; 50349b5e25fSSatish Balay for (k = 0; k < bs; k++) { 50449b5e25fSSatish Balay for (l = 0; l < bs; l++) { 50549b5e25fSSatish Balay if (PetscRealPart(*aa++) != 0.) continue; 5069566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 50749b5e25fSSatish Balay } 50849b5e25fSSatish Balay } 50949b5e25fSSatish Balay } 51049b5e25fSSatish Balay } 511b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 51249b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 51349b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 5149371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 5159371c9d4SSatish Balay y_r = y_l + 1.0; 5169371c9d4SSatish Balay x_l = a->j[j] * bs; 5179371c9d4SSatish Balay x_r = x_l + 1.0; 51849b5e25fSSatish Balay aa = a->a + j * bs2; 51949b5e25fSSatish Balay for (k = 0; k < bs; k++) { 52049b5e25fSSatish Balay for (l = 0; l < bs; l++) { 52149b5e25fSSatish Balay if (PetscRealPart(*aa++) <= 0.) continue; 5229566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 52349b5e25fSSatish Balay } 52449b5e25fSSatish Balay } 52549b5e25fSSatish Balay } 52649b5e25fSSatish Balay } 527d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 5283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52949b5e25fSSatish Balay } 53049b5e25fSSatish Balay 531d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A, PetscViewer viewer) 532d71ae5a4SJacob Faibussowitsch { 53349b5e25fSSatish Balay PetscReal xl, yl, xr, yr, w, h; 534b0a32e0cSBarry Smith PetscDraw draw; 535ace3abfcSBarry Smith PetscBool isnull; 53649b5e25fSSatish Balay 53749b5e25fSSatish Balay PetscFunctionBegin; 5389566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 5399566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 5403ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 54149b5e25fSSatish Balay 5429371c9d4SSatish Balay xr = A->rmap->N; 5439371c9d4SSatish Balay yr = A->rmap->N; 5449371c9d4SSatish Balay h = yr / 10.0; 5459371c9d4SSatish Balay w = xr / 10.0; 5469371c9d4SSatish Balay xr += w; 5479371c9d4SSatish Balay yr += h; 5489371c9d4SSatish Balay xl = -w; 5499371c9d4SSatish Balay yl = -h; 5509566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 5519566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 5529566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqSBAIJ_Draw_Zoom, A)); 5539566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 5549566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 5553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55649b5e25fSSatish Balay } 55749b5e25fSSatish Balay 558618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */ 559618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary 560618cc2edSLisandro Dalcin 561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ(Mat A, PetscViewer viewer) 562d71ae5a4SJacob Faibussowitsch { 563618cc2edSLisandro Dalcin PetscBool iascii, isbinary, isdraw; 56449b5e25fSSatish Balay 56549b5e25fSSatish Balay PetscFunctionBegin; 5669566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 5679566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 5689566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 56932077d6dSBarry Smith if (iascii) { 5709566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_ASCII(A, viewer)); 571618cc2edSLisandro Dalcin } else if (isbinary) { 5729566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Binary(A, viewer)); 57349b5e25fSSatish Balay } else if (isdraw) { 5749566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Draw(A, viewer)); 57549b5e25fSSatish Balay } else { 576a5e6ed63SBarry Smith Mat B; 577ade3a672SBarry Smith const char *matname; 5789566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 57923a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 58023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 5819566063dSJacob Faibussowitsch PetscCall(MatView(B, viewer)); 5829566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 58349b5e25fSSatish Balay } 5843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 58549b5e25fSSatish Balay } 58649b5e25fSSatish Balay 587d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 588d71ae5a4SJacob Faibussowitsch { 589045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 59013f74950SBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59113f74950SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 592d0f46423SBarry Smith PetscInt brow, bcol, ridx, cidx, bs = A->rmap->bs, bs2 = a->bs2; 59397e567efSBarry Smith MatScalar *ap, *aa = a->a; 59449b5e25fSSatish Balay 59549b5e25fSSatish Balay PetscFunctionBegin; 59649b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over rows */ 5979371c9d4SSatish Balay row = im[k]; 5989371c9d4SSatish Balay brow = row / bs; 5999371c9d4SSatish Balay if (row < 0) { 6009371c9d4SSatish Balay v += n; 6019371c9d4SSatish Balay continue; 6029371c9d4SSatish Balay } /* negative row */ 60354c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 6049371c9d4SSatish Balay rp = aj + ai[brow]; 6059371c9d4SSatish Balay ap = aa + bs2 * ai[brow]; 60649b5e25fSSatish Balay nrow = ailen[brow]; 60749b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over columns */ 6089371c9d4SSatish Balay if (in[l] < 0) { 6099371c9d4SSatish Balay v++; 6109371c9d4SSatish Balay continue; 6119371c9d4SSatish Balay } /* negative column */ 61254c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 61349b5e25fSSatish Balay col = in[l]; 61449b5e25fSSatish Balay bcol = col / bs; 61549b5e25fSSatish Balay cidx = col % bs; 61649b5e25fSSatish Balay ridx = row % bs; 61749b5e25fSSatish Balay high = nrow; 61849b5e25fSSatish Balay low = 0; /* assume unsorted */ 61949b5e25fSSatish Balay while (high - low > 5) { 62049b5e25fSSatish Balay t = (low + high) / 2; 62149b5e25fSSatish Balay if (rp[t] > bcol) high = t; 62249b5e25fSSatish Balay else low = t; 62349b5e25fSSatish Balay } 62449b5e25fSSatish Balay for (i = low; i < high; i++) { 62549b5e25fSSatish Balay if (rp[i] > bcol) break; 62649b5e25fSSatish Balay if (rp[i] == bcol) { 62749b5e25fSSatish Balay *v++ = ap[bs2 * i + bs * cidx + ridx]; 62849b5e25fSSatish Balay goto finished; 62949b5e25fSSatish Balay } 63049b5e25fSSatish Balay } 63197e567efSBarry Smith *v++ = 0.0; 63249b5e25fSSatish Balay finished:; 63349b5e25fSSatish Balay } 63449b5e25fSSatish Balay } 6353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 63649b5e25fSSatish Balay } 63749b5e25fSSatish Balay 638d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqSBAIJ(Mat A, IS rowp, IS colp, Mat *B) 639d71ae5a4SJacob Faibussowitsch { 640dc29a518SPierre Jolivet Mat C; 641dc29a518SPierre Jolivet 642dc29a518SPierre Jolivet PetscFunctionBegin; 6439566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQBAIJ, MAT_INITIAL_MATRIX, &C)); 6449566063dSJacob Faibussowitsch PetscCall(MatPermute(C, rowp, colp, B)); 6459566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 64648a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatConvert(*B, MATSEQSBAIJ, MAT_INPLACE_MATRIX, B)); 6473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 648dc29a518SPierre Jolivet } 64949b5e25fSSatish Balay 650d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 651d71ae5a4SJacob Faibussowitsch { 6520880e062SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 653e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, jj, row, nrow, i, col, l, rmax, N, lastcol = -1; 65413f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 655d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs2 = a->bs2, bs = A->rmap->bs, stepval; 656ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 657dd6ea824SBarry Smith const PetscScalar *value = v; 658f15d580aSBarry Smith MatScalar *ap, *aa = a->a, *bap; 6590880e062SHong Zhang 66049b5e25fSSatish Balay PetscFunctionBegin; 66126fbe8dcSKarl Rupp if (roworiented) stepval = (n - 1) * bs; 66226fbe8dcSKarl Rupp else stepval = (m - 1) * bs; 66326fbe8dcSKarl Rupp 6640880e062SHong Zhang for (k = 0; k < m; k++) { /* loop over added rows */ 6650880e062SHong Zhang row = im[k]; 6660880e062SHong Zhang if (row < 0) continue; 6676bdcaf15SBarry Smith PetscCheck(row < a->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index row too large %" PetscInt_FMT " max %" PetscInt_FMT, row, a->mbs - 1); 6680880e062SHong Zhang rp = aj + ai[row]; 6690880e062SHong Zhang ap = aa + bs2 * ai[row]; 6700880e062SHong Zhang rmax = imax[row]; 6710880e062SHong Zhang nrow = ailen[row]; 6720880e062SHong Zhang low = 0; 673818f2c47SBarry Smith high = nrow; 6740880e062SHong Zhang for (l = 0; l < n; l++) { /* loop over added columns */ 6750880e062SHong Zhang if (in[l] < 0) continue; 6760880e062SHong Zhang col = in[l]; 6776bdcaf15SBarry Smith PetscCheck(col < a->nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index column too large %" PetscInt_FMT " max %" PetscInt_FMT, col, a->nbs - 1); 678b98bf0e1SJed Brown if (col < row) { 67926fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular block */ 68026fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 681b98bf0e1SJed Brown } 68226fbe8dcSKarl Rupp if (roworiented) value = v + k * (stepval + bs) * bs + l * bs; 68326fbe8dcSKarl Rupp else value = v + l * (stepval + bs) * bs + k * bs; 68426fbe8dcSKarl Rupp 68526fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 68626fbe8dcSKarl Rupp else high = nrow; 68726fbe8dcSKarl Rupp 688e2ee6c50SBarry Smith lastcol = col; 6890880e062SHong Zhang while (high - low > 7) { 6900880e062SHong Zhang t = (low + high) / 2; 6910880e062SHong Zhang if (rp[t] > col) high = t; 6920880e062SHong Zhang else low = t; 6930880e062SHong Zhang } 6940880e062SHong Zhang for (i = low; i < high; i++) { 6950880e062SHong Zhang if (rp[i] > col) break; 6960880e062SHong Zhang if (rp[i] == col) { 6970880e062SHong Zhang bap = ap + bs2 * i; 6980880e062SHong Zhang if (roworiented) { 6990880e062SHong Zhang if (is == ADD_VALUES) { 7000880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 701ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] += *value++; 7020880e062SHong Zhang } 7030880e062SHong Zhang } else { 7040880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 705ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7060880e062SHong Zhang } 7070880e062SHong Zhang } 7080880e062SHong Zhang } else { 7090880e062SHong Zhang if (is == ADD_VALUES) { 7100880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 711ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ += *value++; 7120880e062SHong Zhang } 7130880e062SHong Zhang } else { 7140880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 715ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7160880e062SHong Zhang } 7170880e062SHong Zhang } 7180880e062SHong Zhang } 7190880e062SHong Zhang goto noinsert2; 7200880e062SHong Zhang } 7210880e062SHong Zhang } 7220880e062SHong Zhang if (nonew == 1) goto noinsert2; 72308401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new block index nonzero block (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 724fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 7259371c9d4SSatish Balay N = nrow++ - 1; 7269371c9d4SSatish Balay high++; 7270880e062SHong Zhang /* shift up all the later entries in this row */ 7289566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 7299566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 7309566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 7310880e062SHong Zhang rp[i] = col; 7320880e062SHong Zhang bap = ap + bs2 * i; 7330880e062SHong Zhang if (roworiented) { 7340880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 735ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7360880e062SHong Zhang } 7370880e062SHong Zhang } else { 7380880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 739ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7400880e062SHong Zhang } 7410880e062SHong Zhang } 7420880e062SHong Zhang noinsert2:; 7430880e062SHong Zhang low = i; 7440880e062SHong Zhang } 7450880e062SHong Zhang ailen[row] = nrow; 7460880e062SHong Zhang } 7473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 74849b5e25fSSatish Balay } 74949b5e25fSSatish Balay 75064831d72SBarry Smith /* 75164831d72SBarry Smith This is not yet used 75264831d72SBarry Smith */ 753d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ_SeqAIJ_Inode(Mat A) 754d71ae5a4SJacob Faibussowitsch { 7550def2e27SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 7560def2e27SBarry Smith const PetscInt *ai = a->i, *aj = a->j, *cols; 7570def2e27SBarry Smith PetscInt i = 0, j, blk_size, m = A->rmap->n, node_count = 0, nzx, nzy, *ns, row, nz, cnt, cnt2, *counts; 758ace3abfcSBarry Smith PetscBool flag; 7590def2e27SBarry Smith 7600def2e27SBarry Smith PetscFunctionBegin; 7619566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &ns)); 7620def2e27SBarry Smith while (i < m) { 7630def2e27SBarry Smith nzx = ai[i + 1] - ai[i]; /* Number of nonzeros */ 7640def2e27SBarry Smith /* Limits the number of elements in a node to 'a->inode.limit' */ 7650def2e27SBarry Smith for (j = i + 1, blk_size = 1; j < m && blk_size < a->inode.limit; ++j, ++blk_size) { 7660def2e27SBarry Smith nzy = ai[j + 1] - ai[j]; 7670def2e27SBarry Smith if (nzy != (nzx - j + i)) break; 7689566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aj + ai[i] + j - i, aj + ai[j], nzy, &flag)); 7690def2e27SBarry Smith if (!flag) break; 7700def2e27SBarry Smith } 7710def2e27SBarry Smith ns[node_count++] = blk_size; 77226fbe8dcSKarl Rupp 7730def2e27SBarry Smith i = j; 7740def2e27SBarry Smith } 7750def2e27SBarry Smith if (!a->inode.size && m && node_count > .9 * m) { 7769566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7779566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes out of %" PetscInt_FMT " rows. Not using Inode routines\n", node_count, m)); 7780def2e27SBarry Smith } else { 7790def2e27SBarry Smith a->inode.node_count = node_count; 78026fbe8dcSKarl Rupp 7819566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(node_count, &a->inode.size)); 7829566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->inode.size, ns, node_count)); 7839566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7849566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes of %" PetscInt_FMT ". Limit used: %" PetscInt_FMT ". Using Inode routines\n", node_count, m, a->inode.limit)); 7850def2e27SBarry Smith 7860def2e27SBarry Smith /* count collections of adjacent columns in each inode */ 7870def2e27SBarry Smith row = 0; 7880def2e27SBarry Smith cnt = 0; 7890def2e27SBarry Smith for (i = 0; i < node_count; i++) { 7900def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7910def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 7920def2e27SBarry Smith for (j = 1; j < nz; j++) { 79326fbe8dcSKarl Rupp if (cols[j] != cols[j - 1] + 1) cnt++; 7940def2e27SBarry Smith } 7950def2e27SBarry Smith cnt++; 7960def2e27SBarry Smith row += a->inode.size[i]; 7970def2e27SBarry Smith } 7989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(2 * cnt, &counts)); 7990def2e27SBarry Smith cnt = 0; 8000def2e27SBarry Smith row = 0; 8010def2e27SBarry Smith for (i = 0; i < node_count; i++) { 8020def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 8030def2e27SBarry Smith counts[2 * cnt] = cols[0]; 8040def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 8050def2e27SBarry Smith cnt2 = 1; 8060def2e27SBarry Smith for (j = 1; j < nz; j++) { 8070def2e27SBarry Smith if (cols[j] != cols[j - 1] + 1) { 8080def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 8090def2e27SBarry Smith counts[2 * cnt] = cols[j]; 8100def2e27SBarry Smith cnt2 = 1; 8110def2e27SBarry Smith } else cnt2++; 8120def2e27SBarry Smith } 8130def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 8140def2e27SBarry Smith row += a->inode.size[i]; 8150def2e27SBarry Smith } 8169566063dSJacob Faibussowitsch PetscCall(PetscIntView(2 * cnt, counts, NULL)); 8170def2e27SBarry Smith } 8183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 81938702af4SBarry Smith } 82038702af4SBarry Smith 821d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A, MatAssemblyType mode) 822d71ae5a4SJacob Faibussowitsch { 82349b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 8248f8f2f0dSBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 825d0f46423SBarry Smith PetscInt m = A->rmap->N, *ip, N, *ailen = a->ilen; 82613f74950SBarry Smith PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 82749b5e25fSSatish Balay MatScalar *aa = a->a, *ap; 82849b5e25fSSatish Balay 82949b5e25fSSatish Balay PetscFunctionBegin; 8303ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 83149b5e25fSSatish Balay 83249b5e25fSSatish Balay if (m) rmax = ailen[0]; 83349b5e25fSSatish Balay for (i = 1; i < mbs; i++) { 83449b5e25fSSatish Balay /* move each row back by the amount of empty slots (fshift) before it*/ 83549b5e25fSSatish Balay fshift += imax[i - 1] - ailen[i - 1]; 83649b5e25fSSatish Balay rmax = PetscMax(rmax, ailen[i]); 83749b5e25fSSatish Balay if (fshift) { 838580bdb30SBarry Smith ip = aj + ai[i]; 839580bdb30SBarry Smith ap = aa + bs2 * ai[i]; 84049b5e25fSSatish Balay N = ailen[i]; 8419566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 8429566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2 * N)); 84349b5e25fSSatish Balay } 84449b5e25fSSatish Balay ai[i] = ai[i - 1] + ailen[i - 1]; 84549b5e25fSSatish Balay } 84649b5e25fSSatish Balay if (mbs) { 84749b5e25fSSatish Balay fshift += imax[mbs - 1] - ailen[mbs - 1]; 84849b5e25fSSatish Balay ai[mbs] = ai[mbs - 1] + ailen[mbs - 1]; 84949b5e25fSSatish Balay } 85049b5e25fSSatish Balay /* reset ilen and imax for each row */ 851ad540459SPierre Jolivet for (i = 0; i < mbs; i++) ailen[i] = imax[i] = ai[i + 1] - ai[i]; 8526c6c5352SBarry Smith a->nz = ai[mbs]; 85349b5e25fSSatish Balay 854b424e231SHong Zhang /* diagonals may have moved, reset it */ 8551baa6e33SBarry Smith if (a->diag) PetscCall(PetscArraycpy(a->diag, ai, mbs)); 856aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT " block size %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, A->rmap->bs, fshift * bs2); 85726fbe8dcSKarl Rupp 8589566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT ", block size %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->rmap->N, A->rmap->bs, fshift * bs2, a->nz * bs2)); 8599566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues is %" PetscInt_FMT "\n", a->reallocs)); 8609566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Most nonzeros blocks in any row is %" PetscInt_FMT "\n", rmax)); 86126fbe8dcSKarl Rupp 8628e58a170SBarry Smith A->info.mallocs += a->reallocs; 86349b5e25fSSatish Balay a->reallocs = 0; 86449b5e25fSSatish Balay A->info.nz_unneeded = (PetscReal)fshift * bs2; 865061b2667SBarry Smith a->idiagvalid = PETSC_FALSE; 8664dcd73b1SHong Zhang a->rmax = rmax; 86738702af4SBarry Smith 86838702af4SBarry Smith if (A->cmap->n < 65536 && A->cmap->bs == 1) { 86944e1c64aSLisandro Dalcin if (a->jshort && a->free_jshort) { 87017803ae8SHong Zhang /* when matrix data structure is changed, previous jshort must be replaced */ 8719566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jshort)); 87217803ae8SHong Zhang } 8739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->i[A->rmap->n], &a->jshort)); 87438702af4SBarry Smith for (i = 0; i < a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i]; 87538702af4SBarry Smith A->ops->mult = MatMult_SeqSBAIJ_1_ushort; 87641f059aeSBarry Smith A->ops->sor = MatSOR_SeqSBAIJ_ushort; 8774da8f245SBarry Smith a->free_jshort = PETSC_TRUE; 87838702af4SBarry Smith } 8793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 88049b5e25fSSatish Balay } 88149b5e25fSSatish Balay 88249b5e25fSSatish Balay /* 88349b5e25fSSatish Balay This function returns an array of flags which indicate the locations of contiguous 88449b5e25fSSatish Balay blocks that should be zeroed. for eg: if bs = 3 and is = [0,1,2,3,5,6,7,8,9] 885a5b23f4aSJose E. Roman then the resulting sizes = [3,1,1,3,1] corresponding to sets [(0,1,2),(3),(5),(6,7,8),(9)] 88649b5e25fSSatish Balay Assume: sizes should be long enough to hold all the values. 88749b5e25fSSatish Balay */ 888d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqSBAIJ_Check_Blocks(PetscInt idx[], PetscInt n, PetscInt bs, PetscInt sizes[], PetscInt *bs_max) 889d71ae5a4SJacob Faibussowitsch { 89013f74950SBarry Smith PetscInt i, j, k, row; 891ace3abfcSBarry Smith PetscBool flg; 89249b5e25fSSatish Balay 89349b5e25fSSatish Balay PetscFunctionBegin; 89449b5e25fSSatish Balay for (i = 0, j = 0; i < n; j++) { 89549b5e25fSSatish Balay row = idx[i]; 896a5b23f4aSJose E. Roman if (row % bs != 0) { /* Not the beginning of a block */ 89749b5e25fSSatish Balay sizes[j] = 1; 89849b5e25fSSatish Balay i++; 89949b5e25fSSatish Balay } else if (i + bs > n) { /* Beginning of a block, but complete block doesn't exist (at idx end) */ 90049b5e25fSSatish Balay sizes[j] = 1; /* Also makes sure at least 'bs' values exist for next else */ 90149b5e25fSSatish Balay i++; 9026aad120cSJose E. Roman } else { /* Beginning of the block, so check if the complete block exists */ 90349b5e25fSSatish Balay flg = PETSC_TRUE; 90449b5e25fSSatish Balay for (k = 1; k < bs; k++) { 90549b5e25fSSatish Balay if (row + k != idx[i + k]) { /* break in the block */ 90649b5e25fSSatish Balay flg = PETSC_FALSE; 90749b5e25fSSatish Balay break; 90849b5e25fSSatish Balay } 90949b5e25fSSatish Balay } 910abc0a331SBarry Smith if (flg) { /* No break in the bs */ 91149b5e25fSSatish Balay sizes[j] = bs; 91249b5e25fSSatish Balay i += bs; 91349b5e25fSSatish Balay } else { 91449b5e25fSSatish Balay sizes[j] = 1; 91549b5e25fSSatish Balay i++; 91649b5e25fSSatish Balay } 91749b5e25fSSatish Balay } 91849b5e25fSSatish Balay } 91949b5e25fSSatish Balay *bs_max = j; 9203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 92149b5e25fSSatish Balay } 92249b5e25fSSatish Balay 92349b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks). 924da81f932SPierre Jolivet Any a(i,j) with i>j input by user is ignored. 92549b5e25fSSatish Balay */ 92649b5e25fSSatish Balay 927d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 928d71ae5a4SJacob Faibussowitsch { 92949b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 930e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N, lastcol = -1; 93113f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen, roworiented = a->roworiented; 932d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs = A->rmap->bs, brow, bcol; 93313f74950SBarry Smith PetscInt ridx, cidx, bs2 = a->bs2; 93449b5e25fSSatish Balay MatScalar *ap, value, *aa = a->a, *bap; 93549b5e25fSSatish Balay 93649b5e25fSSatish Balay PetscFunctionBegin; 93749b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over added rows */ 93849b5e25fSSatish Balay row = im[k]; /* row number */ 93949b5e25fSSatish Balay brow = row / bs; /* block row number */ 94049b5e25fSSatish Balay if (row < 0) continue; 9416bdcaf15SBarry Smith PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 94249b5e25fSSatish Balay rp = aj + ai[brow]; /*ptr to beginning of column value of the row block*/ 94349b5e25fSSatish Balay ap = aa + bs2 * ai[brow]; /*ptr to beginning of element value of the row block*/ 94449b5e25fSSatish Balay rmax = imax[brow]; /* maximum space allocated for this row */ 94549b5e25fSSatish Balay nrow = ailen[brow]; /* actual length of this row */ 94649b5e25fSSatish Balay low = 0; 9478509e838SStefano Zampini high = nrow; 94849b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over added columns */ 94949b5e25fSSatish Balay if (in[l] < 0) continue; 9506bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->N - 1); 95149b5e25fSSatish Balay col = in[l]; 95249b5e25fSSatish Balay bcol = col / bs; /* block col number */ 95349b5e25fSSatish Balay 954941593c8SHong Zhang if (brow > bcol) { 95526fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular values */ 95626fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 957941593c8SHong Zhang } 958f4989cb3SHong Zhang 9599371c9d4SSatish Balay ridx = row % bs; 9609371c9d4SSatish Balay cidx = col % bs; /*row and col index inside the block */ 9618549e402SHong Zhang if ((brow == bcol && ridx <= cidx) || (brow < bcol)) { 96249b5e25fSSatish Balay /* element value a(k,l) */ 96326fbe8dcSKarl Rupp if (roworiented) value = v[l + k * n]; 96426fbe8dcSKarl Rupp else value = v[k + l * m]; 96549b5e25fSSatish Balay 96649b5e25fSSatish Balay /* move pointer bap to a(k,l) quickly and add/insert value */ 96726fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 9688509e838SStefano Zampini else high = nrow; 9698509e838SStefano Zampini 970e2ee6c50SBarry Smith lastcol = col; 97149b5e25fSSatish Balay while (high - low > 7) { 97249b5e25fSSatish Balay t = (low + high) / 2; 97349b5e25fSSatish Balay if (rp[t] > bcol) high = t; 97449b5e25fSSatish Balay else low = t; 97549b5e25fSSatish Balay } 97649b5e25fSSatish Balay for (i = low; i < high; i++) { 97749b5e25fSSatish Balay if (rp[i] > bcol) break; 97849b5e25fSSatish Balay if (rp[i] == bcol) { 97949b5e25fSSatish Balay bap = ap + bs2 * i + bs * cidx + ridx; 98049b5e25fSSatish Balay if (is == ADD_VALUES) *bap += value; 98149b5e25fSSatish Balay else *bap = value; 9828549e402SHong Zhang /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 9838549e402SHong Zhang if (brow == bcol && ridx < cidx) { 9848549e402SHong Zhang bap = ap + bs2 * i + bs * ridx + cidx; 9858549e402SHong Zhang if (is == ADD_VALUES) *bap += value; 9868549e402SHong Zhang else *bap = value; 9878549e402SHong Zhang } 98849b5e25fSSatish Balay goto noinsert1; 98949b5e25fSSatish Balay } 99049b5e25fSSatish Balay } 99149b5e25fSSatish Balay 99249b5e25fSSatish Balay if (nonew == 1) goto noinsert1; 99308401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 994fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, brow, bcol, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 99549b5e25fSSatish Balay 9969371c9d4SSatish Balay N = nrow++ - 1; 9979371c9d4SSatish Balay high++; 99849b5e25fSSatish Balay /* shift up all the later entries in this row */ 9999566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 10009566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 10019566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 100249b5e25fSSatish Balay rp[i] = bcol; 100349b5e25fSSatish Balay ap[bs2 * i + bs * cidx + ridx] = value; 10048509e838SStefano Zampini /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 1005ad540459SPierre Jolivet if (brow == bcol && ridx < cidx) ap[bs2 * i + bs * ridx + cidx] = value; 1006e56f5c9eSBarry Smith A->nonzerostate++; 100749b5e25fSSatish Balay noinsert1:; 100849b5e25fSSatish Balay low = i; 10098549e402SHong Zhang } 101049b5e25fSSatish Balay } /* end of loop over added columns */ 101149b5e25fSSatish Balay ailen[brow] = nrow; 101249b5e25fSSatish Balay } /* end of loop over added rows */ 10133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 101449b5e25fSSatish Balay } 101549b5e25fSSatish Balay 1016d71ae5a4SJacob Faibussowitsch PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA, IS row, const MatFactorInfo *info) 1017d71ae5a4SJacob Faibussowitsch { 10184ccecd49SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)inA->data; 101949b5e25fSSatish Balay Mat outA; 1020ace3abfcSBarry Smith PetscBool row_identity; 102149b5e25fSSatish Balay 102249b5e25fSSatish Balay PetscFunctionBegin; 102308401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 is supported for in-place icc"); 10249566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 102528b400f6SJacob Faibussowitsch PetscCheck(row_identity, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix reordering is not supported"); 102608401ef6SPierre Jolivet PetscCheck(inA->rmap->bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix block size %" PetscInt_FMT " is not supported", inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! */ 1027c84f5b01SHong Zhang 102849b5e25fSSatish Balay outA = inA; 1029d5f3da31SBarry Smith inA->factortype = MAT_FACTOR_ICC; 10309566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 10319566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 103249b5e25fSSatish Balay 10339566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(inA)); 10349566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetNumericFactorization_inplace(inA, row_identity)); 103549b5e25fSSatish Balay 10369566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10379566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1038c84f5b01SHong Zhang a->row = row; 10399566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10409566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1041c84f5b01SHong Zhang a->col = row; 1042c84f5b01SHong Zhang 1043c84f5b01SHong Zhang /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */ 10449566063dSJacob Faibussowitsch if (a->icol) PetscCall(ISInvertPermutation(row, PETSC_DECIDE, &a->icol)); 104549b5e25fSSatish Balay 1046aa624791SPierre Jolivet if (!a->solve_work) PetscCall(PetscMalloc1(inA->rmap->N + inA->rmap->bs, &a->solve_work)); 104749b5e25fSSatish Balay 10489566063dSJacob Faibussowitsch PetscCall(MatCholeskyFactorNumeric(outA, inA, info)); 10493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 105049b5e25fSSatish Balay } 1051950f1e5bSHong Zhang 1052d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat, PetscInt *indices) 1053d71ae5a4SJacob Faibussowitsch { 1054045c9aa0SHong Zhang Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)mat->data; 105513f74950SBarry Smith PetscInt i, nz, n; 105649b5e25fSSatish Balay 105749b5e25fSSatish Balay PetscFunctionBegin; 10586c6c5352SBarry Smith nz = baij->maxnz; 1059d0f46423SBarry Smith n = mat->cmap->n; 106026fbe8dcSKarl Rupp for (i = 0; i < nz; i++) baij->j[i] = indices[i]; 106126fbe8dcSKarl Rupp 10626c6c5352SBarry Smith baij->nz = nz; 106326fbe8dcSKarl Rupp for (i = 0; i < n; i++) baij->ilen[i] = baij->imax[i]; 106426fbe8dcSKarl Rupp 10659566063dSJacob Faibussowitsch PetscCall(MatSetOption(mat, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 10663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 106749b5e25fSSatish Balay } 106849b5e25fSSatish Balay 106949b5e25fSSatish Balay /*@ 107019585528SSatish Balay MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows 107111a5261eSBarry Smith in a `MATSEQSBAIJ` matrix. 107249b5e25fSSatish Balay 107349b5e25fSSatish Balay Input Parameters: 107411a5261eSBarry Smith + mat - the `MATSEQSBAIJ` matrix 107549b5e25fSSatish Balay - indices - the column indices 107649b5e25fSSatish Balay 107749b5e25fSSatish Balay Level: advanced 107849b5e25fSSatish Balay 107949b5e25fSSatish Balay Notes: 108049b5e25fSSatish Balay This can be called if you have precomputed the nonzero structure of the 108149b5e25fSSatish Balay matrix and want to provide it to the matrix object to improve the performance 108211a5261eSBarry Smith of the `MatSetValues()` operation. 108349b5e25fSSatish Balay 108449b5e25fSSatish Balay You MUST have set the correct numbers of nonzeros per row in the call to 108511a5261eSBarry Smith `MatCreateSeqSBAIJ()`, and the columns indices MUST be sorted. 108649b5e25fSSatish Balay 10872ef1f0ffSBarry Smith MUST be called before any calls to `MatSetValues()` 108849b5e25fSSatish Balay 10891cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ` 109049b5e25fSSatish Balay @*/ 1091d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat, PetscInt *indices) 1092d71ae5a4SJacob Faibussowitsch { 109349b5e25fSSatish Balay PetscFunctionBegin; 10940700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 1095dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 1096cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqSBAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 10973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109849b5e25fSSatish Balay } 109949b5e25fSSatish Balay 1100d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqSBAIJ(Mat A, Mat B, MatStructure str) 1101d71ae5a4SJacob Faibussowitsch { 11024c7a3774SStefano Zampini PetscBool isbaij; 11033c896bc6SHong Zhang 11043c896bc6SHong Zhang PetscFunctionBegin; 11059566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &isbaij, MATSEQSBAIJ, MATMPISBAIJ, "")); 110628b400f6SJacob Faibussowitsch PetscCheck(isbaij, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Not for matrix type %s", ((PetscObject)B)->type_name); 11074c7a3774SStefano Zampini /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. */ 11084c7a3774SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 11093c896bc6SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11103c896bc6SHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 11113c896bc6SHong Zhang 111208401ef6SPierre Jolivet PetscCheck(a->i[a->mbs] == b->i[b->mbs], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different"); 111308401ef6SPierre Jolivet PetscCheck(a->mbs == b->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of rows in two matrices are different"); 111408401ef6SPierre Jolivet PetscCheck(a->bs2 == b->bs2, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different block size"); 11159566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, a->a, a->bs2 * a->i[a->mbs])); 11169566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 11173c896bc6SHong Zhang } else { 11189566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(A)); 11199566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 11209566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(A)); 11213c896bc6SHong Zhang } 11223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11233c896bc6SHong Zhang } 11243c896bc6SHong Zhang 1125d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1126d71ae5a4SJacob Faibussowitsch { 1127a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11285fd66863SKarl Rupp 1129a6ece127SHong Zhang PetscFunctionBegin; 1130a6ece127SHong Zhang *array = a->a; 11313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1132a6ece127SHong Zhang } 1133a6ece127SHong Zhang 1134d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1135d71ae5a4SJacob Faibussowitsch { 1136a6ece127SHong Zhang PetscFunctionBegin; 1137cda14afcSprj- *array = NULL; 11383ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1139a6ece127SHong Zhang } 1140a6ece127SHong Zhang 1141d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y, Mat X, PetscInt *nnz) 1142d71ae5a4SJacob Faibussowitsch { 1143b264fe52SHong Zhang PetscInt bs = Y->rmap->bs, mbs = Y->rmap->N / bs; 114452768537SHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data; 114552768537SHong Zhang Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ *)Y->data; 114652768537SHong Zhang 114752768537SHong Zhang PetscFunctionBegin; 114852768537SHong Zhang /* Set the number of nonzeros in the new matrix */ 11499566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(mbs, x->i, x->j, y->i, y->j, nnz)); 11503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 115152768537SHong Zhang } 115252768537SHong Zhang 1153d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 1154d71ae5a4SJacob Faibussowitsch { 115542ee4b1aSHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data, *y = (Mat_SeqSBAIJ *)Y->data; 115631ce2d13SHong Zhang PetscInt bs = Y->rmap->bs, bs2 = bs * bs; 1157e838b9e7SJed Brown PetscBLASInt one = 1; 115842ee4b1aSHong Zhang 115942ee4b1aSHong Zhang PetscFunctionBegin; 1160134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 1161134adf20SPierre Jolivet PetscBool e = x->nz == y->nz && x->mbs == y->mbs ? PETSC_TRUE : PETSC_FALSE; 1162134adf20SPierre Jolivet if (e) { 11639566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, x->mbs + 1, &e)); 1164134adf20SPierre Jolivet if (e) { 11659566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, x->i[x->mbs], &e)); 1166134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 1167134adf20SPierre Jolivet } 1168134adf20SPierre Jolivet } 116954c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 1170134adf20SPierre Jolivet } 117142ee4b1aSHong Zhang if (str == SAME_NONZERO_PATTERN) { 1172f4df32b1SMatthew Knepley PetscScalar alpha = a; 1173c5df96a5SBarry Smith PetscBLASInt bnz; 11749566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz * bs2, &bnz)); 1175792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, x->a, &one, y->a, &one)); 11769566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 1177ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 11789566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_TRUE)); 11799566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 11809566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_FALSE)); 118142ee4b1aSHong Zhang } else { 118252768537SHong Zhang Mat B; 118352768537SHong Zhang PetscInt *nnz; 118454c59aa7SJacob Faibussowitsch PetscCheck(bs == X->rmap->bs, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Matrices must have same block size"); 11859566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(X)); 11869566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(Y)); 11879566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 11889566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 11899566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 11909566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, Y->rmap->n, Y->cmap->n, Y->rmap->N, Y->cmap->N)); 11919566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, Y, Y)); 11929566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 11939566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqSBAIJ(Y, X, nnz)); 11949566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 119552768537SHong Zhang 11969566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 119752768537SHong Zhang 11989566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 11999566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 12009566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(X)); 12019566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(Y)); 120242ee4b1aSHong Zhang } 12033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 120442ee4b1aSHong Zhang } 120542ee4b1aSHong Zhang 1206d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1207d71ae5a4SJacob Faibussowitsch { 1208efcf0fc3SBarry Smith PetscFunctionBegin; 1209efcf0fc3SBarry Smith *flg = PETSC_TRUE; 12103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1211efcf0fc3SBarry Smith } 1212efcf0fc3SBarry Smith 1213d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A, PetscBool *flg) 1214d71ae5a4SJacob Faibussowitsch { 1215efcf0fc3SBarry Smith PetscFunctionBegin; 1216efcf0fc3SBarry Smith *flg = PETSC_TRUE; 12173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1218efcf0fc3SBarry Smith } 1219efcf0fc3SBarry Smith 1220d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1221d71ae5a4SJacob Faibussowitsch { 1222efcf0fc3SBarry Smith PetscFunctionBegin; 1223efcf0fc3SBarry Smith *flg = PETSC_FALSE; 12243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1225efcf0fc3SBarry Smith } 1226efcf0fc3SBarry Smith 1227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatConjugate_SeqSBAIJ(Mat A) 1228d71ae5a4SJacob Faibussowitsch { 12292726fb6dSPierre Jolivet #if defined(PETSC_USE_COMPLEX) 12302726fb6dSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 12312726fb6dSPierre Jolivet PetscInt i, nz = a->bs2 * a->i[a->mbs]; 12322726fb6dSPierre Jolivet MatScalar *aa = a->a; 12332726fb6dSPierre Jolivet 12342726fb6dSPierre Jolivet PetscFunctionBegin; 12352726fb6dSPierre Jolivet for (i = 0; i < nz; i++) aa[i] = PetscConj(aa[i]); 12362726fb6dSPierre Jolivet #else 12372726fb6dSPierre Jolivet PetscFunctionBegin; 12382726fb6dSPierre Jolivet #endif 12393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12402726fb6dSPierre Jolivet } 12412726fb6dSPierre Jolivet 1242d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqSBAIJ(Mat A) 1243d71ae5a4SJacob Faibussowitsch { 124499cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 124599cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1246dd6ea824SBarry Smith MatScalar *aa = a->a; 124799cafbc1SBarry Smith 124899cafbc1SBarry Smith PetscFunctionBegin; 124999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 12503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 125199cafbc1SBarry Smith } 125299cafbc1SBarry Smith 1253d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A) 1254d71ae5a4SJacob Faibussowitsch { 125599cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 125699cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1257dd6ea824SBarry Smith MatScalar *aa = a->a; 125899cafbc1SBarry Smith 125999cafbc1SBarry Smith PetscFunctionBegin; 126099cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 12613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 126299cafbc1SBarry Smith } 126399cafbc1SBarry Smith 1264d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A, PetscInt is_n, const PetscInt is_idx[], PetscScalar diag, Vec x, Vec b) 1265d71ae5a4SJacob Faibussowitsch { 12663bededecSBarry Smith Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)A->data; 12673bededecSBarry Smith PetscInt i, j, k, count; 12683bededecSBarry Smith PetscInt bs = A->rmap->bs, bs2 = baij->bs2, row, col; 12693bededecSBarry Smith PetscScalar zero = 0.0; 12703bededecSBarry Smith MatScalar *aa; 12713bededecSBarry Smith const PetscScalar *xx; 12723bededecSBarry Smith PetscScalar *bb; 127356777dd2SBarry Smith PetscBool *zeroed, vecs = PETSC_FALSE; 12743bededecSBarry Smith 12753bededecSBarry Smith PetscFunctionBegin; 12763bededecSBarry Smith /* fix right hand side if needed */ 12773bededecSBarry Smith if (x && b) { 12789566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 12799566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 128056777dd2SBarry Smith vecs = PETSC_TRUE; 12813bededecSBarry Smith } 12823bededecSBarry Smith 12833bededecSBarry Smith /* zero the columns */ 12849566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 12853bededecSBarry Smith for (i = 0; i < is_n; i++) { 1286aed4548fSBarry Smith PetscCheck(is_idx[i] >= 0 && is_idx[i] < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", is_idx[i]); 12873bededecSBarry Smith zeroed[is_idx[i]] = PETSC_TRUE; 12883bededecSBarry Smith } 128956777dd2SBarry Smith if (vecs) { 129056777dd2SBarry Smith for (i = 0; i < A->rmap->N; i++) { 129156777dd2SBarry Smith row = i / bs; 129256777dd2SBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 129356777dd2SBarry Smith for (k = 0; k < bs; k++) { 129456777dd2SBarry Smith col = bs * baij->j[j] + k; 129556777dd2SBarry Smith if (col <= i) continue; 129656777dd2SBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 129726fbe8dcSKarl Rupp if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0] * xx[col]; 129826fbe8dcSKarl Rupp if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0] * xx[i]; 129956777dd2SBarry Smith } 130056777dd2SBarry Smith } 130156777dd2SBarry Smith } 130226fbe8dcSKarl Rupp for (i = 0; i < is_n; i++) bb[is_idx[i]] = diag * xx[is_idx[i]]; 130356777dd2SBarry Smith } 130456777dd2SBarry Smith 13053bededecSBarry Smith for (i = 0; i < A->rmap->N; i++) { 13063bededecSBarry Smith if (!zeroed[i]) { 13073bededecSBarry Smith row = i / bs; 13083bededecSBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 13093bededecSBarry Smith for (k = 0; k < bs; k++) { 13103bededecSBarry Smith col = bs * baij->j[j] + k; 13113bededecSBarry Smith if (zeroed[col]) { 13123bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 13133bededecSBarry Smith aa[0] = 0.0; 13143bededecSBarry Smith } 13153bededecSBarry Smith } 13163bededecSBarry Smith } 13173bededecSBarry Smith } 13183bededecSBarry Smith } 13199566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 132056777dd2SBarry Smith if (vecs) { 13219566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 13229566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 132356777dd2SBarry Smith } 13243bededecSBarry Smith 13253bededecSBarry Smith /* zero the rows */ 13263bededecSBarry Smith for (i = 0; i < is_n; i++) { 13273bededecSBarry Smith row = is_idx[i]; 13283bededecSBarry Smith count = (baij->i[row / bs + 1] - baij->i[row / bs]) * bs; 13293bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + baij->i[row / bs] * bs2 + (row % bs); 13303bededecSBarry Smith for (k = 0; k < count; k++) { 13313bededecSBarry Smith aa[0] = zero; 13323bededecSBarry Smith aa += bs; 13333bededecSBarry Smith } 1334dbbe0bcdSBarry Smith if (diag != 0.0) PetscUseTypeMethod(A, setvalues, 1, &row, 1, &row, &diag, INSERT_VALUES); 13353bededecSBarry Smith } 13369566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqSBAIJ(A, MAT_FINAL_ASSEMBLY)); 13373ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13383bededecSBarry Smith } 13393bededecSBarry Smith 1340d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqSBAIJ(Mat Y, PetscScalar a) 1341d71ae5a4SJacob Faibussowitsch { 13427d68702bSBarry Smith Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)Y->data; 13437d68702bSBarry Smith 13447d68702bSBarry Smith PetscFunctionBegin; 134548a46eb9SPierre Jolivet if (!Y->preallocated || !aij->nz) PetscCall(MatSeqSBAIJSetPreallocation(Y, Y->rmap->bs, 1, NULL)); 13469566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(Y, a)); 13473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13487d68702bSBarry Smith } 13497d68702bSBarry Smith 13503964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ, 135149b5e25fSSatish Balay MatGetRow_SeqSBAIJ, 135249b5e25fSSatish Balay MatRestoreRow_SeqSBAIJ, 135349b5e25fSSatish Balay MatMult_SeqSBAIJ_N, 135497304618SKris Buschelman /* 4*/ MatMultAdd_SeqSBAIJ_N, 1355431c96f7SBarry Smith MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */ 1356e005ede5SBarry Smith MatMultAdd_SeqSBAIJ_N, 1357f4259b30SLisandro Dalcin NULL, 1358f4259b30SLisandro Dalcin NULL, 1359f4259b30SLisandro Dalcin NULL, 1360f4259b30SLisandro Dalcin /* 10*/ NULL, 1361f4259b30SLisandro Dalcin NULL, 1362c078aec8SLisandro Dalcin MatCholeskyFactor_SeqSBAIJ, 136341f059aeSBarry Smith MatSOR_SeqSBAIJ, 136449b5e25fSSatish Balay MatTranspose_SeqSBAIJ, 136597304618SKris Buschelman /* 15*/ MatGetInfo_SeqSBAIJ, 136649b5e25fSSatish Balay MatEqual_SeqSBAIJ, 136749b5e25fSSatish Balay MatGetDiagonal_SeqSBAIJ, 136849b5e25fSSatish Balay MatDiagonalScale_SeqSBAIJ, 136949b5e25fSSatish Balay MatNorm_SeqSBAIJ, 1370f4259b30SLisandro Dalcin /* 20*/ NULL, 137149b5e25fSSatish Balay MatAssemblyEnd_SeqSBAIJ, 137249b5e25fSSatish Balay MatSetOption_SeqSBAIJ, 137349b5e25fSSatish Balay MatZeroEntries_SeqSBAIJ, 1374f4259b30SLisandro Dalcin /* 24*/ NULL, 1375f4259b30SLisandro Dalcin NULL, 1376f4259b30SLisandro Dalcin NULL, 1377f4259b30SLisandro Dalcin NULL, 1378f4259b30SLisandro Dalcin NULL, 137926cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 1380f4259b30SLisandro Dalcin NULL, 1381f4259b30SLisandro Dalcin NULL, 1382f4259b30SLisandro Dalcin NULL, 1383f4259b30SLisandro Dalcin NULL, 1384d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqSBAIJ, 1385f4259b30SLisandro Dalcin NULL, 1386f4259b30SLisandro Dalcin NULL, 1387f4259b30SLisandro Dalcin NULL, 1388c84f5b01SHong Zhang MatICCFactor_SeqSBAIJ, 1389d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqSBAIJ, 13907dae84e0SHong Zhang MatCreateSubMatrices_SeqSBAIJ, 139149b5e25fSSatish Balay MatIncreaseOverlap_SeqSBAIJ, 139249b5e25fSSatish Balay MatGetValues_SeqSBAIJ, 13933c896bc6SHong Zhang MatCopy_SeqSBAIJ, 1394f4259b30SLisandro Dalcin /* 44*/ NULL, 139549b5e25fSSatish Balay MatScale_SeqSBAIJ, 13967d68702bSBarry Smith MatShift_SeqSBAIJ, 1397f4259b30SLisandro Dalcin NULL, 13983bededecSBarry Smith MatZeroRowsColumns_SeqSBAIJ, 1399f4259b30SLisandro Dalcin /* 49*/ NULL, 140049b5e25fSSatish Balay MatGetRowIJ_SeqSBAIJ, 140149b5e25fSSatish Balay MatRestoreRowIJ_SeqSBAIJ, 1402f4259b30SLisandro Dalcin NULL, 1403f4259b30SLisandro Dalcin NULL, 1404f4259b30SLisandro Dalcin /* 54*/ NULL, 1405f4259b30SLisandro Dalcin NULL, 1406f4259b30SLisandro Dalcin NULL, 1407dc29a518SPierre Jolivet MatPermute_SeqSBAIJ, 140849b5e25fSSatish Balay MatSetValuesBlocked_SeqSBAIJ, 14097dae84e0SHong Zhang /* 59*/ MatCreateSubMatrix_SeqSBAIJ, 1410f4259b30SLisandro Dalcin NULL, 1411f4259b30SLisandro Dalcin NULL, 1412f4259b30SLisandro Dalcin NULL, 1413f4259b30SLisandro Dalcin NULL, 1414f4259b30SLisandro Dalcin /* 64*/ NULL, 1415f4259b30SLisandro Dalcin NULL, 1416f4259b30SLisandro Dalcin NULL, 1417f4259b30SLisandro Dalcin NULL, 1418f4259b30SLisandro Dalcin NULL, 1419d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqSBAIJ, 1420f4259b30SLisandro Dalcin NULL, 142128d58a37SPierre Jolivet MatConvert_MPISBAIJ_Basic, 1422f4259b30SLisandro Dalcin NULL, 1423f4259b30SLisandro Dalcin NULL, 1424f4259b30SLisandro Dalcin /* 74*/ NULL, 1425f4259b30SLisandro Dalcin NULL, 1426f4259b30SLisandro Dalcin NULL, 1427f4259b30SLisandro Dalcin NULL, 1428f4259b30SLisandro Dalcin NULL, 1429f4259b30SLisandro Dalcin /* 79*/ NULL, 1430f4259b30SLisandro Dalcin NULL, 1431f4259b30SLisandro Dalcin NULL, 143297304618SKris Buschelman MatGetInertia_SeqSBAIJ, 14335bba2384SShri Abhyankar MatLoad_SeqSBAIJ, 1434d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqSBAIJ, 1435865e5f61SKris Buschelman MatIsHermitian_SeqSBAIJ, 1436efcf0fc3SBarry Smith MatIsStructurallySymmetric_SeqSBAIJ, 1437f4259b30SLisandro Dalcin NULL, 1438f4259b30SLisandro Dalcin NULL, 1439f4259b30SLisandro Dalcin /* 89*/ NULL, 1440f4259b30SLisandro Dalcin NULL, 1441f4259b30SLisandro Dalcin NULL, 1442f4259b30SLisandro Dalcin NULL, 1443f4259b30SLisandro Dalcin NULL, 1444f4259b30SLisandro Dalcin /* 94*/ NULL, 1445f4259b30SLisandro Dalcin NULL, 1446f4259b30SLisandro Dalcin NULL, 1447f4259b30SLisandro Dalcin NULL, 1448f4259b30SLisandro Dalcin NULL, 1449f4259b30SLisandro Dalcin /* 99*/ NULL, 1450f4259b30SLisandro Dalcin NULL, 1451f4259b30SLisandro Dalcin NULL, 14522726fb6dSPierre Jolivet MatConjugate_SeqSBAIJ, 1453f4259b30SLisandro Dalcin NULL, 1454f4259b30SLisandro Dalcin /*104*/ NULL, 145599cafbc1SBarry Smith MatRealPart_SeqSBAIJ, 1456f5edf698SHong Zhang MatImaginaryPart_SeqSBAIJ, 1457f5edf698SHong Zhang MatGetRowUpperTriangular_SeqSBAIJ, 14582af78befSBarry Smith MatRestoreRowUpperTriangular_SeqSBAIJ, 1459f4259b30SLisandro Dalcin /*109*/ NULL, 1460f4259b30SLisandro Dalcin NULL, 1461f4259b30SLisandro Dalcin NULL, 1462f4259b30SLisandro Dalcin NULL, 1463547795f9SHong Zhang MatMissingDiagonal_SeqSBAIJ, 1464f4259b30SLisandro Dalcin /*114*/ NULL, 1465f4259b30SLisandro Dalcin NULL, 1466f4259b30SLisandro Dalcin NULL, 1467f4259b30SLisandro Dalcin NULL, 1468f4259b30SLisandro Dalcin NULL, 1469f4259b30SLisandro Dalcin /*119*/ NULL, 1470f4259b30SLisandro Dalcin NULL, 1471f4259b30SLisandro Dalcin NULL, 1472f4259b30SLisandro Dalcin NULL, 1473f4259b30SLisandro Dalcin NULL, 1474f4259b30SLisandro Dalcin /*124*/ NULL, 1475f4259b30SLisandro Dalcin NULL, 1476f4259b30SLisandro Dalcin NULL, 1477f4259b30SLisandro Dalcin NULL, 1478f4259b30SLisandro Dalcin NULL, 1479f4259b30SLisandro Dalcin /*129*/ NULL, 1480f4259b30SLisandro Dalcin NULL, 1481f4259b30SLisandro Dalcin NULL, 1482f4259b30SLisandro Dalcin NULL, 1483f4259b30SLisandro Dalcin NULL, 1484f4259b30SLisandro Dalcin /*134*/ NULL, 1485f4259b30SLisandro Dalcin NULL, 1486f4259b30SLisandro Dalcin NULL, 1487f4259b30SLisandro Dalcin NULL, 1488f4259b30SLisandro Dalcin NULL, 148946533700Sstefano_zampini /*139*/ MatSetBlockSizes_Default, 1490f4259b30SLisandro Dalcin NULL, 1491f4259b30SLisandro Dalcin NULL, 1492f4259b30SLisandro Dalcin NULL, 1493f4259b30SLisandro Dalcin NULL, 1494d70f29a3SPierre Jolivet /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ, 1495d70f29a3SPierre Jolivet NULL, 1496d70f29a3SPierre Jolivet NULL, 149799a7f59eSMark Adams NULL, 149899a7f59eSMark Adams NULL, 14997fb60732SBarry Smith NULL, 1500dec0b466SHong Zhang /*150*/ NULL, 1501dec0b466SHong Zhang NULL}; 1502be1d678aSKris Buschelman 1503d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat) 1504d71ae5a4SJacob Faibussowitsch { 15054afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1506d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 150749b5e25fSSatish Balay 150849b5e25fSSatish Balay PetscFunctionBegin; 150908401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 151049b5e25fSSatish Balay 151149b5e25fSSatish Balay /* allocate space for values if not already there */ 151248a46eb9SPierre Jolivet if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); 151349b5e25fSSatish Balay 151449b5e25fSSatish Balay /* copy values over */ 15159566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 15163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 151749b5e25fSSatish Balay } 151849b5e25fSSatish Balay 1519d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat) 1520d71ae5a4SJacob Faibussowitsch { 15214afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1522d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 152349b5e25fSSatish Balay 152449b5e25fSSatish Balay PetscFunctionBegin; 152508401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 152628b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 152749b5e25fSSatish Balay 152849b5e25fSSatish Balay /* copy values over */ 15299566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 15303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 153149b5e25fSSatish Balay } 153249b5e25fSSatish Balay 1533d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B, PetscInt bs, PetscInt nz, PetscInt *nnz) 1534d71ae5a4SJacob Faibussowitsch { 1535c464158bSHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 15364dcd73b1SHong Zhang PetscInt i, mbs, nbs, bs2; 15372576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, flg = PETSC_FALSE, realalloc = PETSC_FALSE; 153849b5e25fSSatish Balay 1539*b4e2f619SBarry Smith PetscFunctionBegin; 1540ad79cf63SBarry Smith if (B->hash_active) { 1541ad79cf63SBarry Smith PetscInt bs; 1542ad79cf63SBarry Smith PetscCall(PetscMemcpy(&B->ops, &b->cops, sizeof(*(B->ops)))); 1543ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 1544ad79cf63SBarry Smith PetscCall(MatGetBlockSize(B, &bs)); 1545ad79cf63SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&b->bht)); 1546ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 1547ad79cf63SBarry Smith PetscCall(PetscFree(b->bdnz)); 1548ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 1549ad79cf63SBarry Smith } 15502576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 1551db4efbfdSBarry Smith 15529566063dSJacob Faibussowitsch PetscCall(MatSetBlockSize(B, PetscAbs(bs))); 15539566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 15549566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 155508401ef6SPierre Jolivet PetscCheck(B->rmap->N <= B->cmap->N, PETSC_COMM_SELF, PETSC_ERR_SUP, "SEQSBAIJ matrix cannot have more rows %" PetscInt_FMT " than columns %" PetscInt_FMT, B->rmap->N, B->cmap->N); 15569566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 1557899cda47SBarry Smith 155821940c7eSstefano_zampini B->preallocated = PETSC_TRUE; 155921940c7eSstefano_zampini 1560d0f46423SBarry Smith mbs = B->rmap->N / bs; 15614dcd73b1SHong Zhang nbs = B->cmap->n / bs; 156249b5e25fSSatish Balay bs2 = bs * bs; 156349b5e25fSSatish Balay 1564aed4548fSBarry Smith PetscCheck(mbs * bs == B->rmap->N && nbs * bs == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Number rows, cols must be divisible by blocksize"); 156549b5e25fSSatish Balay 1566ab93d7beSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 1567ab93d7beSBarry Smith skipallocation = PETSC_TRUE; 1568ab93d7beSBarry Smith nz = 0; 1569ab93d7beSBarry Smith } 1570ab93d7beSBarry Smith 1571435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3; 157208401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 157349b5e25fSSatish Balay if (nnz) { 157449b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 157508401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 157608401ef6SPierre Jolivet PetscCheck(nnz[i] <= nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than block row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " block rowlength %" PetscInt_FMT, i, nnz[i], nbs); 157749b5e25fSSatish Balay } 157849b5e25fSSatish Balay } 157949b5e25fSSatish Balay 1580db4efbfdSBarry Smith B->ops->mult = MatMult_SeqSBAIJ_N; 1581db4efbfdSBarry Smith B->ops->multadd = MatMultAdd_SeqSBAIJ_N; 1582db4efbfdSBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_N; 1583db4efbfdSBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N; 158426fbe8dcSKarl Rupp 15859566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 158649b5e25fSSatish Balay if (!flg) { 158749b5e25fSSatish Balay switch (bs) { 158849b5e25fSSatish Balay case 1: 158949b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_1; 159049b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_1; 1591431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_1; 1592431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1; 159349b5e25fSSatish Balay break; 159449b5e25fSSatish Balay case 2: 159549b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_2; 159649b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_2; 1597431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_2; 1598431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2; 159949b5e25fSSatish Balay break; 160049b5e25fSSatish Balay case 3: 160149b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_3; 160249b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_3; 1603431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_3; 1604431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3; 160549b5e25fSSatish Balay break; 160649b5e25fSSatish Balay case 4: 160749b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_4; 160849b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_4; 1609431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_4; 1610431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4; 161149b5e25fSSatish Balay break; 161249b5e25fSSatish Balay case 5: 161349b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_5; 161449b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_5; 1615431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_5; 1616431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5; 161749b5e25fSSatish Balay break; 161849b5e25fSSatish Balay case 6: 161949b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_6; 162049b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_6; 1621431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_6; 1622431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6; 162349b5e25fSSatish Balay break; 162449b5e25fSSatish Balay case 7: 1625de53e5efSHong Zhang B->ops->mult = MatMult_SeqSBAIJ_7; 162649b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_7; 1627431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_7; 1628431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7; 162949b5e25fSSatish Balay break; 163049b5e25fSSatish Balay } 163149b5e25fSSatish Balay } 163249b5e25fSSatish Balay 163349b5e25fSSatish Balay b->mbs = mbs; 16344dcd73b1SHong Zhang b->nbs = nbs; 1635ab93d7beSBarry Smith if (!skipallocation) { 16362ee49352SLisandro Dalcin if (!b->imax) { 16379566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mbs, &b->imax, mbs, &b->ilen)); 163826fbe8dcSKarl Rupp 1639c760cd28SBarry Smith b->free_imax_ilen = PETSC_TRUE; 16402ee49352SLisandro Dalcin } 164149b5e25fSSatish Balay if (!nnz) { 1642435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 164349b5e25fSSatish Balay else if (nz <= 0) nz = 1; 16445d2a9ed1SStefano Zampini nz = PetscMin(nbs, nz); 164526fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->imax[i] = nz; 16469566063dSJacob Faibussowitsch PetscCall(PetscIntMultError(nz, mbs, &nz)); 164749b5e25fSSatish Balay } else { 1648c73702f5SBarry Smith PetscInt64 nz64 = 0; 16499371c9d4SSatish Balay for (i = 0; i < mbs; i++) { 16509371c9d4SSatish Balay b->imax[i] = nnz[i]; 16519371c9d4SSatish Balay nz64 += nnz[i]; 16529371c9d4SSatish Balay } 16539566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 165449b5e25fSSatish Balay } 16552ee49352SLisandro Dalcin /* b->ilen will count nonzeros in each block row so far. */ 165626fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->ilen[i] = 0; 16576c6c5352SBarry Smith /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */ 165849b5e25fSSatish Balay 165949b5e25fSSatish Balay /* allocate the matrix space */ 16609566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 16619566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &b->a, nz, &b->j, B->rmap->N + 1, &b->i)); 16629566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->a, nz * bs2)); 16639566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->j, nz)); 166426fbe8dcSKarl Rupp 166549b5e25fSSatish Balay b->singlemalloc = PETSC_TRUE; 166649b5e25fSSatish Balay 166749b5e25fSSatish Balay /* pointer to beginning of each row */ 1668e60cf9a0SBarry Smith b->i[0] = 0; 166926fbe8dcSKarl Rupp for (i = 1; i < mbs + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 167026fbe8dcSKarl Rupp 1671e6b907acSBarry Smith b->free_a = PETSC_TRUE; 1672e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 1673e811da20SHong Zhang } else { 1674e6b907acSBarry Smith b->free_a = PETSC_FALSE; 1675e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 1676ab93d7beSBarry Smith } 167749b5e25fSSatish Balay 167849b5e25fSSatish Balay b->bs2 = bs2; 16796c6c5352SBarry Smith b->nz = 0; 1680b32cb4a7SJed Brown b->maxnz = nz; 1681f4259b30SLisandro Dalcin b->inew = NULL; 1682f4259b30SLisandro Dalcin b->jnew = NULL; 1683f4259b30SLisandro Dalcin b->anew = NULL; 1684f4259b30SLisandro Dalcin b->a2anew = NULL; 16851a3463dfSHong Zhang b->permute = PETSC_FALSE; 1686cb7b82ddSBarry Smith 1687cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 1688cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 16899566063dSJacob Faibussowitsch if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 16903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1691c464158bSHong Zhang } 1692153ea458SHong Zhang 1693d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B, PetscInt bs, const PetscInt ii[], const PetscInt jj[], const PetscScalar V[]) 1694d71ae5a4SJacob Faibussowitsch { 16950cd7f59aSBarry Smith PetscInt i, j, m, nz, anz, nz_max = 0, *nnz; 1696f4259b30SLisandro Dalcin PetscScalar *values = NULL; 169738f409ebSLisandro Dalcin PetscBool roworiented = ((Mat_SeqSBAIJ *)B->data)->roworiented; 16980cd7f59aSBarry Smith 169938f409ebSLisandro Dalcin PetscFunctionBegin; 170008401ef6SPierre Jolivet PetscCheck(bs >= 1, PetscObjectComm((PetscObject)B), PETSC_ERR_ARG_OUTOFRANGE, "Invalid block size specified, must be positive but it is %" PetscInt_FMT, bs); 17019566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->rmap, bs)); 17029566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->cmap, bs)); 17039566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 17049566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 17059566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 170638f409ebSLisandro Dalcin m = B->rmap->n / bs; 170738f409ebSLisandro Dalcin 1708aed4548fSBarry Smith PetscCheck(!ii[0], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "ii[0] must be 0 but it is %" PetscInt_FMT, ii[0]); 17099566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 171038f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 171138f409ebSLisandro Dalcin nz = ii[i + 1] - ii[i]; 171208401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 17130cd7f59aSBarry Smith anz = 0; 17140cd7f59aSBarry Smith for (j = 0; j < nz; j++) { 17150cd7f59aSBarry Smith /* count only values on the diagonal or above */ 17160cd7f59aSBarry Smith if (jj[ii[i] + j] >= i) { 17170cd7f59aSBarry Smith anz = nz - j; 17180cd7f59aSBarry Smith break; 17190cd7f59aSBarry Smith } 17200cd7f59aSBarry Smith } 17210cd7f59aSBarry Smith nz_max = PetscMax(nz_max, anz); 17220cd7f59aSBarry Smith nnz[i] = anz; 172338f409ebSLisandro Dalcin } 17249566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 17259566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 172638f409ebSLisandro Dalcin 172738f409ebSLisandro Dalcin values = (PetscScalar *)V; 172848a46eb9SPierre Jolivet if (!values) PetscCall(PetscCalloc1(bs * bs * nz_max, &values)); 172938f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 173038f409ebSLisandro Dalcin PetscInt ncols = ii[i + 1] - ii[i]; 173138f409ebSLisandro Dalcin const PetscInt *icols = jj + ii[i]; 173238f409ebSLisandro Dalcin if (!roworiented || bs == 1) { 173338f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * ii[i]) : 0); 17349566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, ncols, icols, svals, INSERT_VALUES)); 173538f409ebSLisandro Dalcin } else { 173638f409ebSLisandro Dalcin for (j = 0; j < ncols; j++) { 173738f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * (ii[i] + j)) : 0); 17389566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, 1, &icols[j], svals, INSERT_VALUES)); 173938f409ebSLisandro Dalcin } 174038f409ebSLisandro Dalcin } 174138f409ebSLisandro Dalcin } 17429566063dSJacob Faibussowitsch if (!V) PetscCall(PetscFree(values)); 17439566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 17449566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 17459566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 17463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 174738f409ebSLisandro Dalcin } 174838f409ebSLisandro Dalcin 1749db4efbfdSBarry Smith /* 1750db4efbfdSBarry Smith This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization 1751db4efbfdSBarry Smith */ 1752d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B, PetscBool natural) 1753d71ae5a4SJacob Faibussowitsch { 1754ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 1755db4efbfdSBarry Smith PetscInt bs = B->rmap->bs; 1756db4efbfdSBarry Smith 1757db4efbfdSBarry Smith PetscFunctionBegin; 17589566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 1759db4efbfdSBarry Smith if (flg) bs = 8; 1760db4efbfdSBarry Smith 1761db4efbfdSBarry Smith if (!natural) { 1762db4efbfdSBarry Smith switch (bs) { 1763d71ae5a4SJacob Faibussowitsch case 1: 1764d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace; 1765d71ae5a4SJacob Faibussowitsch break; 1766d71ae5a4SJacob Faibussowitsch case 2: 1767d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2; 1768d71ae5a4SJacob Faibussowitsch break; 1769d71ae5a4SJacob Faibussowitsch case 3: 1770d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3; 1771d71ae5a4SJacob Faibussowitsch break; 1772d71ae5a4SJacob Faibussowitsch case 4: 1773d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4; 1774d71ae5a4SJacob Faibussowitsch break; 1775d71ae5a4SJacob Faibussowitsch case 5: 1776d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5; 1777d71ae5a4SJacob Faibussowitsch break; 1778d71ae5a4SJacob Faibussowitsch case 6: 1779d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6; 1780d71ae5a4SJacob Faibussowitsch break; 1781d71ae5a4SJacob Faibussowitsch case 7: 1782d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7; 1783d71ae5a4SJacob Faibussowitsch break; 1784d71ae5a4SJacob Faibussowitsch default: 1785d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N; 1786d71ae5a4SJacob Faibussowitsch break; 1787db4efbfdSBarry Smith } 1788db4efbfdSBarry Smith } else { 1789db4efbfdSBarry Smith switch (bs) { 1790d71ae5a4SJacob Faibussowitsch case 1: 1791d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace; 1792d71ae5a4SJacob Faibussowitsch break; 1793d71ae5a4SJacob Faibussowitsch case 2: 1794d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering; 1795d71ae5a4SJacob Faibussowitsch break; 1796d71ae5a4SJacob Faibussowitsch case 3: 1797d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering; 1798d71ae5a4SJacob Faibussowitsch break; 1799d71ae5a4SJacob Faibussowitsch case 4: 1800d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering; 1801d71ae5a4SJacob Faibussowitsch break; 1802d71ae5a4SJacob Faibussowitsch case 5: 1803d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering; 1804d71ae5a4SJacob Faibussowitsch break; 1805d71ae5a4SJacob Faibussowitsch case 6: 1806d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering; 1807d71ae5a4SJacob Faibussowitsch break; 1808d71ae5a4SJacob Faibussowitsch case 7: 1809d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering; 1810d71ae5a4SJacob Faibussowitsch break; 1811d71ae5a4SJacob Faibussowitsch default: 1812d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering; 1813d71ae5a4SJacob Faibussowitsch break; 1814db4efbfdSBarry Smith } 1815db4efbfdSBarry Smith } 18163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1817db4efbfdSBarry Smith } 1818db4efbfdSBarry Smith 1819cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType, MatReuse, Mat *); 1820cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType, MatReuse, Mat *); 1821d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatFactorGetSolverType_petsc(Mat A, MatSolverType *type) 1822d71ae5a4SJacob Faibussowitsch { 18234ac6704cSBarry Smith PetscFunctionBegin; 18244ac6704cSBarry Smith *type = MATSOLVERPETSC; 18253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18264ac6704cSBarry Smith } 1827d769727bSBarry Smith 1828d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A, MatFactorType ftype, Mat *B) 1829d71ae5a4SJacob Faibussowitsch { 1830d0f46423SBarry Smith PetscInt n = A->rmap->n; 18315c9eb25fSBarry Smith 18325c9eb25fSBarry Smith PetscFunctionBegin; 18330e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX) 1834b94d7dedSBarry Smith PetscCheck(A->hermitian != PETSC_BOOL3_TRUE || A->symmetric == PETSC_BOOL3_TRUE || (ftype != MAT_FACTOR_CHOLESKY && ftype != MAT_FACTOR_ICC), PETSC_COMM_SELF, PETSC_ERR_SUP, "Hermitian CHOLESKY or ICC Factor is not supported"); 18350e92d65fSHong Zhang #endif 1836eb1ec7c1SStefano Zampini 18379566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 18389566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, n, n, n, n)); 18395c9eb25fSBarry Smith if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) { 18409566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATSEQSBAIJ)); 18419566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*B, A->rmap->bs, MAT_SKIP_ALLOCATION, NULL)); 184226fbe8dcSKarl Rupp 18437b056e98SHong Zhang (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ; 1844c6d0d4f0SHong Zhang (*B)->ops->iccfactorsymbolic = MatICCFactorSymbolic_SeqSBAIJ; 18459566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_CHOLESKY])); 18469566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_ICC])); 1847e32f2f54SBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "Factor type not supported"); 184800c67f3bSHong Zhang 1849d5f3da31SBarry Smith (*B)->factortype = ftype; 1850f73b0415SBarry Smith (*B)->canuseordering = PETSC_TRUE; 18519566063dSJacob Faibussowitsch PetscCall(PetscFree((*B)->solvertype)); 18529566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &(*B)->solvertype)); 18539566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)*B, "MatFactorGetSolverType_C", MatFactorGetSolverType_petsc)); 18543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18555c9eb25fSBarry Smith } 18565c9eb25fSBarry Smith 18578397e458SBarry Smith /*@C 18582ef1f0ffSBarry Smith MatSeqSBAIJGetArray - gives access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored 18598397e458SBarry Smith 18608397e458SBarry Smith Not Collective 18618397e458SBarry Smith 18628397e458SBarry Smith Input Parameter: 186311a5261eSBarry Smith . mat - a `MATSEQSBAIJ` matrix 18648397e458SBarry Smith 18658397e458SBarry Smith Output Parameter: 18668397e458SBarry Smith . array - pointer to the data 18678397e458SBarry Smith 18688397e458SBarry Smith Level: intermediate 18698397e458SBarry Smith 18701cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJRestoreArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18718397e458SBarry Smith @*/ 1872d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJGetArray(Mat A, PetscScalar **array) 1873d71ae5a4SJacob Faibussowitsch { 18748397e458SBarry Smith PetscFunctionBegin; 1875cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJGetArray_C", (Mat, PetscScalar **), (A, array)); 18763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18778397e458SBarry Smith } 18788397e458SBarry Smith 18798397e458SBarry Smith /*@C 18802ef1f0ffSBarry Smith MatSeqSBAIJRestoreArray - returns access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored obtained by `MatSeqSBAIJGetArray()` 18818397e458SBarry Smith 18828397e458SBarry Smith Not Collective 18838397e458SBarry Smith 18848397e458SBarry Smith Input Parameters: 18852ef1f0ffSBarry Smith + mat - a `MATSEQSBAIJ` matrix 1886a2b725a8SWilliam Gropp - array - pointer to the data 18878397e458SBarry Smith 18888397e458SBarry Smith Level: intermediate 18898397e458SBarry Smith 18901cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJGetArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18918397e458SBarry Smith @*/ 1892d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJRestoreArray(Mat A, PetscScalar **array) 1893d71ae5a4SJacob Faibussowitsch { 18948397e458SBarry Smith PetscFunctionBegin; 1895cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJRestoreArray_C", (Mat, PetscScalar **), (A, array)); 18963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18978397e458SBarry Smith } 18988397e458SBarry Smith 18990bad9183SKris Buschelman /*MC 1900fafad747SKris Buschelman MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices, 19010bad9183SKris Buschelman based on block compressed sparse row format. Only the upper triangular portion of the matrix is stored. 19020bad9183SKris Buschelman 1903828413b8SBarry Smith For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you 190411a5261eSBarry Smith can call `MatSetOption`(`Mat`, `MAT_HERMITIAN`). 1905828413b8SBarry Smith 19062ef1f0ffSBarry Smith Options Database Key: 190711a5261eSBarry Smith . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to `MatSetFromOptions()` 19080bad9183SKris Buschelman 19092ef1f0ffSBarry Smith Level: beginner 19102ef1f0ffSBarry Smith 191195452b02SPatrick Sanan Notes: 191295452b02SPatrick Sanan By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not 191311a5261eSBarry Smith stored and it is assumed they symmetric to the upper triangular). If you call `MatSetOption`(`Mat`,`MAT_IGNORE_LOWER_TRIANGULAR`,`PETSC_FALSE`) or use 19142ef1f0ffSBarry Smith the options database `-mat_ignore_lower_triangular` false it will generate an error if you try to set a value in the lower triangular portion. 191571dad5bbSBarry Smith 1916476417e5SBarry Smith The number of rows in the matrix must be less than or equal to the number of columns 191771dad5bbSBarry Smith 19181cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ()`, `MatType`, `MATMPISBAIJ` 19190bad9183SKris Buschelman M*/ 1920d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B) 1921d71ae5a4SJacob Faibussowitsch { 1922a23d5eceSKris Buschelman Mat_SeqSBAIJ *b; 192313f74950SBarry Smith PetscMPIInt size; 1924ace3abfcSBarry Smith PetscBool no_unroll = PETSC_FALSE, no_inode = PETSC_FALSE; 1925a23d5eceSKris Buschelman 1926a23d5eceSKris Buschelman PetscFunctionBegin; 19279566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 192808401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Comm must be of size 1"); 1929a23d5eceSKris Buschelman 19304dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 1931a23d5eceSKris Buschelman B->data = (void *)b; 19329566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 193326fbe8dcSKarl Rupp 1934a23d5eceSKris Buschelman B->ops->destroy = MatDestroy_SeqSBAIJ; 1935a23d5eceSKris Buschelman B->ops->view = MatView_SeqSBAIJ; 1936f4259b30SLisandro Dalcin b->row = NULL; 1937f4259b30SLisandro Dalcin b->icol = NULL; 1938a23d5eceSKris Buschelman b->reallocs = 0; 1939f4259b30SLisandro Dalcin b->saved_values = NULL; 19400def2e27SBarry Smith b->inode.limit = 5; 19410def2e27SBarry Smith b->inode.max_limit = 5; 1942a23d5eceSKris Buschelman 1943a23d5eceSKris Buschelman b->roworiented = PETSC_TRUE; 1944a23d5eceSKris Buschelman b->nonew = 0; 1945f4259b30SLisandro Dalcin b->diag = NULL; 1946f4259b30SLisandro Dalcin b->solve_work = NULL; 1947f4259b30SLisandro Dalcin b->mult_work = NULL; 1948f4259b30SLisandro Dalcin B->spptr = NULL; 1949f2cbd3d5SJed Brown B->info.nz_unneeded = (PetscReal)b->maxnz * b->bs2; 1950a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 1951a23d5eceSKris Buschelman 1952f4259b30SLisandro Dalcin b->inew = NULL; 1953f4259b30SLisandro Dalcin b->jnew = NULL; 1954f4259b30SLisandro Dalcin b->anew = NULL; 1955f4259b30SLisandro Dalcin b->a2anew = NULL; 1956a23d5eceSKris Buschelman b->permute = PETSC_FALSE; 1957a23d5eceSKris Buschelman 195871dad5bbSBarry Smith b->ignore_ltriangular = PETSC_TRUE; 195926fbe8dcSKarl Rupp 19609566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_ignore_lower_triangular", &b->ignore_ltriangular, NULL)); 1961941593c8SHong Zhang 1962f5edf698SHong Zhang b->getrow_utriangular = PETSC_FALSE; 196326fbe8dcSKarl Rupp 19649566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_getrow_uppertriangular", &b->getrow_utriangular, NULL)); 1965f5edf698SHong Zhang 19669566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJGetArray_C", MatSeqSBAIJGetArray_SeqSBAIJ)); 19679566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJRestoreArray_C", MatSeqSBAIJRestoreArray_SeqSBAIJ)); 19689566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqSBAIJ)); 19699566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqSBAIJ)); 19709566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetColumnIndices_C", MatSeqSBAIJSetColumnIndices_SeqSBAIJ)); 19719566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqaij_C", MatConvert_SeqSBAIJ_SeqAIJ)); 19729566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqbaij_C", MatConvert_SeqSBAIJ_SeqBAIJ)); 19739566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocation_C", MatSeqSBAIJSetPreallocation_SeqSBAIJ)); 19749566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocationCSR_C", MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ)); 19756214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 19769566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_elemental_C", MatConvert_SeqSBAIJ_Elemental)); 19776214f412SHong Zhang #endif 1978d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 19799566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_scalapack_C", MatConvert_SBAIJ_ScaLAPACK)); 1980d24d4204SJose E. Roman #endif 198123ce1328SBarry Smith 1982b94d7dedSBarry Smith B->symmetry_eternal = PETSC_TRUE; 1983b94d7dedSBarry Smith B->structural_symmetry_eternal = PETSC_TRUE; 1984b94d7dedSBarry Smith B->symmetric = PETSC_BOOL3_TRUE; 1985b94d7dedSBarry Smith B->structurally_symmetric = PETSC_BOOL3_TRUE; 1986eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 1987b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_FALSE; 1988eb1ec7c1SStefano Zampini #else 1989b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_TRUE; 1990eb1ec7c1SStefano Zampini #endif 199113647f61SHong Zhang 19929566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQSBAIJ)); 19930def2e27SBarry Smith 1994d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)B), ((PetscObject)B)->prefix, "Options for SEQSBAIJ matrix", "Mat"); 19959566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_unroll", "Do not optimize for inodes (slower)", NULL, no_unroll, &no_unroll, NULL)); 199648a46eb9SPierre Jolivet if (no_unroll) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_unroll\n")); 19979566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_inode", "Do not optimize for inodes (slower)", NULL, no_inode, &no_inode, NULL)); 19989566063dSJacob Faibussowitsch if (no_inode) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_inode\n")); 19999566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-mat_inode_limit", "Do not use inodes larger then this value", NULL, b->inode.limit, &b->inode.limit, NULL)); 2000d0609cedSBarry Smith PetscOptionsEnd(); 2001ace3abfcSBarry Smith b->inode.use = (PetscBool)(!(no_unroll || no_inode)); 20020def2e27SBarry Smith if (b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit; 20033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2004a23d5eceSKris Buschelman } 2005a23d5eceSKris Buschelman 2006a23d5eceSKris Buschelman /*@C 2007a23d5eceSKris Buschelman MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block 200811a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 200920f4b53cSBarry Smith user should preallocate the matrix storage by setting the parameter `nz` 201020f4b53cSBarry Smith (or the array `nnz`). 2011a23d5eceSKris Buschelman 2012c3339decSBarry Smith Collective 2013a23d5eceSKris Buschelman 2014a23d5eceSKris Buschelman Input Parameters: 20151c4f3114SJed Brown + B - the symmetric matrix 201611a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 201711a5261eSBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()` 2018a23d5eceSKris Buschelman . nz - number of block nonzeros per block row (same for all rows) 2019a23d5eceSKris Buschelman - nnz - array containing the number of block nonzeros in the upper triangular plus 20202ef1f0ffSBarry Smith diagonal portion of each block (possibly different for each block row) or `NULL` 2021a23d5eceSKris Buschelman 2022a23d5eceSKris Buschelman Options Database Keys: 2023a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2024a23d5eceSKris Buschelman block calculations (much slower) 2025a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use (only works if a negative bs is passed in 2026a23d5eceSKris Buschelman 2027a23d5eceSKris Buschelman Level: intermediate 2028a23d5eceSKris Buschelman 2029a23d5eceSKris Buschelman Notes: 203020f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 20312ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 2032651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2033a23d5eceSKris Buschelman 203411a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 2035aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 20362ef1f0ffSBarry Smith You can also run with the option `-info` and look for messages with the string 2037aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 2038aa95bbe8SBarry Smith 20392ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 204049a6f317SBarry Smith 20411cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2042a23d5eceSKris Buschelman @*/ 2043d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 2044d71ae5a4SJacob Faibussowitsch { 2045a23d5eceSKris Buschelman PetscFunctionBegin; 20466ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 20476ba663aaSJed Brown PetscValidType(B, 1); 20486ba663aaSJed Brown PetscValidLogicalCollectiveInt(B, bs, 2); 2049cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocation_C", (Mat, PetscInt, PetscInt, const PetscInt[]), (B, bs, nz, nnz)); 20503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2051a23d5eceSKris Buschelman } 205249b5e25fSSatish Balay 205338f409ebSLisandro Dalcin /*@C 205411a5261eSBarry Smith MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in `MATSEQSBAIJ` format using the given nonzero structure and (optional) numerical values 205538f409ebSLisandro Dalcin 205638f409ebSLisandro Dalcin Input Parameters: 20571c4f3114SJed Brown + B - the matrix 2058eab78319SHong Zhang . bs - size of block, the blocks are ALWAYS square. 205938f409ebSLisandro Dalcin . i - the indices into j for the start of each local row (starts with zero) 206038f409ebSLisandro Dalcin . j - the column indices for each local row (starts with zero) these must be sorted for each row 206138f409ebSLisandro Dalcin - v - optional values in the matrix 206238f409ebSLisandro Dalcin 2063664954b6SBarry Smith Level: advanced 206438f409ebSLisandro Dalcin 206538f409ebSLisandro Dalcin Notes: 206611a5261eSBarry Smith The order of the entries in values is specified by the `MatOption` `MAT_ROW_ORIENTED`. For example, C programs 206711a5261eSBarry Smith may want to use the default `MAT_ROW_ORIENTED` = `PETSC_TRUE` and use an array v[nnz][bs][bs] where the second index is 206838f409ebSLisandro Dalcin over rows within a block and the last index is over columns within a block row. Fortran programs will likely set 206911a5261eSBarry Smith `MAT_ROW_ORIENTED` = `PETSC_FALSE` and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a 207038f409ebSLisandro Dalcin block column and the second index is over columns within a block. 207138f409ebSLisandro Dalcin 207250c5228eSBarry Smith Any entries below the diagonal are ignored 20730cd7f59aSBarry Smith 20740cd7f59aSBarry Smith Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries 20750cd7f59aSBarry Smith and usually the numerical values as well 2076664954b6SBarry Smith 20771cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqSBAIJ()`, `MatSetValuesBlocked()`, `MatSeqSBAIJSetPreallocation()`, `MATSEQSBAIJ` 207838f409ebSLisandro Dalcin @*/ 2079d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B, PetscInt bs, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 2080d71ae5a4SJacob Faibussowitsch { 208138f409ebSLisandro Dalcin PetscFunctionBegin; 208238f409ebSLisandro Dalcin PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 208338f409ebSLisandro Dalcin PetscValidType(B, 1); 208438f409ebSLisandro Dalcin PetscValidLogicalCollectiveInt(B, bs, 2); 2085cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocationCSR_C", (Mat, PetscInt, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, bs, i, j, v)); 20863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 208738f409ebSLisandro Dalcin } 208838f409ebSLisandro Dalcin 2089c464158bSHong Zhang /*@C 20902ef1f0ffSBarry Smith MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in (block 209111a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 20922ef1f0ffSBarry Smith user should preallocate the matrix storage by setting the parameter `nz` 20932ef1f0ffSBarry Smith (or the array `nnz`). 209449b5e25fSSatish Balay 2095d083f849SBarry Smith Collective 2096c464158bSHong Zhang 2097c464158bSHong Zhang Input Parameters: 209811a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 209911a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 2100bb7ae925SBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs() 210120f4b53cSBarry Smith . m - number of rows 210220f4b53cSBarry Smith . n - number of columns 2103c464158bSHong Zhang . nz - number of block nonzeros per block row (same for all rows) 2104744e8345SSatish Balay - nnz - array containing the number of block nonzeros in the upper triangular plus 21052ef1f0ffSBarry Smith diagonal portion of each block (possibly different for each block row) or `NULL` 2106c464158bSHong Zhang 2107c464158bSHong Zhang Output Parameter: 2108c464158bSHong Zhang . A - the symmetric matrix 2109c464158bSHong Zhang 2110c464158bSHong Zhang Options Database Keys: 2111a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2112c464158bSHong Zhang block calculations (much slower) 2113a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use 2114c464158bSHong Zhang 2115c464158bSHong Zhang Level: intermediate 2116c464158bSHong Zhang 21172ef1f0ffSBarry Smith Notes: 211811a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 2119f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 212011a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 2121175b88e8SBarry Smith 21226d6d819aSHong Zhang The number of rows and columns must be divisible by blocksize. 21236d6d819aSHong Zhang This matrix type does not support complex Hermitian operation. 2124c464158bSHong Zhang 21252ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 21262ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 2127651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2128c464158bSHong Zhang 21292ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 213049a6f317SBarry Smith 21311cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2132c464158bSHong Zhang @*/ 2133d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 2134d71ae5a4SJacob Faibussowitsch { 2135c464158bSHong Zhang PetscFunctionBegin; 21369566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 21379566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 21389566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQSBAIJ)); 21399566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*A, bs, nz, (PetscInt *)nnz)); 21403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 214149b5e25fSSatish Balay } 214249b5e25fSSatish Balay 2143d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 2144d71ae5a4SJacob Faibussowitsch { 214549b5e25fSSatish Balay Mat C; 214649b5e25fSSatish Balay Mat_SeqSBAIJ *c, *a = (Mat_SeqSBAIJ *)A->data; 2147b40805acSSatish Balay PetscInt i, mbs = a->mbs, nz = a->nz, bs2 = a->bs2; 214849b5e25fSSatish Balay 214949b5e25fSSatish Balay PetscFunctionBegin; 215031fe6a7dSBarry Smith PetscCheck(A->assembled, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 215108401ef6SPierre Jolivet PetscCheck(a->i[mbs] == nz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Corrupt matrix"); 215249b5e25fSSatish Balay 2153f4259b30SLisandro Dalcin *B = NULL; 21549566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 21559566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->rmap->N, A->cmap->n, A->rmap->N, A->cmap->n)); 21569566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, A)); 21579566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATSEQSBAIJ)); 2158692f9cbeSHong Zhang c = (Mat_SeqSBAIJ *)C->data; 2159692f9cbeSHong Zhang 2160273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2161d5f3da31SBarry Smith C->factortype = A->factortype; 2162f4259b30SLisandro Dalcin c->row = NULL; 2163f4259b30SLisandro Dalcin c->icol = NULL; 2164f4259b30SLisandro Dalcin c->saved_values = NULL; 2165a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 216649b5e25fSSatish Balay C->assembled = PETSC_TRUE; 216749b5e25fSSatish Balay 21689566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 21699566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 217049b5e25fSSatish Balay c->bs2 = a->bs2; 217149b5e25fSSatish Balay c->mbs = a->mbs; 217249b5e25fSSatish Balay c->nbs = a->nbs; 217349b5e25fSSatish Balay 2174c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2175c760cd28SBarry Smith c->imax = a->imax; 2176c760cd28SBarry Smith c->ilen = a->ilen; 2177c760cd28SBarry Smith c->free_imax_ilen = PETSC_FALSE; 2178c760cd28SBarry Smith } else { 21799566063dSJacob Faibussowitsch PetscCall(PetscMalloc2((mbs + 1), &c->imax, (mbs + 1), &c->ilen)); 218049b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 218149b5e25fSSatish Balay c->imax[i] = a->imax[i]; 218249b5e25fSSatish Balay c->ilen[i] = a->ilen[i]; 218349b5e25fSSatish Balay } 2184c760cd28SBarry Smith c->free_imax_ilen = PETSC_TRUE; 2185c760cd28SBarry Smith } 218649b5e25fSSatish Balay 218749b5e25fSSatish Balay /* allocate the matrix space */ 21884da8f245SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 21899566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2 * nz, &c->a)); 219044e1c64aSLisandro Dalcin c->i = a->i; 219144e1c64aSLisandro Dalcin c->j = a->j; 21924da8f245SBarry Smith c->singlemalloc = PETSC_FALSE; 219344e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21944da8f245SBarry Smith c->free_ij = PETSC_FALSE; 21954da8f245SBarry Smith c->parent = A; 21969566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)A)); 21979566063dSJacob Faibussowitsch PetscCall(MatSetOption(A, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21989566063dSJacob Faibussowitsch PetscCall(MatSetOption(C, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21994da8f245SBarry Smith } else { 22009566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &c->a, nz, &c->j, mbs + 1, &c->i)); 22019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, mbs + 1)); 22024da8f245SBarry Smith c->singlemalloc = PETSC_TRUE; 220344e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 22044da8f245SBarry Smith c->free_ij = PETSC_TRUE; 22054da8f245SBarry Smith } 220649b5e25fSSatish Balay if (mbs > 0) { 220748a46eb9SPierre Jolivet if (cpvalues != MAT_SHARE_NONZERO_PATTERN) PetscCall(PetscArraycpy(c->j, a->j, nz)); 220849b5e25fSSatish Balay if (cpvalues == MAT_COPY_VALUES) { 22099566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, a->a, bs2 * nz)); 221049b5e25fSSatish Balay } else { 22119566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, bs2 * nz)); 221249b5e25fSSatish Balay } 2213a1c3900fSBarry Smith if (a->jshort) { 221444e1c64aSLisandro Dalcin /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */ 221544e1c64aSLisandro Dalcin /* if the parent matrix is reassembled, this child matrix will never notice */ 22169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &c->jshort)); 22179566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->jshort, a->jshort, nz)); 221826fbe8dcSKarl Rupp 22194da8f245SBarry Smith c->free_jshort = PETSC_TRUE; 22204da8f245SBarry Smith } 2221a1c3900fSBarry Smith } 222249b5e25fSSatish Balay 222349b5e25fSSatish Balay c->roworiented = a->roworiented; 222449b5e25fSSatish Balay c->nonew = a->nonew; 222549b5e25fSSatish Balay 222649b5e25fSSatish Balay if (a->diag) { 2227c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2228c760cd28SBarry Smith c->diag = a->diag; 2229c760cd28SBarry Smith c->free_diag = PETSC_FALSE; 2230c760cd28SBarry Smith } else { 22319566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mbs, &c->diag)); 223226fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) c->diag[i] = a->diag[i]; 2233c760cd28SBarry Smith c->free_diag = PETSC_TRUE; 2234c760cd28SBarry Smith } 223544e1c64aSLisandro Dalcin } 22366c6c5352SBarry Smith c->nz = a->nz; 2237f2cbd3d5SJed Brown c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 2238f4259b30SLisandro Dalcin c->solve_work = NULL; 2239f4259b30SLisandro Dalcin c->mult_work = NULL; 224026fbe8dcSKarl Rupp 224149b5e25fSSatish Balay *B = C; 22429566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 22433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 224449b5e25fSSatish Balay } 224549b5e25fSSatish Balay 2246618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */ 2247618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary 2248618cc2edSLisandro Dalcin 2249d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqSBAIJ(Mat mat, PetscViewer viewer) 2250d71ae5a4SJacob Faibussowitsch { 22517f489da9SVaclav Hapla PetscBool isbinary; 22522f480046SShri Abhyankar 22532f480046SShri Abhyankar PetscFunctionBegin; 22549566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 225528b400f6SJacob Faibussowitsch PetscCheck(isbinary, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)mat)->type_name); 22569566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqSBAIJ_Binary(mat, viewer)); 22573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22582f480046SShri Abhyankar } 22592f480046SShri Abhyankar 2260c75a6043SHong Zhang /*@ 226111a5261eSBarry Smith MatCreateSeqSBAIJWithArrays - Creates an sequential `MATSEQSBAIJ` matrix using matrix elements 2262c75a6043SHong Zhang (upper triangular entries in CSR format) provided by the user. 2263c75a6043SHong Zhang 2264d083f849SBarry Smith Collective 2265c75a6043SHong Zhang 2266c75a6043SHong Zhang Input Parameters: 2267c75a6043SHong Zhang + comm - must be an MPI communicator of size 1 2268c75a6043SHong Zhang . bs - size of block 2269c75a6043SHong Zhang . m - number of rows 2270c75a6043SHong Zhang . n - number of columns 2271483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that row block row of the matrix 2272c75a6043SHong Zhang . j - column indices 2273c75a6043SHong Zhang - a - matrix values 2274c75a6043SHong Zhang 2275c75a6043SHong Zhang Output Parameter: 2276c75a6043SHong Zhang . mat - the matrix 2277c75a6043SHong Zhang 2278dfb205c3SBarry Smith Level: advanced 2279c75a6043SHong Zhang 2280c75a6043SHong Zhang Notes: 22812ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 2282c75a6043SHong Zhang once the matrix is destroyed 2283c75a6043SHong Zhang 2284c75a6043SHong Zhang You cannot set new nonzero locations into this matrix, that will generate an error. 2285c75a6043SHong Zhang 22862ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 2287c75a6043SHong Zhang 22882ef1f0ffSBarry Smith When block size is greater than 1 the matrix values must be stored using the `MATSBAIJ` storage format. For block size of 1 2289dfb205c3SBarry Smith it is the regular CSR format excluding the lower triangular elements. 2290dfb205c3SBarry Smith 22911cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSBAIJ()`, `MatCreateSeqSBAIJ()` 2292c75a6043SHong Zhang @*/ 2293d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 2294d71ae5a4SJacob Faibussowitsch { 2295c75a6043SHong Zhang PetscInt ii; 2296c75a6043SHong Zhang Mat_SeqSBAIJ *sbaij; 2297c75a6043SHong Zhang 2298c75a6043SHong Zhang PetscFunctionBegin; 229908401ef6SPierre Jolivet PetscCheck(bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "block size %" PetscInt_FMT " > 1 is not supported yet", bs); 2300aed4548fSBarry Smith PetscCheck(m == 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 2301c75a6043SHong Zhang 23029566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 23039566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 23049566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQSBAIJ)); 23059566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*mat, bs, MAT_SKIP_ALLOCATION, NULL)); 2306c75a6043SHong Zhang sbaij = (Mat_SeqSBAIJ *)(*mat)->data; 23079566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(m, &sbaij->imax, m, &sbaij->ilen)); 2308c75a6043SHong Zhang 2309c75a6043SHong Zhang sbaij->i = i; 2310c75a6043SHong Zhang sbaij->j = j; 2311c75a6043SHong Zhang sbaij->a = a; 231226fbe8dcSKarl Rupp 2313c75a6043SHong Zhang sbaij->singlemalloc = PETSC_FALSE; 2314c75a6043SHong Zhang sbaij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 2315e6b907acSBarry Smith sbaij->free_a = PETSC_FALSE; 2316e6b907acSBarry Smith sbaij->free_ij = PETSC_FALSE; 2317ddf7884eSMatthew Knepley sbaij->free_imax_ilen = PETSC_TRUE; 2318c75a6043SHong Zhang 2319c75a6043SHong Zhang for (ii = 0; ii < m; ii++) { 2320c75a6043SHong Zhang sbaij->ilen[ii] = sbaij->imax[ii] = i[ii + 1] - i[ii]; 23216bdcaf15SBarry Smith PetscCheck(i[ii + 1] >= i[ii], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 2322c75a6043SHong Zhang } 232376bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 2324c75a6043SHong Zhang for (ii = 0; ii < sbaij->i[m]; ii++) { 23256bdcaf15SBarry Smith PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 23266bdcaf15SBarry Smith PetscCheck(j[ii] < n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index too large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 2327c75a6043SHong Zhang } 232876bd3646SJed Brown } 2329c75a6043SHong Zhang 23309566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 23319566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 23323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2333c75a6043SHong Zhang } 2334d06b337dSHong Zhang 2335d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 2336d71ae5a4SJacob Faibussowitsch { 233759f5e6ceSHong Zhang PetscFunctionBegin; 23389566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm, inmat, n, scall, outmat)); 23393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 234059f5e6ceSHong Zhang } 2341