149b5e25fSSatish Balay 249b5e25fSSatish Balay /* 3a1373b80SHong Zhang Defines the basic matrix operations for the SBAIJ (compressed row) 449b5e25fSSatish Balay matrix storage format. 549b5e25fSSatish Balay */ 6c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 8c6db04a5SJed Brown #include <petscblaslapack.h> 949b5e25fSSatish Balay 10c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1170dcbbb9SBarry Smith #define USESHORT 12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1370dcbbb9SBarry Smith 146214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 15cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 166214f412SHong Zhang #endif 17d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 18d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 19d24d4204SJose E. Roman #endif 2028d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat, MatType, MatReuse, Mat *); 21b5b17502SBarry Smith 2249b5e25fSSatish Balay /* 2349b5e25fSSatish Balay Checks for missing diagonals 2449b5e25fSSatish Balay */ 25d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A, PetscBool *missing, PetscInt *dd) 26d71ae5a4SJacob Faibussowitsch { 27045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 287734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 2949b5e25fSSatish Balay 3049b5e25fSSatish Balay PetscFunctionBegin; 319566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(A)); 322af78befSBarry Smith *missing = PETSC_FALSE; 337734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 34358d2f5dSShri Abhyankar *missing = PETSC_TRUE; 35358d2f5dSShri Abhyankar if (dd) *dd = 0; 369566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 37358d2f5dSShri Abhyankar } else { 38358d2f5dSShri Abhyankar diag = a->diag; 3949b5e25fSSatish Balay for (i = 0; i < a->mbs; i++) { 407734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 412af78befSBarry Smith *missing = PETSC_TRUE; 422af78befSBarry Smith if (dd) *dd = i; 432af78befSBarry Smith break; 442af78befSBarry Smith } 4549b5e25fSSatish Balay } 46358d2f5dSShri Abhyankar } 473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 4849b5e25fSSatish Balay } 4949b5e25fSSatish Balay 50d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A) 51d71ae5a4SJacob Faibussowitsch { 52045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 5348dd3d27SHong Zhang PetscInt i, j; 5449b5e25fSSatish Balay 5549b5e25fSSatish Balay PetscFunctionBegin; 5609f38230SBarry Smith if (!a->diag) { 579566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->mbs, &a->diag)); 58c760cd28SBarry Smith a->free_diag = PETSC_TRUE; 5909f38230SBarry Smith } 6048dd3d27SHong Zhang for (i = 0; i < a->mbs; i++) { 6148dd3d27SHong Zhang a->diag[i] = a->i[i + 1]; 6248dd3d27SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 6348dd3d27SHong Zhang if (a->j[j] == i) { 6448dd3d27SHong Zhang a->diag[i] = j; 6548dd3d27SHong Zhang break; 6648dd3d27SHong Zhang } 6748dd3d27SHong Zhang } 6848dd3d27SHong Zhang } 693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 7049b5e25fSSatish Balay } 7149b5e25fSSatish Balay 72d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *inia[], const PetscInt *inja[], PetscBool *done) 73d71ae5a4SJacob Faibussowitsch { 74a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 752462f5fdSStefano Zampini PetscInt i, j, n = a->mbs, nz = a->i[n], *tia, *tja, bs = A->rmap->bs, k, l, cnt; 762462f5fdSStefano Zampini PetscInt **ia = (PetscInt **)inia, **ja = (PetscInt **)inja; 7749b5e25fSSatish Balay 7849b5e25fSSatish Balay PetscFunctionBegin; 79d3e5a4abSHong Zhang *nn = n; 803ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 812462f5fdSStefano Zampini if (symmetric) { 829566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(n, a->i, a->j, PETSC_FALSE, 0, 0, &tia, &tja)); 832462f5fdSStefano Zampini nz = tia[n]; 842462f5fdSStefano Zampini } else { 859371c9d4SSatish Balay tia = a->i; 869371c9d4SSatish Balay tja = a->j; 872462f5fdSStefano Zampini } 882462f5fdSStefano Zampini 892462f5fdSStefano Zampini if (!blockcompressed && bs > 1) { 902462f5fdSStefano Zampini (*nn) *= bs; 918f7157efSSatish Balay /* malloc & create the natural set of indices */ 929566063dSJacob Faibussowitsch PetscCall(PetscMalloc1((n + 1) * bs, ia)); 932462f5fdSStefano Zampini if (n) { 942462f5fdSStefano Zampini (*ia)[0] = oshift; 95ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[j] = (tia[1] - tia[0]) * bs + (*ia)[j - 1]; 962462f5fdSStefano Zampini } 972462f5fdSStefano Zampini 982462f5fdSStefano Zampini for (i = 1; i < n; i++) { 992462f5fdSStefano Zampini (*ia)[i * bs] = (tia[i] - tia[i - 1]) * bs + (*ia)[i * bs - 1]; 100ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[i * bs + j] = (tia[i + 1] - tia[i]) * bs + (*ia)[i * bs + j - 1]; 1012462f5fdSStefano Zampini } 102ad540459SPierre Jolivet if (n) (*ia)[n * bs] = (tia[n] - tia[n - 1]) * bs + (*ia)[n * bs - 1]; 1032462f5fdSStefano Zampini 1042462f5fdSStefano Zampini if (inja) { 1059566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz * bs * bs, ja)); 1062462f5fdSStefano Zampini cnt = 0; 1072462f5fdSStefano Zampini for (i = 0; i < n; i++) { 1088f7157efSSatish Balay for (j = 0; j < bs; j++) { 1092462f5fdSStefano Zampini for (k = tia[i]; k < tia[i + 1]; k++) { 110ad540459SPierre Jolivet for (l = 0; l < bs; l++) (*ja)[cnt++] = bs * tja[k] + l; 1118f7157efSSatish Balay } 1128f7157efSSatish Balay } 1138f7157efSSatish Balay } 1148f7157efSSatish Balay } 1152462f5fdSStefano Zampini 1162462f5fdSStefano Zampini if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */ 1179566063dSJacob Faibussowitsch PetscCall(PetscFree(tia)); 1189566063dSJacob Faibussowitsch PetscCall(PetscFree(tja)); 1192462f5fdSStefano Zampini } 1202462f5fdSStefano Zampini } else if (oshift == 1) { 1212462f5fdSStefano Zampini if (symmetric) { 1222462f5fdSStefano Zampini nz = tia[A->rmap->n / bs]; 1232462f5fdSStefano Zampini /* add 1 to i and j indices */ 1242462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) tia[i] = tia[i] + 1; 1252462f5fdSStefano Zampini *ia = tia; 1262462f5fdSStefano Zampini if (ja) { 1272462f5fdSStefano Zampini for (i = 0; i < nz; i++) tja[i] = tja[i] + 1; 1282462f5fdSStefano Zampini *ja = tja; 1292462f5fdSStefano Zampini } 1302462f5fdSStefano Zampini } else { 1312462f5fdSStefano Zampini nz = a->i[A->rmap->n / bs]; 1322462f5fdSStefano Zampini /* malloc space and add 1 to i and j indices */ 1339566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n / bs + 1, ia)); 1342462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) (*ia)[i] = a->i[i] + 1; 1352462f5fdSStefano Zampini if (ja) { 1369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, ja)); 1372462f5fdSStefano Zampini for (i = 0; i < nz; i++) (*ja)[i] = a->j[i] + 1; 1382462f5fdSStefano Zampini } 1392462f5fdSStefano Zampini } 1402462f5fdSStefano Zampini } else { 1412462f5fdSStefano Zampini *ia = tia; 1422462f5fdSStefano Zampini if (ja) *ja = tja; 143a6ece127SHong Zhang } 1443ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 14549b5e25fSSatish Balay } 14649b5e25fSSatish Balay 147d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 148d71ae5a4SJacob Faibussowitsch { 14949b5e25fSSatish Balay PetscFunctionBegin; 1503ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 1512462f5fdSStefano Zampini if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) { 1529566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 1539566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 154a6ece127SHong Zhang } 1553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 15649b5e25fSSatish Balay } 15749b5e25fSSatish Balay 158d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqSBAIJ(Mat A) 159d71ae5a4SJacob Faibussowitsch { 16049b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 16149b5e25fSSatish Balay 16249b5e25fSSatish Balay PetscFunctionBegin; 163a9f03627SSatish Balay #if defined(PETSC_USE_LOG) 1643ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->N, a->nz)); 165a9f03627SSatish Balay #endif 1669566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 1679566063dSJacob Faibussowitsch if (a->free_diag) PetscCall(PetscFree(a->diag)); 1689566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1699566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1709566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 1719566063dSJacob Faibussowitsch PetscCall(PetscFree(a->idiag)); 1729566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inode.size)); 1739566063dSJacob Faibussowitsch if (a->free_imax_ilen) PetscCall(PetscFree2(a->imax, a->ilen)); 1749566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 1759566063dSJacob Faibussowitsch PetscCall(PetscFree(a->sor_work)); 1769566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solves_work)); 1779566063dSJacob Faibussowitsch PetscCall(PetscFree(a->mult_work)); 1789566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 1799566063dSJacob Faibussowitsch if (a->free_jshort) PetscCall(PetscFree(a->jshort)); 1809566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inew)); 1819566063dSJacob Faibussowitsch PetscCall(MatDestroy(&a->parent)); 1829566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 183901853e0SKris Buschelman 1849566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 1852e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJGetArray_C", NULL)); 1862e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJRestoreArray_C", NULL)); 1879566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 1889566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 1899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetColumnIndices_C", NULL)); 1909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqaij_C", NULL)); 1919566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqbaij_C", NULL)); 1929566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocation_C", NULL)); 1939566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocationCSR_C", NULL)); 1946214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 1959566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_elemental_C", NULL)); 1966214f412SHong Zhang #endif 197d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 1989566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_scalapack_C", NULL)); 199d24d4204SJose E. Roman #endif 2002e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 2013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 20249b5e25fSSatish Balay } 20349b5e25fSSatish Balay 204d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqSBAIJ(Mat A, MatOption op, PetscBool flg) 205d71ae5a4SJacob Faibussowitsch { 206045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 207eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 208eb1ec7c1SStefano Zampini PetscInt bs; 209eb1ec7c1SStefano Zampini #endif 21049b5e25fSSatish Balay 21149b5e25fSSatish Balay PetscFunctionBegin; 212eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 2139566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 214eb1ec7c1SStefano Zampini #endif 2154d9d31abSKris Buschelman switch (op) { 216d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 217d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 218d71ae5a4SJacob Faibussowitsch break; 219d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 220d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 221d71ae5a4SJacob Faibussowitsch break; 222d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 223d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 224d71ae5a4SJacob Faibussowitsch break; 225d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 226d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 227d71ae5a4SJacob Faibussowitsch break; 228d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 229d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 230d71ae5a4SJacob Faibussowitsch break; 231d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 232d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 233d71ae5a4SJacob Faibussowitsch break; 2348c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 2354d9d31abSKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 2364d9d31abSKris Buschelman case MAT_USE_HASH_TABLE: 237d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 238d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 239d71ae5a4SJacob Faibussowitsch break; 2409a4540c5SBarry Smith case MAT_HERMITIAN: 241eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 242eb1ec7c1SStefano Zampini if (flg) { /* disable transpose ops */ 24308401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for Hermitian with block size greater than 1"); 244eb1ec7c1SStefano Zampini A->ops->multtranspose = NULL; 245eb1ec7c1SStefano Zampini A->ops->multtransposeadd = NULL; 246b94d7dedSBarry Smith A->symmetric = PETSC_BOOL3_FALSE; 247eb1ec7c1SStefano Zampini } 2480f2140c7SStefano Zampini #endif 249eeffb40dSHong Zhang break; 25077e54ba9SKris Buschelman case MAT_SYMMETRIC: 251eb1ec7c1SStefano Zampini case MAT_SPD: 252eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 253eb1ec7c1SStefano Zampini if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */ 254eb1ec7c1SStefano Zampini A->ops->multtranspose = A->ops->mult; 255eb1ec7c1SStefano Zampini A->ops->multtransposeadd = A->ops->multadd; 256eb1ec7c1SStefano Zampini } 257eb1ec7c1SStefano Zampini #endif 258eb1ec7c1SStefano Zampini break; 259eb1ec7c1SStefano Zampini /* These options are handled directly by MatSetOption() */ 26077e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 2619a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 262b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 263672ba085SHong Zhang case MAT_STRUCTURE_ONLY: 264b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 2654dcd73b1SHong Zhang /* These options are handled directly by MatSetOption() */ 266290bbb0aSBarry Smith break; 267d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_LOWER_TRIANGULAR: 268d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 269d71ae5a4SJacob Faibussowitsch break; 270d71ae5a4SJacob Faibussowitsch case MAT_ERROR_LOWER_TRIANGULAR: 271d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 272d71ae5a4SJacob Faibussowitsch break; 273d71ae5a4SJacob Faibussowitsch case MAT_GETROW_UPPERTRIANGULAR: 274d71ae5a4SJacob Faibussowitsch a->getrow_utriangular = flg; 275d71ae5a4SJacob Faibussowitsch break; 276d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 277d71ae5a4SJacob Faibussowitsch break; 278d71ae5a4SJacob Faibussowitsch default: 279d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 28049b5e25fSSatish Balay } 2813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 28249b5e25fSSatish Balay } 28349b5e25fSSatish Balay 284d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 285d71ae5a4SJacob Faibussowitsch { 28649b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 28749b5e25fSSatish Balay 28849b5e25fSSatish Balay PetscFunctionBegin; 28908401ef6SPierre Jolivet PetscCheck(!A || a->getrow_utriangular, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatGetRow is not supported for SBAIJ matrix format. Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()"); 29052768537SHong Zhang 291f5edf698SHong Zhang /* Get the upper triangular part of the row */ 2929566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqBAIJ_private(A, row, nz, idx, v, a->i, a->j, a->a)); 2933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 29449b5e25fSSatish Balay } 29549b5e25fSSatish Balay 296d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 297d71ae5a4SJacob Faibussowitsch { 29849b5e25fSSatish Balay PetscFunctionBegin; 299cb4a9cd9SHong Zhang if (nz) *nz = 0; 3009566063dSJacob Faibussowitsch if (idx) PetscCall(PetscFree(*idx)); 3019566063dSJacob Faibussowitsch if (v) PetscCall(PetscFree(*v)); 3023ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 30349b5e25fSSatish Balay } 30449b5e25fSSatish Balay 305d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A) 306d71ae5a4SJacob Faibussowitsch { 307f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 308f5edf698SHong Zhang 309f5edf698SHong Zhang PetscFunctionBegin; 310f5edf698SHong Zhang a->getrow_utriangular = PETSC_TRUE; 3113ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 312f5edf698SHong Zhang } 313a323099bSStefano Zampini 314d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A) 315d71ae5a4SJacob Faibussowitsch { 316f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 317f5edf698SHong Zhang 318f5edf698SHong Zhang PetscFunctionBegin; 319f5edf698SHong Zhang a->getrow_utriangular = PETSC_FALSE; 3203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 321f5edf698SHong Zhang } 322f5edf698SHong Zhang 323d71ae5a4SJacob Faibussowitsch PetscErrorCode MatTranspose_SeqSBAIJ(Mat A, MatReuse reuse, Mat *B) 324d71ae5a4SJacob Faibussowitsch { 32549b5e25fSSatish Balay PetscFunctionBegin; 3267fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 327cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 3289566063dSJacob Faibussowitsch PetscCall(MatDuplicate(A, MAT_COPY_VALUES, B)); 329cf37664fSBarry Smith } else if (reuse == MAT_REUSE_MATRIX) { 3309566063dSJacob Faibussowitsch PetscCall(MatCopy(A, *B, SAME_NONZERO_PATTERN)); 331fc4dec0aSBarry Smith } 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 33349b5e25fSSatish Balay } 33449b5e25fSSatish Balay 335d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A, PetscViewer viewer) 336d71ae5a4SJacob Faibussowitsch { 33749b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 338d0f46423SBarry Smith PetscInt i, j, bs = A->rmap->bs, k, l, bs2 = a->bs2; 339f3ef73ceSBarry Smith PetscViewerFormat format; 340121deb67SSatish Balay PetscInt *diag; 341*b3a0534dSBarry Smith const char *matname; 34249b5e25fSSatish Balay 34349b5e25fSSatish Balay PetscFunctionBegin; 3449566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 345456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 3469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " block size is %" PetscInt_FMT "\n", bs)); 347fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_MATLAB) { 348d2507d54SMatthew Knepley Mat aij; 349ade3a672SBarry Smith 350d5f3da31SBarry Smith if (A->factortype && bs > 1) { 3519566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "Warning: matrix is factored with bs>1. MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n")); 3523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 35370d5e725SHong Zhang } 3549566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &aij)); 35523a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 35623a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)aij, matname)); 35723a3927dSBarry Smith PetscCall(MatView_SeqAIJ(aij, viewer)); 3589566063dSJacob Faibussowitsch PetscCall(MatDestroy(&aij)); 359fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 360*b3a0534dSBarry Smith Mat B; 361*b3a0534dSBarry Smith 362*b3a0534dSBarry Smith PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 363*b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 364*b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 365*b3a0534dSBarry Smith PetscCall(MatView_SeqAIJ(B, viewer)); 366*b3a0534dSBarry Smith PetscCall(MatDestroy(&B)); 367c1490034SHong Zhang } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) { 3683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 36949b5e25fSSatish Balay } else { 3709566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 3712c990fa1SHong Zhang if (A->factortype) { /* for factored matrix */ 37208401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "matrix is factored with bs>1. Not implemented yet"); 3732c990fa1SHong Zhang 374121deb67SSatish Balay diag = a->diag; 375121deb67SSatish Balay for (i = 0; i < a->mbs; i++) { /* for row block i */ 3769566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 3772c990fa1SHong Zhang /* diagonal entry */ 3782c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 3792c990fa1SHong Zhang if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) { 3809566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), (double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 3812c990fa1SHong Zhang } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) { 3829566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), -(double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 3832c990fa1SHong Zhang } else { 3849566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]))); 3852c990fa1SHong Zhang } 3862c990fa1SHong Zhang #else 3879566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)(1.0 / a->a[diag[i]]))); 3882c990fa1SHong Zhang #endif 3892c990fa1SHong Zhang /* off-diagonal entries */ 3902c990fa1SHong Zhang for (k = a->i[i]; k < a->i[i + 1] - 1; k++) { 3912c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 392ca0704adSBarry Smith if (PetscImaginaryPart(a->a[k]) > 0.0) { 3939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), (double)PetscImaginaryPart(a->a[k]))); 394ca0704adSBarry Smith } else if (PetscImaginaryPart(a->a[k]) < 0.0) { 3959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), -(double)PetscImaginaryPart(a->a[k]))); 3962c990fa1SHong Zhang } else { 3979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k], (double)PetscRealPart(a->a[k]))); 3982c990fa1SHong Zhang } 3992c990fa1SHong Zhang #else 4009566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[k], (double)a->a[k])); 4012c990fa1SHong Zhang #endif 4022c990fa1SHong Zhang } 4039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 4042c990fa1SHong Zhang } 4052c990fa1SHong Zhang 4062c990fa1SHong Zhang } else { /* for non-factored matrix */ 4070c74a584SJed Brown for (i = 0; i < a->mbs; i++) { /* for row block i */ 4080c74a584SJed Brown for (j = 0; j < bs; j++) { /* for row bs*i + j */ 4099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i * bs + j)); 4100c74a584SJed Brown for (k = a->i[i]; k < a->i[i + 1]; k++) { /* for column block */ 4110c74a584SJed Brown for (l = 0; l < bs; l++) { /* for column */ 41249b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 41349b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) > 0.0) { 4149371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), (double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 41549b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) < 0.0) { 4169371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), -(double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 41749b5e25fSSatish Balay } else { 4189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]))); 41949b5e25fSSatish Balay } 42049b5e25fSSatish Balay #else 4219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)a->a[bs2 * k + l * bs + j])); 42249b5e25fSSatish Balay #endif 42349b5e25fSSatish Balay } 42449b5e25fSSatish Balay } 4259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 42649b5e25fSSatish Balay } 42749b5e25fSSatish Balay } 4282c990fa1SHong Zhang } 4299566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 43049b5e25fSSatish Balay } 4319566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 4323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 43349b5e25fSSatish Balay } 43449b5e25fSSatish Balay 4359804daf3SBarry Smith #include <petscdraw.h> 436d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 437d71ae5a4SJacob Faibussowitsch { 43849b5e25fSSatish Balay Mat A = (Mat)Aa; 43949b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 440d0f46423SBarry Smith PetscInt row, i, j, k, l, mbs = a->mbs, color, bs = A->rmap->bs, bs2 = a->bs2; 44149b5e25fSSatish Balay PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 44249b5e25fSSatish Balay MatScalar *aa; 443b0a32e0cSBarry Smith PetscViewer viewer; 44449b5e25fSSatish Balay 44549b5e25fSSatish Balay PetscFunctionBegin; 4469566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 4479566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 44849b5e25fSSatish Balay 44949b5e25fSSatish Balay /* loop over matrix elements drawing boxes */ 450383922c3SLisandro Dalcin 451d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 4529566063dSJacob Faibussowitsch PetscCall(PetscDrawString(draw, .3 * (xl + xr), .3 * (yl + yr), PETSC_DRAW_BLACK, "symmetric")); 453383922c3SLisandro Dalcin /* Blue for negative, Cyan for zero and Red for positive */ 454b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 45549b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 45649b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4579371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4589371c9d4SSatish Balay y_r = y_l + 1.0; 4599371c9d4SSatish Balay x_l = a->j[j] * bs; 4609371c9d4SSatish Balay x_r = x_l + 1.0; 46149b5e25fSSatish Balay aa = a->a + j * bs2; 46249b5e25fSSatish Balay for (k = 0; k < bs; k++) { 46349b5e25fSSatish Balay for (l = 0; l < bs; l++) { 46449b5e25fSSatish Balay if (PetscRealPart(*aa++) >= 0.) continue; 4659566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 46649b5e25fSSatish Balay } 46749b5e25fSSatish Balay } 46849b5e25fSSatish Balay } 46949b5e25fSSatish Balay } 470b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 47149b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 47249b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4739371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4749371c9d4SSatish Balay y_r = y_l + 1.0; 4759371c9d4SSatish Balay x_l = a->j[j] * bs; 4769371c9d4SSatish Balay x_r = x_l + 1.0; 47749b5e25fSSatish Balay aa = a->a + j * bs2; 47849b5e25fSSatish Balay for (k = 0; k < bs; k++) { 47949b5e25fSSatish Balay for (l = 0; l < bs; l++) { 48049b5e25fSSatish Balay if (PetscRealPart(*aa++) != 0.) continue; 4819566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 48249b5e25fSSatish Balay } 48349b5e25fSSatish Balay } 48449b5e25fSSatish Balay } 48549b5e25fSSatish Balay } 486b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 48749b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 48849b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4899371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4909371c9d4SSatish Balay y_r = y_l + 1.0; 4919371c9d4SSatish Balay x_l = a->j[j] * bs; 4929371c9d4SSatish Balay x_r = x_l + 1.0; 49349b5e25fSSatish Balay aa = a->a + j * bs2; 49449b5e25fSSatish Balay for (k = 0; k < bs; k++) { 49549b5e25fSSatish Balay for (l = 0; l < bs; l++) { 49649b5e25fSSatish Balay if (PetscRealPart(*aa++) <= 0.) continue; 4979566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 49849b5e25fSSatish Balay } 49949b5e25fSSatish Balay } 50049b5e25fSSatish Balay } 50149b5e25fSSatish Balay } 502d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 5033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 50449b5e25fSSatish Balay } 50549b5e25fSSatish Balay 506d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A, PetscViewer viewer) 507d71ae5a4SJacob Faibussowitsch { 50849b5e25fSSatish Balay PetscReal xl, yl, xr, yr, w, h; 509b0a32e0cSBarry Smith PetscDraw draw; 510ace3abfcSBarry Smith PetscBool isnull; 51149b5e25fSSatish Balay 51249b5e25fSSatish Balay PetscFunctionBegin; 5139566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 5149566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 5153ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 51649b5e25fSSatish Balay 5179371c9d4SSatish Balay xr = A->rmap->N; 5189371c9d4SSatish Balay yr = A->rmap->N; 5199371c9d4SSatish Balay h = yr / 10.0; 5209371c9d4SSatish Balay w = xr / 10.0; 5219371c9d4SSatish Balay xr += w; 5229371c9d4SSatish Balay yr += h; 5239371c9d4SSatish Balay xl = -w; 5249371c9d4SSatish Balay yl = -h; 5259566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 5269566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 5279566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqSBAIJ_Draw_Zoom, A)); 5289566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 5299566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 5303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 53149b5e25fSSatish Balay } 53249b5e25fSSatish Balay 533618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */ 534618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary 535618cc2edSLisandro Dalcin 536d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ(Mat A, PetscViewer viewer) 537d71ae5a4SJacob Faibussowitsch { 538618cc2edSLisandro Dalcin PetscBool iascii, isbinary, isdraw; 53949b5e25fSSatish Balay 54049b5e25fSSatish Balay PetscFunctionBegin; 5419566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 5429566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 5439566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 54432077d6dSBarry Smith if (iascii) { 5459566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_ASCII(A, viewer)); 546618cc2edSLisandro Dalcin } else if (isbinary) { 5479566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Binary(A, viewer)); 54849b5e25fSSatish Balay } else if (isdraw) { 5499566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Draw(A, viewer)); 55049b5e25fSSatish Balay } else { 551a5e6ed63SBarry Smith Mat B; 552ade3a672SBarry Smith const char *matname; 5539566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 55423a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 55523a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 5569566063dSJacob Faibussowitsch PetscCall(MatView(B, viewer)); 5579566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 55849b5e25fSSatish Balay } 5593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 56049b5e25fSSatish Balay } 56149b5e25fSSatish Balay 562d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 563d71ae5a4SJacob Faibussowitsch { 564045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 56513f74950SBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 56613f74950SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 567d0f46423SBarry Smith PetscInt brow, bcol, ridx, cidx, bs = A->rmap->bs, bs2 = a->bs2; 56897e567efSBarry Smith MatScalar *ap, *aa = a->a; 56949b5e25fSSatish Balay 57049b5e25fSSatish Balay PetscFunctionBegin; 57149b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over rows */ 5729371c9d4SSatish Balay row = im[k]; 5739371c9d4SSatish Balay brow = row / bs; 5749371c9d4SSatish Balay if (row < 0) { 5759371c9d4SSatish Balay v += n; 5769371c9d4SSatish Balay continue; 5779371c9d4SSatish Balay } /* negative row */ 57854c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 5799371c9d4SSatish Balay rp = aj + ai[brow]; 5809371c9d4SSatish Balay ap = aa + bs2 * ai[brow]; 58149b5e25fSSatish Balay nrow = ailen[brow]; 58249b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over columns */ 5839371c9d4SSatish Balay if (in[l] < 0) { 5849371c9d4SSatish Balay v++; 5859371c9d4SSatish Balay continue; 5869371c9d4SSatish Balay } /* negative column */ 58754c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 58849b5e25fSSatish Balay col = in[l]; 58949b5e25fSSatish Balay bcol = col / bs; 59049b5e25fSSatish Balay cidx = col % bs; 59149b5e25fSSatish Balay ridx = row % bs; 59249b5e25fSSatish Balay high = nrow; 59349b5e25fSSatish Balay low = 0; /* assume unsorted */ 59449b5e25fSSatish Balay while (high - low > 5) { 59549b5e25fSSatish Balay t = (low + high) / 2; 59649b5e25fSSatish Balay if (rp[t] > bcol) high = t; 59749b5e25fSSatish Balay else low = t; 59849b5e25fSSatish Balay } 59949b5e25fSSatish Balay for (i = low; i < high; i++) { 60049b5e25fSSatish Balay if (rp[i] > bcol) break; 60149b5e25fSSatish Balay if (rp[i] == bcol) { 60249b5e25fSSatish Balay *v++ = ap[bs2 * i + bs * cidx + ridx]; 60349b5e25fSSatish Balay goto finished; 60449b5e25fSSatish Balay } 60549b5e25fSSatish Balay } 60697e567efSBarry Smith *v++ = 0.0; 60749b5e25fSSatish Balay finished:; 60849b5e25fSSatish Balay } 60949b5e25fSSatish Balay } 6103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 61149b5e25fSSatish Balay } 61249b5e25fSSatish Balay 613d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqSBAIJ(Mat A, IS rowp, IS colp, Mat *B) 614d71ae5a4SJacob Faibussowitsch { 615dc29a518SPierre Jolivet Mat C; 616dc29a518SPierre Jolivet 617dc29a518SPierre Jolivet PetscFunctionBegin; 6189566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQBAIJ, MAT_INITIAL_MATRIX, &C)); 6199566063dSJacob Faibussowitsch PetscCall(MatPermute(C, rowp, colp, B)); 6209566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 62148a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatConvert(*B, MATSEQSBAIJ, MAT_INPLACE_MATRIX, B)); 6223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 623dc29a518SPierre Jolivet } 62449b5e25fSSatish Balay 625d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 626d71ae5a4SJacob Faibussowitsch { 6270880e062SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 628e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, jj, row, nrow, i, col, l, rmax, N, lastcol = -1; 62913f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 630d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs2 = a->bs2, bs = A->rmap->bs, stepval; 631ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 632dd6ea824SBarry Smith const PetscScalar *value = v; 633f15d580aSBarry Smith MatScalar *ap, *aa = a->a, *bap; 6340880e062SHong Zhang 63549b5e25fSSatish Balay PetscFunctionBegin; 63626fbe8dcSKarl Rupp if (roworiented) stepval = (n - 1) * bs; 63726fbe8dcSKarl Rupp else stepval = (m - 1) * bs; 63826fbe8dcSKarl Rupp 6390880e062SHong Zhang for (k = 0; k < m; k++) { /* loop over added rows */ 6400880e062SHong Zhang row = im[k]; 6410880e062SHong Zhang if (row < 0) continue; 6426bdcaf15SBarry Smith PetscCheck(row < a->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index row too large %" PetscInt_FMT " max %" PetscInt_FMT, row, a->mbs - 1); 6430880e062SHong Zhang rp = aj + ai[row]; 6440880e062SHong Zhang ap = aa + bs2 * ai[row]; 6450880e062SHong Zhang rmax = imax[row]; 6460880e062SHong Zhang nrow = ailen[row]; 6470880e062SHong Zhang low = 0; 648818f2c47SBarry Smith high = nrow; 6490880e062SHong Zhang for (l = 0; l < n; l++) { /* loop over added columns */ 6500880e062SHong Zhang if (in[l] < 0) continue; 6510880e062SHong Zhang col = in[l]; 6526bdcaf15SBarry Smith PetscCheck(col < a->nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index column too large %" PetscInt_FMT " max %" PetscInt_FMT, col, a->nbs - 1); 653b98bf0e1SJed Brown if (col < row) { 65426fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular block */ 65526fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 656b98bf0e1SJed Brown } 65726fbe8dcSKarl Rupp if (roworiented) value = v + k * (stepval + bs) * bs + l * bs; 65826fbe8dcSKarl Rupp else value = v + l * (stepval + bs) * bs + k * bs; 65926fbe8dcSKarl Rupp 66026fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 66126fbe8dcSKarl Rupp else high = nrow; 66226fbe8dcSKarl Rupp 663e2ee6c50SBarry Smith lastcol = col; 6640880e062SHong Zhang while (high - low > 7) { 6650880e062SHong Zhang t = (low + high) / 2; 6660880e062SHong Zhang if (rp[t] > col) high = t; 6670880e062SHong Zhang else low = t; 6680880e062SHong Zhang } 6690880e062SHong Zhang for (i = low; i < high; i++) { 6700880e062SHong Zhang if (rp[i] > col) break; 6710880e062SHong Zhang if (rp[i] == col) { 6720880e062SHong Zhang bap = ap + bs2 * i; 6730880e062SHong Zhang if (roworiented) { 6740880e062SHong Zhang if (is == ADD_VALUES) { 6750880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 676ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] += *value++; 6770880e062SHong Zhang } 6780880e062SHong Zhang } else { 6790880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 680ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 6810880e062SHong Zhang } 6820880e062SHong Zhang } 6830880e062SHong Zhang } else { 6840880e062SHong Zhang if (is == ADD_VALUES) { 6850880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 686ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ += *value++; 6870880e062SHong Zhang } 6880880e062SHong Zhang } else { 6890880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 690ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 6910880e062SHong Zhang } 6920880e062SHong Zhang } 6930880e062SHong Zhang } 6940880e062SHong Zhang goto noinsert2; 6950880e062SHong Zhang } 6960880e062SHong Zhang } 6970880e062SHong Zhang if (nonew == 1) goto noinsert2; 69808401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new block index nonzero block (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 699fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 7009371c9d4SSatish Balay N = nrow++ - 1; 7019371c9d4SSatish Balay high++; 7020880e062SHong Zhang /* shift up all the later entries in this row */ 7039566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 7049566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 7059566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 7060880e062SHong Zhang rp[i] = col; 7070880e062SHong Zhang bap = ap + bs2 * i; 7080880e062SHong Zhang if (roworiented) { 7090880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 710ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7110880e062SHong Zhang } 7120880e062SHong Zhang } else { 7130880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 714ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7150880e062SHong Zhang } 7160880e062SHong Zhang } 7170880e062SHong Zhang noinsert2:; 7180880e062SHong Zhang low = i; 7190880e062SHong Zhang } 7200880e062SHong Zhang ailen[row] = nrow; 7210880e062SHong Zhang } 7223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 72349b5e25fSSatish Balay } 72449b5e25fSSatish Balay 72564831d72SBarry Smith /* 72664831d72SBarry Smith This is not yet used 72764831d72SBarry Smith */ 728d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ_SeqAIJ_Inode(Mat A) 729d71ae5a4SJacob Faibussowitsch { 7300def2e27SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 7310def2e27SBarry Smith const PetscInt *ai = a->i, *aj = a->j, *cols; 7320def2e27SBarry Smith PetscInt i = 0, j, blk_size, m = A->rmap->n, node_count = 0, nzx, nzy, *ns, row, nz, cnt, cnt2, *counts; 733ace3abfcSBarry Smith PetscBool flag; 7340def2e27SBarry Smith 7350def2e27SBarry Smith PetscFunctionBegin; 7369566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m, &ns)); 7370def2e27SBarry Smith while (i < m) { 7380def2e27SBarry Smith nzx = ai[i + 1] - ai[i]; /* Number of nonzeros */ 7390def2e27SBarry Smith /* Limits the number of elements in a node to 'a->inode.limit' */ 7400def2e27SBarry Smith for (j = i + 1, blk_size = 1; j < m && blk_size < a->inode.limit; ++j, ++blk_size) { 7410def2e27SBarry Smith nzy = ai[j + 1] - ai[j]; 7420def2e27SBarry Smith if (nzy != (nzx - j + i)) break; 7439566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(aj + ai[i] + j - i, aj + ai[j], nzy, &flag)); 7440def2e27SBarry Smith if (!flag) break; 7450def2e27SBarry Smith } 7460def2e27SBarry Smith ns[node_count++] = blk_size; 74726fbe8dcSKarl Rupp 7480def2e27SBarry Smith i = j; 7490def2e27SBarry Smith } 7500def2e27SBarry Smith if (!a->inode.size && m && node_count > .9 * m) { 7519566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7529566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes out of %" PetscInt_FMT " rows. Not using Inode routines\n", node_count, m)); 7530def2e27SBarry Smith } else { 7540def2e27SBarry Smith a->inode.node_count = node_count; 75526fbe8dcSKarl Rupp 7569566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(node_count, &a->inode.size)); 7579566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(a->inode.size, ns, node_count)); 7589566063dSJacob Faibussowitsch PetscCall(PetscFree(ns)); 7599566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes of %" PetscInt_FMT ". Limit used: %" PetscInt_FMT ". Using Inode routines\n", node_count, m, a->inode.limit)); 7600def2e27SBarry Smith 7610def2e27SBarry Smith /* count collections of adjacent columns in each inode */ 7620def2e27SBarry Smith row = 0; 7630def2e27SBarry Smith cnt = 0; 7640def2e27SBarry Smith for (i = 0; i < node_count; i++) { 7650def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7660def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 7670def2e27SBarry Smith for (j = 1; j < nz; j++) { 76826fbe8dcSKarl Rupp if (cols[j] != cols[j - 1] + 1) cnt++; 7690def2e27SBarry Smith } 7700def2e27SBarry Smith cnt++; 7710def2e27SBarry Smith row += a->inode.size[i]; 7720def2e27SBarry Smith } 7739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(2 * cnt, &counts)); 7740def2e27SBarry Smith cnt = 0; 7750def2e27SBarry Smith row = 0; 7760def2e27SBarry Smith for (i = 0; i < node_count; i++) { 7770def2e27SBarry Smith cols = aj + ai[row] + a->inode.size[i]; 7780def2e27SBarry Smith counts[2 * cnt] = cols[0]; 7790def2e27SBarry Smith nz = ai[row + 1] - ai[row] - a->inode.size[i]; 7800def2e27SBarry Smith cnt2 = 1; 7810def2e27SBarry Smith for (j = 1; j < nz; j++) { 7820def2e27SBarry Smith if (cols[j] != cols[j - 1] + 1) { 7830def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 7840def2e27SBarry Smith counts[2 * cnt] = cols[j]; 7850def2e27SBarry Smith cnt2 = 1; 7860def2e27SBarry Smith } else cnt2++; 7870def2e27SBarry Smith } 7880def2e27SBarry Smith counts[2 * (cnt++) + 1] = cnt2; 7890def2e27SBarry Smith row += a->inode.size[i]; 7900def2e27SBarry Smith } 7919566063dSJacob Faibussowitsch PetscCall(PetscIntView(2 * cnt, counts, NULL)); 7920def2e27SBarry Smith } 7933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 79438702af4SBarry Smith } 79538702af4SBarry Smith 796d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A, MatAssemblyType mode) 797d71ae5a4SJacob Faibussowitsch { 79849b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 7998f8f2f0dSBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 800d0f46423SBarry Smith PetscInt m = A->rmap->N, *ip, N, *ailen = a->ilen; 80113f74950SBarry Smith PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 80249b5e25fSSatish Balay MatScalar *aa = a->a, *ap; 80349b5e25fSSatish Balay 80449b5e25fSSatish Balay PetscFunctionBegin; 8053ba16761SJacob Faibussowitsch if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS); 80649b5e25fSSatish Balay 80749b5e25fSSatish Balay if (m) rmax = ailen[0]; 80849b5e25fSSatish Balay for (i = 1; i < mbs; i++) { 80949b5e25fSSatish Balay /* move each row back by the amount of empty slots (fshift) before it*/ 81049b5e25fSSatish Balay fshift += imax[i - 1] - ailen[i - 1]; 81149b5e25fSSatish Balay rmax = PetscMax(rmax, ailen[i]); 81249b5e25fSSatish Balay if (fshift) { 813580bdb30SBarry Smith ip = aj + ai[i]; 814580bdb30SBarry Smith ap = aa + bs2 * ai[i]; 81549b5e25fSSatish Balay N = ailen[i]; 8169566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 8179566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2 * N)); 81849b5e25fSSatish Balay } 81949b5e25fSSatish Balay ai[i] = ai[i - 1] + ailen[i - 1]; 82049b5e25fSSatish Balay } 82149b5e25fSSatish Balay if (mbs) { 82249b5e25fSSatish Balay fshift += imax[mbs - 1] - ailen[mbs - 1]; 82349b5e25fSSatish Balay ai[mbs] = ai[mbs - 1] + ailen[mbs - 1]; 82449b5e25fSSatish Balay } 82549b5e25fSSatish Balay /* reset ilen and imax for each row */ 826ad540459SPierre Jolivet for (i = 0; i < mbs; i++) ailen[i] = imax[i] = ai[i + 1] - ai[i]; 8276c6c5352SBarry Smith a->nz = ai[mbs]; 82849b5e25fSSatish Balay 829b424e231SHong Zhang /* diagonals may have moved, reset it */ 8301baa6e33SBarry Smith if (a->diag) PetscCall(PetscArraycpy(a->diag, ai, mbs)); 831aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT " block size %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, A->rmap->bs, fshift * bs2); 83226fbe8dcSKarl Rupp 8339566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT ", block size %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->rmap->N, A->rmap->bs, fshift * bs2, a->nz * bs2)); 8349566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues is %" PetscInt_FMT "\n", a->reallocs)); 8359566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Most nonzeros blocks in any row is %" PetscInt_FMT "\n", rmax)); 83626fbe8dcSKarl Rupp 8378e58a170SBarry Smith A->info.mallocs += a->reallocs; 83849b5e25fSSatish Balay a->reallocs = 0; 83949b5e25fSSatish Balay A->info.nz_unneeded = (PetscReal)fshift * bs2; 840061b2667SBarry Smith a->idiagvalid = PETSC_FALSE; 8414dcd73b1SHong Zhang a->rmax = rmax; 84238702af4SBarry Smith 84338702af4SBarry Smith if (A->cmap->n < 65536 && A->cmap->bs == 1) { 84444e1c64aSLisandro Dalcin if (a->jshort && a->free_jshort) { 84517803ae8SHong Zhang /* when matrix data structure is changed, previous jshort must be replaced */ 8469566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jshort)); 84717803ae8SHong Zhang } 8489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->i[A->rmap->n], &a->jshort)); 84938702af4SBarry Smith for (i = 0; i < a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i]; 85038702af4SBarry Smith A->ops->mult = MatMult_SeqSBAIJ_1_ushort; 85141f059aeSBarry Smith A->ops->sor = MatSOR_SeqSBAIJ_ushort; 8524da8f245SBarry Smith a->free_jshort = PETSC_TRUE; 85338702af4SBarry Smith } 8543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 85549b5e25fSSatish Balay } 85649b5e25fSSatish Balay 85749b5e25fSSatish Balay /* 85849b5e25fSSatish Balay This function returns an array of flags which indicate the locations of contiguous 85949b5e25fSSatish Balay blocks that should be zeroed. for eg: if bs = 3 and is = [0,1,2,3,5,6,7,8,9] 860a5b23f4aSJose E. Roman then the resulting sizes = [3,1,1,3,1] corresponding to sets [(0,1,2),(3),(5),(6,7,8),(9)] 86149b5e25fSSatish Balay Assume: sizes should be long enough to hold all the values. 86249b5e25fSSatish Balay */ 863d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqSBAIJ_Check_Blocks(PetscInt idx[], PetscInt n, PetscInt bs, PetscInt sizes[], PetscInt *bs_max) 864d71ae5a4SJacob Faibussowitsch { 86513f74950SBarry Smith PetscInt i, j, k, row; 866ace3abfcSBarry Smith PetscBool flg; 86749b5e25fSSatish Balay 86849b5e25fSSatish Balay PetscFunctionBegin; 86949b5e25fSSatish Balay for (i = 0, j = 0; i < n; j++) { 87049b5e25fSSatish Balay row = idx[i]; 871a5b23f4aSJose E. Roman if (row % bs != 0) { /* Not the beginning of a block */ 87249b5e25fSSatish Balay sizes[j] = 1; 87349b5e25fSSatish Balay i++; 87449b5e25fSSatish Balay } else if (i + bs > n) { /* Beginning of a block, but complete block doesn't exist (at idx end) */ 87549b5e25fSSatish Balay sizes[j] = 1; /* Also makes sure at least 'bs' values exist for next else */ 87649b5e25fSSatish Balay i++; 8776aad120cSJose E. Roman } else { /* Beginning of the block, so check if the complete block exists */ 87849b5e25fSSatish Balay flg = PETSC_TRUE; 87949b5e25fSSatish Balay for (k = 1; k < bs; k++) { 88049b5e25fSSatish Balay if (row + k != idx[i + k]) { /* break in the block */ 88149b5e25fSSatish Balay flg = PETSC_FALSE; 88249b5e25fSSatish Balay break; 88349b5e25fSSatish Balay } 88449b5e25fSSatish Balay } 885abc0a331SBarry Smith if (flg) { /* No break in the bs */ 88649b5e25fSSatish Balay sizes[j] = bs; 88749b5e25fSSatish Balay i += bs; 88849b5e25fSSatish Balay } else { 88949b5e25fSSatish Balay sizes[j] = 1; 89049b5e25fSSatish Balay i++; 89149b5e25fSSatish Balay } 89249b5e25fSSatish Balay } 89349b5e25fSSatish Balay } 89449b5e25fSSatish Balay *bs_max = j; 8953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 89649b5e25fSSatish Balay } 89749b5e25fSSatish Balay 89849b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks). 899da81f932SPierre Jolivet Any a(i,j) with i>j input by user is ignored. 90049b5e25fSSatish Balay */ 90149b5e25fSSatish Balay 902d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 903d71ae5a4SJacob Faibussowitsch { 90449b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 905e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N, lastcol = -1; 90613f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen, roworiented = a->roworiented; 907d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs = A->rmap->bs, brow, bcol; 90813f74950SBarry Smith PetscInt ridx, cidx, bs2 = a->bs2; 90949b5e25fSSatish Balay MatScalar *ap, value, *aa = a->a, *bap; 91049b5e25fSSatish Balay 91149b5e25fSSatish Balay PetscFunctionBegin; 91249b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over added rows */ 91349b5e25fSSatish Balay row = im[k]; /* row number */ 91449b5e25fSSatish Balay brow = row / bs; /* block row number */ 91549b5e25fSSatish Balay if (row < 0) continue; 9166bdcaf15SBarry Smith PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 91749b5e25fSSatish Balay rp = aj + ai[brow]; /*ptr to beginning of column value of the row block*/ 91849b5e25fSSatish Balay ap = aa + bs2 * ai[brow]; /*ptr to beginning of element value of the row block*/ 91949b5e25fSSatish Balay rmax = imax[brow]; /* maximum space allocated for this row */ 92049b5e25fSSatish Balay nrow = ailen[brow]; /* actual length of this row */ 92149b5e25fSSatish Balay low = 0; 9228509e838SStefano Zampini high = nrow; 92349b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over added columns */ 92449b5e25fSSatish Balay if (in[l] < 0) continue; 9256bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->N - 1); 92649b5e25fSSatish Balay col = in[l]; 92749b5e25fSSatish Balay bcol = col / bs; /* block col number */ 92849b5e25fSSatish Balay 929941593c8SHong Zhang if (brow > bcol) { 93026fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular values */ 93126fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 932941593c8SHong Zhang } 933f4989cb3SHong Zhang 9349371c9d4SSatish Balay ridx = row % bs; 9359371c9d4SSatish Balay cidx = col % bs; /*row and col index inside the block */ 9368549e402SHong Zhang if ((brow == bcol && ridx <= cidx) || (brow < bcol)) { 93749b5e25fSSatish Balay /* element value a(k,l) */ 93826fbe8dcSKarl Rupp if (roworiented) value = v[l + k * n]; 93926fbe8dcSKarl Rupp else value = v[k + l * m]; 94049b5e25fSSatish Balay 94149b5e25fSSatish Balay /* move pointer bap to a(k,l) quickly and add/insert value */ 94226fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 9438509e838SStefano Zampini else high = nrow; 9448509e838SStefano Zampini 945e2ee6c50SBarry Smith lastcol = col; 94649b5e25fSSatish Balay while (high - low > 7) { 94749b5e25fSSatish Balay t = (low + high) / 2; 94849b5e25fSSatish Balay if (rp[t] > bcol) high = t; 94949b5e25fSSatish Balay else low = t; 95049b5e25fSSatish Balay } 95149b5e25fSSatish Balay for (i = low; i < high; i++) { 95249b5e25fSSatish Balay if (rp[i] > bcol) break; 95349b5e25fSSatish Balay if (rp[i] == bcol) { 95449b5e25fSSatish Balay bap = ap + bs2 * i + bs * cidx + ridx; 95549b5e25fSSatish Balay if (is == ADD_VALUES) *bap += value; 95649b5e25fSSatish Balay else *bap = value; 9578549e402SHong Zhang /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 9588549e402SHong Zhang if (brow == bcol && ridx < cidx) { 9598549e402SHong Zhang bap = ap + bs2 * i + bs * ridx + cidx; 9608549e402SHong Zhang if (is == ADD_VALUES) *bap += value; 9618549e402SHong Zhang else *bap = value; 9628549e402SHong Zhang } 96349b5e25fSSatish Balay goto noinsert1; 96449b5e25fSSatish Balay } 96549b5e25fSSatish Balay } 96649b5e25fSSatish Balay 96749b5e25fSSatish Balay if (nonew == 1) goto noinsert1; 96808401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 969fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, brow, bcol, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 97049b5e25fSSatish Balay 9719371c9d4SSatish Balay N = nrow++ - 1; 9729371c9d4SSatish Balay high++; 97349b5e25fSSatish Balay /* shift up all the later entries in this row */ 9749566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 9759566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 9769566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 97749b5e25fSSatish Balay rp[i] = bcol; 97849b5e25fSSatish Balay ap[bs2 * i + bs * cidx + ridx] = value; 9798509e838SStefano Zampini /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 980ad540459SPierre Jolivet if (brow == bcol && ridx < cidx) ap[bs2 * i + bs * ridx + cidx] = value; 981e56f5c9eSBarry Smith A->nonzerostate++; 98249b5e25fSSatish Balay noinsert1:; 98349b5e25fSSatish Balay low = i; 9848549e402SHong Zhang } 98549b5e25fSSatish Balay } /* end of loop over added columns */ 98649b5e25fSSatish Balay ailen[brow] = nrow; 98749b5e25fSSatish Balay } /* end of loop over added rows */ 9883ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 98949b5e25fSSatish Balay } 99049b5e25fSSatish Balay 991d71ae5a4SJacob Faibussowitsch PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA, IS row, const MatFactorInfo *info) 992d71ae5a4SJacob Faibussowitsch { 9934ccecd49SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)inA->data; 99449b5e25fSSatish Balay Mat outA; 995ace3abfcSBarry Smith PetscBool row_identity; 99649b5e25fSSatish Balay 99749b5e25fSSatish Balay PetscFunctionBegin; 99808401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 is supported for in-place icc"); 9999566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 100028b400f6SJacob Faibussowitsch PetscCheck(row_identity, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix reordering is not supported"); 100108401ef6SPierre Jolivet PetscCheck(inA->rmap->bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix block size %" PetscInt_FMT " is not supported", inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! */ 1002c84f5b01SHong Zhang 100349b5e25fSSatish Balay outA = inA; 1004d5f3da31SBarry Smith inA->factortype = MAT_FACTOR_ICC; 10059566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 10069566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 100749b5e25fSSatish Balay 10089566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(inA)); 10099566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetNumericFactorization_inplace(inA, row_identity)); 101049b5e25fSSatish Balay 10119566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10129566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1013c84f5b01SHong Zhang a->row = row; 10149566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 10159566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1016c84f5b01SHong Zhang a->col = row; 1017c84f5b01SHong Zhang 1018c84f5b01SHong Zhang /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */ 10199566063dSJacob Faibussowitsch if (a->icol) PetscCall(ISInvertPermutation(row, PETSC_DECIDE, &a->icol)); 102049b5e25fSSatish Balay 10214dfa11a4SJacob Faibussowitsch if (!a->solve_work) { PetscCall(PetscMalloc1(inA->rmap->N + inA->rmap->bs, &a->solve_work)); } 102249b5e25fSSatish Balay 10239566063dSJacob Faibussowitsch PetscCall(MatCholeskyFactorNumeric(outA, inA, info)); 10243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 102549b5e25fSSatish Balay } 1026950f1e5bSHong Zhang 1027d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat, PetscInt *indices) 1028d71ae5a4SJacob Faibussowitsch { 1029045c9aa0SHong Zhang Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)mat->data; 103013f74950SBarry Smith PetscInt i, nz, n; 103149b5e25fSSatish Balay 103249b5e25fSSatish Balay PetscFunctionBegin; 10336c6c5352SBarry Smith nz = baij->maxnz; 1034d0f46423SBarry Smith n = mat->cmap->n; 103526fbe8dcSKarl Rupp for (i = 0; i < nz; i++) baij->j[i] = indices[i]; 103626fbe8dcSKarl Rupp 10376c6c5352SBarry Smith baij->nz = nz; 103826fbe8dcSKarl Rupp for (i = 0; i < n; i++) baij->ilen[i] = baij->imax[i]; 103926fbe8dcSKarl Rupp 10409566063dSJacob Faibussowitsch PetscCall(MatSetOption(mat, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 10413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 104249b5e25fSSatish Balay } 104349b5e25fSSatish Balay 104449b5e25fSSatish Balay /*@ 104519585528SSatish Balay MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows 104611a5261eSBarry Smith in a `MATSEQSBAIJ` matrix. 104749b5e25fSSatish Balay 104849b5e25fSSatish Balay Input Parameters: 104911a5261eSBarry Smith + mat - the `MATSEQSBAIJ` matrix 105049b5e25fSSatish Balay - indices - the column indices 105149b5e25fSSatish Balay 105249b5e25fSSatish Balay Level: advanced 105349b5e25fSSatish Balay 105449b5e25fSSatish Balay Notes: 105549b5e25fSSatish Balay This can be called if you have precomputed the nonzero structure of the 105649b5e25fSSatish Balay matrix and want to provide it to the matrix object to improve the performance 105711a5261eSBarry Smith of the `MatSetValues()` operation. 105849b5e25fSSatish Balay 105949b5e25fSSatish Balay You MUST have set the correct numbers of nonzeros per row in the call to 106011a5261eSBarry Smith `MatCreateSeqSBAIJ()`, and the columns indices MUST be sorted. 106149b5e25fSSatish Balay 1062ab9f2c04SSatish Balay MUST be called before any calls to MatSetValues() 106349b5e25fSSatish Balay 106411a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreateSeqSBAIJ` 106549b5e25fSSatish Balay @*/ 1066d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat, PetscInt *indices) 1067d71ae5a4SJacob Faibussowitsch { 106849b5e25fSSatish Balay PetscFunctionBegin; 10690700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 1070dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 1071cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqSBAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 10723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 107349b5e25fSSatish Balay } 107449b5e25fSSatish Balay 1075d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqSBAIJ(Mat A, Mat B, MatStructure str) 1076d71ae5a4SJacob Faibussowitsch { 10774c7a3774SStefano Zampini PetscBool isbaij; 10783c896bc6SHong Zhang 10793c896bc6SHong Zhang PetscFunctionBegin; 10809566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &isbaij, MATSEQSBAIJ, MATMPISBAIJ, "")); 108128b400f6SJacob Faibussowitsch PetscCheck(isbaij, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Not for matrix type %s", ((PetscObject)B)->type_name); 10824c7a3774SStefano Zampini /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. */ 10834c7a3774SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 10843c896bc6SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 10853c896bc6SHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 10863c896bc6SHong Zhang 108708401ef6SPierre Jolivet PetscCheck(a->i[a->mbs] == b->i[b->mbs], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different"); 108808401ef6SPierre Jolivet PetscCheck(a->mbs == b->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of rows in two matrices are different"); 108908401ef6SPierre Jolivet PetscCheck(a->bs2 == b->bs2, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different block size"); 10909566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, a->a, a->bs2 * a->i[a->mbs])); 10919566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 10923c896bc6SHong Zhang } else { 10939566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(A)); 10949566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 10959566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(A)); 10963c896bc6SHong Zhang } 10973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10983c896bc6SHong Zhang } 10993c896bc6SHong Zhang 1100d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUp_SeqSBAIJ(Mat A) 1101d71ae5a4SJacob Faibussowitsch { 1102273d9f13SBarry Smith PetscFunctionBegin; 11039566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(A, A->rmap->bs, PETSC_DEFAULT, NULL)); 11043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1105273d9f13SBarry Smith } 1106273d9f13SBarry Smith 1107d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1108d71ae5a4SJacob Faibussowitsch { 1109a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11105fd66863SKarl Rupp 1111a6ece127SHong Zhang PetscFunctionBegin; 1112a6ece127SHong Zhang *array = a->a; 11133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1114a6ece127SHong Zhang } 1115a6ece127SHong Zhang 1116d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1117d71ae5a4SJacob Faibussowitsch { 1118a6ece127SHong Zhang PetscFunctionBegin; 1119cda14afcSprj- *array = NULL; 11203ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1121a6ece127SHong Zhang } 1122a6ece127SHong Zhang 1123d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y, Mat X, PetscInt *nnz) 1124d71ae5a4SJacob Faibussowitsch { 1125b264fe52SHong Zhang PetscInt bs = Y->rmap->bs, mbs = Y->rmap->N / bs; 112652768537SHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data; 112752768537SHong Zhang Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ *)Y->data; 112852768537SHong Zhang 112952768537SHong Zhang PetscFunctionBegin; 113052768537SHong Zhang /* Set the number of nonzeros in the new matrix */ 11319566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(mbs, x->i, x->j, y->i, y->j, nnz)); 11323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 113352768537SHong Zhang } 113452768537SHong Zhang 1135d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 1136d71ae5a4SJacob Faibussowitsch { 113742ee4b1aSHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data, *y = (Mat_SeqSBAIJ *)Y->data; 113831ce2d13SHong Zhang PetscInt bs = Y->rmap->bs, bs2 = bs * bs; 1139e838b9e7SJed Brown PetscBLASInt one = 1; 114042ee4b1aSHong Zhang 114142ee4b1aSHong Zhang PetscFunctionBegin; 1142134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 1143134adf20SPierre Jolivet PetscBool e = x->nz == y->nz && x->mbs == y->mbs ? PETSC_TRUE : PETSC_FALSE; 1144134adf20SPierre Jolivet if (e) { 11459566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, x->mbs + 1, &e)); 1146134adf20SPierre Jolivet if (e) { 11479566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, x->i[x->mbs], &e)); 1148134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 1149134adf20SPierre Jolivet } 1150134adf20SPierre Jolivet } 115154c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 1152134adf20SPierre Jolivet } 115342ee4b1aSHong Zhang if (str == SAME_NONZERO_PATTERN) { 1154f4df32b1SMatthew Knepley PetscScalar alpha = a; 1155c5df96a5SBarry Smith PetscBLASInt bnz; 11569566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz * bs2, &bnz)); 1157792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, x->a, &one, y->a, &one)); 11589566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 1159ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 11609566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_TRUE)); 11619566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 11629566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_FALSE)); 116342ee4b1aSHong Zhang } else { 116452768537SHong Zhang Mat B; 116552768537SHong Zhang PetscInt *nnz; 116654c59aa7SJacob Faibussowitsch PetscCheck(bs == X->rmap->bs, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Matrices must have same block size"); 11679566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(X)); 11689566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(Y)); 11699566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 11709566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 11719566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 11729566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, Y->rmap->n, Y->cmap->n, Y->rmap->N, Y->cmap->N)); 11739566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, Y, Y)); 11749566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 11759566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqSBAIJ(Y, X, nnz)); 11769566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 117752768537SHong Zhang 11789566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 117952768537SHong Zhang 11809566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 11819566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 11829566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(X)); 11839566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(Y)); 118442ee4b1aSHong Zhang } 11853ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 118642ee4b1aSHong Zhang } 118742ee4b1aSHong Zhang 1188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1189d71ae5a4SJacob Faibussowitsch { 1190efcf0fc3SBarry Smith PetscFunctionBegin; 1191efcf0fc3SBarry Smith *flg = PETSC_TRUE; 11923ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1193efcf0fc3SBarry Smith } 1194efcf0fc3SBarry Smith 1195d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A, PetscBool *flg) 1196d71ae5a4SJacob Faibussowitsch { 1197efcf0fc3SBarry Smith PetscFunctionBegin; 1198efcf0fc3SBarry Smith *flg = PETSC_TRUE; 11993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1200efcf0fc3SBarry Smith } 1201efcf0fc3SBarry Smith 1202d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1203d71ae5a4SJacob Faibussowitsch { 1204efcf0fc3SBarry Smith PetscFunctionBegin; 1205efcf0fc3SBarry Smith *flg = PETSC_FALSE; 12063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1207efcf0fc3SBarry Smith } 1208efcf0fc3SBarry Smith 1209d71ae5a4SJacob Faibussowitsch PetscErrorCode MatConjugate_SeqSBAIJ(Mat A) 1210d71ae5a4SJacob Faibussowitsch { 12112726fb6dSPierre Jolivet #if defined(PETSC_USE_COMPLEX) 12122726fb6dSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 12132726fb6dSPierre Jolivet PetscInt i, nz = a->bs2 * a->i[a->mbs]; 12142726fb6dSPierre Jolivet MatScalar *aa = a->a; 12152726fb6dSPierre Jolivet 12162726fb6dSPierre Jolivet PetscFunctionBegin; 12172726fb6dSPierre Jolivet for (i = 0; i < nz; i++) aa[i] = PetscConj(aa[i]); 12182726fb6dSPierre Jolivet #else 12192726fb6dSPierre Jolivet PetscFunctionBegin; 12202726fb6dSPierre Jolivet #endif 12213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12222726fb6dSPierre Jolivet } 12232726fb6dSPierre Jolivet 1224d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqSBAIJ(Mat A) 1225d71ae5a4SJacob Faibussowitsch { 122699cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 122799cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1228dd6ea824SBarry Smith MatScalar *aa = a->a; 122999cafbc1SBarry Smith 123099cafbc1SBarry Smith PetscFunctionBegin; 123199cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 12323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 123399cafbc1SBarry Smith } 123499cafbc1SBarry Smith 1235d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A) 1236d71ae5a4SJacob Faibussowitsch { 123799cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 123899cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1239dd6ea824SBarry Smith MatScalar *aa = a->a; 124099cafbc1SBarry Smith 124199cafbc1SBarry Smith PetscFunctionBegin; 124299cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 12433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 124499cafbc1SBarry Smith } 124599cafbc1SBarry Smith 1246d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A, PetscInt is_n, const PetscInt is_idx[], PetscScalar diag, Vec x, Vec b) 1247d71ae5a4SJacob Faibussowitsch { 12483bededecSBarry Smith Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)A->data; 12493bededecSBarry Smith PetscInt i, j, k, count; 12503bededecSBarry Smith PetscInt bs = A->rmap->bs, bs2 = baij->bs2, row, col; 12513bededecSBarry Smith PetscScalar zero = 0.0; 12523bededecSBarry Smith MatScalar *aa; 12533bededecSBarry Smith const PetscScalar *xx; 12543bededecSBarry Smith PetscScalar *bb; 125556777dd2SBarry Smith PetscBool *zeroed, vecs = PETSC_FALSE; 12563bededecSBarry Smith 12573bededecSBarry Smith PetscFunctionBegin; 12583bededecSBarry Smith /* fix right hand side if needed */ 12593bededecSBarry Smith if (x && b) { 12609566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 12619566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 126256777dd2SBarry Smith vecs = PETSC_TRUE; 12633bededecSBarry Smith } 12643bededecSBarry Smith 12653bededecSBarry Smith /* zero the columns */ 12669566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 12673bededecSBarry Smith for (i = 0; i < is_n; i++) { 1268aed4548fSBarry Smith PetscCheck(is_idx[i] >= 0 && is_idx[i] < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", is_idx[i]); 12693bededecSBarry Smith zeroed[is_idx[i]] = PETSC_TRUE; 12703bededecSBarry Smith } 127156777dd2SBarry Smith if (vecs) { 127256777dd2SBarry Smith for (i = 0; i < A->rmap->N; i++) { 127356777dd2SBarry Smith row = i / bs; 127456777dd2SBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 127556777dd2SBarry Smith for (k = 0; k < bs; k++) { 127656777dd2SBarry Smith col = bs * baij->j[j] + k; 127756777dd2SBarry Smith if (col <= i) continue; 127856777dd2SBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 127926fbe8dcSKarl Rupp if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0] * xx[col]; 128026fbe8dcSKarl Rupp if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0] * xx[i]; 128156777dd2SBarry Smith } 128256777dd2SBarry Smith } 128356777dd2SBarry Smith } 128426fbe8dcSKarl Rupp for (i = 0; i < is_n; i++) bb[is_idx[i]] = diag * xx[is_idx[i]]; 128556777dd2SBarry Smith } 128656777dd2SBarry Smith 12873bededecSBarry Smith for (i = 0; i < A->rmap->N; i++) { 12883bededecSBarry Smith if (!zeroed[i]) { 12893bededecSBarry Smith row = i / bs; 12903bededecSBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 12913bededecSBarry Smith for (k = 0; k < bs; k++) { 12923bededecSBarry Smith col = bs * baij->j[j] + k; 12933bededecSBarry Smith if (zeroed[col]) { 12943bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 12953bededecSBarry Smith aa[0] = 0.0; 12963bededecSBarry Smith } 12973bededecSBarry Smith } 12983bededecSBarry Smith } 12993bededecSBarry Smith } 13003bededecSBarry Smith } 13019566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 130256777dd2SBarry Smith if (vecs) { 13039566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 13049566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 130556777dd2SBarry Smith } 13063bededecSBarry Smith 13073bededecSBarry Smith /* zero the rows */ 13083bededecSBarry Smith for (i = 0; i < is_n; i++) { 13093bededecSBarry Smith row = is_idx[i]; 13103bededecSBarry Smith count = (baij->i[row / bs + 1] - baij->i[row / bs]) * bs; 13113bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + baij->i[row / bs] * bs2 + (row % bs); 13123bededecSBarry Smith for (k = 0; k < count; k++) { 13133bededecSBarry Smith aa[0] = zero; 13143bededecSBarry Smith aa += bs; 13153bededecSBarry Smith } 1316dbbe0bcdSBarry Smith if (diag != 0.0) PetscUseTypeMethod(A, setvalues, 1, &row, 1, &row, &diag, INSERT_VALUES); 13173bededecSBarry Smith } 13189566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqSBAIJ(A, MAT_FINAL_ASSEMBLY)); 13193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13203bededecSBarry Smith } 13213bededecSBarry Smith 1322d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqSBAIJ(Mat Y, PetscScalar a) 1323d71ae5a4SJacob Faibussowitsch { 13247d68702bSBarry Smith Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)Y->data; 13257d68702bSBarry Smith 13267d68702bSBarry Smith PetscFunctionBegin; 132748a46eb9SPierre Jolivet if (!Y->preallocated || !aij->nz) PetscCall(MatSeqSBAIJSetPreallocation(Y, Y->rmap->bs, 1, NULL)); 13289566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(Y, a)); 13293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 13307d68702bSBarry Smith } 13317d68702bSBarry Smith 133249b5e25fSSatish Balay /* -------------------------------------------------------------------*/ 13333964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ, 133449b5e25fSSatish Balay MatGetRow_SeqSBAIJ, 133549b5e25fSSatish Balay MatRestoreRow_SeqSBAIJ, 133649b5e25fSSatish Balay MatMult_SeqSBAIJ_N, 133797304618SKris Buschelman /* 4*/ MatMultAdd_SeqSBAIJ_N, 1338431c96f7SBarry Smith MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */ 1339e005ede5SBarry Smith MatMultAdd_SeqSBAIJ_N, 1340f4259b30SLisandro Dalcin NULL, 1341f4259b30SLisandro Dalcin NULL, 1342f4259b30SLisandro Dalcin NULL, 1343f4259b30SLisandro Dalcin /* 10*/ NULL, 1344f4259b30SLisandro Dalcin NULL, 1345c078aec8SLisandro Dalcin MatCholeskyFactor_SeqSBAIJ, 134641f059aeSBarry Smith MatSOR_SeqSBAIJ, 134749b5e25fSSatish Balay MatTranspose_SeqSBAIJ, 134897304618SKris Buschelman /* 15*/ MatGetInfo_SeqSBAIJ, 134949b5e25fSSatish Balay MatEqual_SeqSBAIJ, 135049b5e25fSSatish Balay MatGetDiagonal_SeqSBAIJ, 135149b5e25fSSatish Balay MatDiagonalScale_SeqSBAIJ, 135249b5e25fSSatish Balay MatNorm_SeqSBAIJ, 1353f4259b30SLisandro Dalcin /* 20*/ NULL, 135449b5e25fSSatish Balay MatAssemblyEnd_SeqSBAIJ, 135549b5e25fSSatish Balay MatSetOption_SeqSBAIJ, 135649b5e25fSSatish Balay MatZeroEntries_SeqSBAIJ, 1357f4259b30SLisandro Dalcin /* 24*/ NULL, 1358f4259b30SLisandro Dalcin NULL, 1359f4259b30SLisandro Dalcin NULL, 1360f4259b30SLisandro Dalcin NULL, 1361f4259b30SLisandro Dalcin NULL, 13624994cf47SJed Brown /* 29*/ MatSetUp_SeqSBAIJ, 1363f4259b30SLisandro Dalcin NULL, 1364f4259b30SLisandro Dalcin NULL, 1365f4259b30SLisandro Dalcin NULL, 1366f4259b30SLisandro Dalcin NULL, 1367d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqSBAIJ, 1368f4259b30SLisandro Dalcin NULL, 1369f4259b30SLisandro Dalcin NULL, 1370f4259b30SLisandro Dalcin NULL, 1371c84f5b01SHong Zhang MatICCFactor_SeqSBAIJ, 1372d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqSBAIJ, 13737dae84e0SHong Zhang MatCreateSubMatrices_SeqSBAIJ, 137449b5e25fSSatish Balay MatIncreaseOverlap_SeqSBAIJ, 137549b5e25fSSatish Balay MatGetValues_SeqSBAIJ, 13763c896bc6SHong Zhang MatCopy_SeqSBAIJ, 1377f4259b30SLisandro Dalcin /* 44*/ NULL, 137849b5e25fSSatish Balay MatScale_SeqSBAIJ, 13797d68702bSBarry Smith MatShift_SeqSBAIJ, 1380f4259b30SLisandro Dalcin NULL, 13813bededecSBarry Smith MatZeroRowsColumns_SeqSBAIJ, 1382f4259b30SLisandro Dalcin /* 49*/ NULL, 138349b5e25fSSatish Balay MatGetRowIJ_SeqSBAIJ, 138449b5e25fSSatish Balay MatRestoreRowIJ_SeqSBAIJ, 1385f4259b30SLisandro Dalcin NULL, 1386f4259b30SLisandro Dalcin NULL, 1387f4259b30SLisandro Dalcin /* 54*/ NULL, 1388f4259b30SLisandro Dalcin NULL, 1389f4259b30SLisandro Dalcin NULL, 1390dc29a518SPierre Jolivet MatPermute_SeqSBAIJ, 139149b5e25fSSatish Balay MatSetValuesBlocked_SeqSBAIJ, 13927dae84e0SHong Zhang /* 59*/ MatCreateSubMatrix_SeqSBAIJ, 1393f4259b30SLisandro Dalcin NULL, 1394f4259b30SLisandro Dalcin NULL, 1395f4259b30SLisandro Dalcin NULL, 1396f4259b30SLisandro Dalcin NULL, 1397f4259b30SLisandro Dalcin /* 64*/ NULL, 1398f4259b30SLisandro Dalcin NULL, 1399f4259b30SLisandro Dalcin NULL, 1400f4259b30SLisandro Dalcin NULL, 1401f4259b30SLisandro Dalcin NULL, 1402d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqSBAIJ, 1403f4259b30SLisandro Dalcin NULL, 140428d58a37SPierre Jolivet MatConvert_MPISBAIJ_Basic, 1405f4259b30SLisandro Dalcin NULL, 1406f4259b30SLisandro Dalcin NULL, 1407f4259b30SLisandro Dalcin /* 74*/ NULL, 1408f4259b30SLisandro Dalcin NULL, 1409f4259b30SLisandro Dalcin NULL, 1410f4259b30SLisandro Dalcin NULL, 1411f4259b30SLisandro Dalcin NULL, 1412f4259b30SLisandro Dalcin /* 79*/ NULL, 1413f4259b30SLisandro Dalcin NULL, 1414f4259b30SLisandro Dalcin NULL, 141597304618SKris Buschelman MatGetInertia_SeqSBAIJ, 14165bba2384SShri Abhyankar MatLoad_SeqSBAIJ, 1417d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqSBAIJ, 1418865e5f61SKris Buschelman MatIsHermitian_SeqSBAIJ, 1419efcf0fc3SBarry Smith MatIsStructurallySymmetric_SeqSBAIJ, 1420f4259b30SLisandro Dalcin NULL, 1421f4259b30SLisandro Dalcin NULL, 1422f4259b30SLisandro Dalcin /* 89*/ NULL, 1423f4259b30SLisandro Dalcin NULL, 1424f4259b30SLisandro Dalcin NULL, 1425f4259b30SLisandro Dalcin NULL, 1426f4259b30SLisandro Dalcin NULL, 1427f4259b30SLisandro Dalcin /* 94*/ NULL, 1428f4259b30SLisandro Dalcin NULL, 1429f4259b30SLisandro Dalcin NULL, 1430f4259b30SLisandro Dalcin NULL, 1431f4259b30SLisandro Dalcin NULL, 1432f4259b30SLisandro Dalcin /* 99*/ NULL, 1433f4259b30SLisandro Dalcin NULL, 1434f4259b30SLisandro Dalcin NULL, 14352726fb6dSPierre Jolivet MatConjugate_SeqSBAIJ, 1436f4259b30SLisandro Dalcin NULL, 1437f4259b30SLisandro Dalcin /*104*/ NULL, 143899cafbc1SBarry Smith MatRealPart_SeqSBAIJ, 1439f5edf698SHong Zhang MatImaginaryPart_SeqSBAIJ, 1440f5edf698SHong Zhang MatGetRowUpperTriangular_SeqSBAIJ, 14412af78befSBarry Smith MatRestoreRowUpperTriangular_SeqSBAIJ, 1442f4259b30SLisandro Dalcin /*109*/ NULL, 1443f4259b30SLisandro Dalcin NULL, 1444f4259b30SLisandro Dalcin NULL, 1445f4259b30SLisandro Dalcin NULL, 1446547795f9SHong Zhang MatMissingDiagonal_SeqSBAIJ, 1447f4259b30SLisandro Dalcin /*114*/ NULL, 1448f4259b30SLisandro Dalcin NULL, 1449f4259b30SLisandro Dalcin NULL, 1450f4259b30SLisandro Dalcin NULL, 1451f4259b30SLisandro Dalcin NULL, 1452f4259b30SLisandro Dalcin /*119*/ NULL, 1453f4259b30SLisandro Dalcin NULL, 1454f4259b30SLisandro Dalcin NULL, 1455f4259b30SLisandro Dalcin NULL, 1456f4259b30SLisandro Dalcin NULL, 1457f4259b30SLisandro Dalcin /*124*/ NULL, 1458f4259b30SLisandro Dalcin NULL, 1459f4259b30SLisandro Dalcin NULL, 1460f4259b30SLisandro Dalcin NULL, 1461f4259b30SLisandro Dalcin NULL, 1462f4259b30SLisandro Dalcin /*129*/ NULL, 1463f4259b30SLisandro Dalcin NULL, 1464f4259b30SLisandro Dalcin NULL, 1465f4259b30SLisandro Dalcin NULL, 1466f4259b30SLisandro Dalcin NULL, 1467f4259b30SLisandro Dalcin /*134*/ NULL, 1468f4259b30SLisandro Dalcin NULL, 1469f4259b30SLisandro Dalcin NULL, 1470f4259b30SLisandro Dalcin NULL, 1471f4259b30SLisandro Dalcin NULL, 147246533700Sstefano_zampini /*139*/ MatSetBlockSizes_Default, 1473f4259b30SLisandro Dalcin NULL, 1474f4259b30SLisandro Dalcin NULL, 1475f4259b30SLisandro Dalcin NULL, 1476f4259b30SLisandro Dalcin NULL, 1477d70f29a3SPierre Jolivet /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ, 1478d70f29a3SPierre Jolivet NULL, 1479d70f29a3SPierre Jolivet NULL, 148099a7f59eSMark Adams NULL, 148199a7f59eSMark Adams NULL, 14827fb60732SBarry Smith NULL, 1483dec0b466SHong Zhang /*150*/ NULL, 1484dec0b466SHong Zhang NULL}; 1485be1d678aSKris Buschelman 1486d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat) 1487d71ae5a4SJacob Faibussowitsch { 14884afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1489d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 149049b5e25fSSatish Balay 149149b5e25fSSatish Balay PetscFunctionBegin; 149208401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 149349b5e25fSSatish Balay 149449b5e25fSSatish Balay /* allocate space for values if not already there */ 149548a46eb9SPierre Jolivet if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); 149649b5e25fSSatish Balay 149749b5e25fSSatish Balay /* copy values over */ 14989566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 14993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 150049b5e25fSSatish Balay } 150149b5e25fSSatish Balay 1502d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat) 1503d71ae5a4SJacob Faibussowitsch { 15044afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1505d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 150649b5e25fSSatish Balay 150749b5e25fSSatish Balay PetscFunctionBegin; 150808401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 150928b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 151049b5e25fSSatish Balay 151149b5e25fSSatish Balay /* copy values over */ 15129566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 15133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 151449b5e25fSSatish Balay } 151549b5e25fSSatish Balay 1516d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B, PetscInt bs, PetscInt nz, PetscInt *nnz) 1517d71ae5a4SJacob Faibussowitsch { 1518c464158bSHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 15194dcd73b1SHong Zhang PetscInt i, mbs, nbs, bs2; 15202576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, flg = PETSC_FALSE, realalloc = PETSC_FALSE; 152149b5e25fSSatish Balay 152249b5e25fSSatish Balay PetscFunctionBegin; 15232576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 1524db4efbfdSBarry Smith 15259566063dSJacob Faibussowitsch PetscCall(MatSetBlockSize(B, PetscAbs(bs))); 15269566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 15279566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 152808401ef6SPierre Jolivet PetscCheck(B->rmap->N <= B->cmap->N, PETSC_COMM_SELF, PETSC_ERR_SUP, "SEQSBAIJ matrix cannot have more rows %" PetscInt_FMT " than columns %" PetscInt_FMT, B->rmap->N, B->cmap->N); 15299566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 1530899cda47SBarry Smith 153121940c7eSstefano_zampini B->preallocated = PETSC_TRUE; 153221940c7eSstefano_zampini 1533d0f46423SBarry Smith mbs = B->rmap->N / bs; 15344dcd73b1SHong Zhang nbs = B->cmap->n / bs; 153549b5e25fSSatish Balay bs2 = bs * bs; 153649b5e25fSSatish Balay 1537aed4548fSBarry Smith PetscCheck(mbs * bs == B->rmap->N && nbs * bs == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Number rows, cols must be divisible by blocksize"); 153849b5e25fSSatish Balay 1539ab93d7beSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 1540ab93d7beSBarry Smith skipallocation = PETSC_TRUE; 1541ab93d7beSBarry Smith nz = 0; 1542ab93d7beSBarry Smith } 1543ab93d7beSBarry Smith 1544435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3; 154508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 154649b5e25fSSatish Balay if (nnz) { 154749b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 154808401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 154908401ef6SPierre Jolivet PetscCheck(nnz[i] <= nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than block row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " block rowlength %" PetscInt_FMT, i, nnz[i], nbs); 155049b5e25fSSatish Balay } 155149b5e25fSSatish Balay } 155249b5e25fSSatish Balay 1553db4efbfdSBarry Smith B->ops->mult = MatMult_SeqSBAIJ_N; 1554db4efbfdSBarry Smith B->ops->multadd = MatMultAdd_SeqSBAIJ_N; 1555db4efbfdSBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_N; 1556db4efbfdSBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N; 155726fbe8dcSKarl Rupp 15589566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 155949b5e25fSSatish Balay if (!flg) { 156049b5e25fSSatish Balay switch (bs) { 156149b5e25fSSatish Balay case 1: 156249b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_1; 156349b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_1; 1564431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_1; 1565431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1; 156649b5e25fSSatish Balay break; 156749b5e25fSSatish Balay case 2: 156849b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_2; 156949b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_2; 1570431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_2; 1571431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2; 157249b5e25fSSatish Balay break; 157349b5e25fSSatish Balay case 3: 157449b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_3; 157549b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_3; 1576431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_3; 1577431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3; 157849b5e25fSSatish Balay break; 157949b5e25fSSatish Balay case 4: 158049b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_4; 158149b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_4; 1582431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_4; 1583431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4; 158449b5e25fSSatish Balay break; 158549b5e25fSSatish Balay case 5: 158649b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_5; 158749b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_5; 1588431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_5; 1589431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5; 159049b5e25fSSatish Balay break; 159149b5e25fSSatish Balay case 6: 159249b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_6; 159349b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_6; 1594431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_6; 1595431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6; 159649b5e25fSSatish Balay break; 159749b5e25fSSatish Balay case 7: 1598de53e5efSHong Zhang B->ops->mult = MatMult_SeqSBAIJ_7; 159949b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_7; 1600431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_7; 1601431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7; 160249b5e25fSSatish Balay break; 160349b5e25fSSatish Balay } 160449b5e25fSSatish Balay } 160549b5e25fSSatish Balay 160649b5e25fSSatish Balay b->mbs = mbs; 16074dcd73b1SHong Zhang b->nbs = nbs; 1608ab93d7beSBarry Smith if (!skipallocation) { 16092ee49352SLisandro Dalcin if (!b->imax) { 16109566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mbs, &b->imax, mbs, &b->ilen)); 161126fbe8dcSKarl Rupp 1612c760cd28SBarry Smith b->free_imax_ilen = PETSC_TRUE; 16132ee49352SLisandro Dalcin } 161449b5e25fSSatish Balay if (!nnz) { 1615435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 161649b5e25fSSatish Balay else if (nz <= 0) nz = 1; 16175d2a9ed1SStefano Zampini nz = PetscMin(nbs, nz); 161826fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->imax[i] = nz; 16199566063dSJacob Faibussowitsch PetscCall(PetscIntMultError(nz, mbs, &nz)); 162049b5e25fSSatish Balay } else { 1621c73702f5SBarry Smith PetscInt64 nz64 = 0; 16229371c9d4SSatish Balay for (i = 0; i < mbs; i++) { 16239371c9d4SSatish Balay b->imax[i] = nnz[i]; 16249371c9d4SSatish Balay nz64 += nnz[i]; 16259371c9d4SSatish Balay } 16269566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 162749b5e25fSSatish Balay } 16282ee49352SLisandro Dalcin /* b->ilen will count nonzeros in each block row so far. */ 162926fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->ilen[i] = 0; 16306c6c5352SBarry Smith /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */ 163149b5e25fSSatish Balay 163249b5e25fSSatish Balay /* allocate the matrix space */ 16339566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 16349566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &b->a, nz, &b->j, B->rmap->N + 1, &b->i)); 16359566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->a, nz * bs2)); 16369566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->j, nz)); 163726fbe8dcSKarl Rupp 163849b5e25fSSatish Balay b->singlemalloc = PETSC_TRUE; 163949b5e25fSSatish Balay 164049b5e25fSSatish Balay /* pointer to beginning of each row */ 1641e60cf9a0SBarry Smith b->i[0] = 0; 164226fbe8dcSKarl Rupp for (i = 1; i < mbs + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 164326fbe8dcSKarl Rupp 1644e6b907acSBarry Smith b->free_a = PETSC_TRUE; 1645e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 1646e811da20SHong Zhang } else { 1647e6b907acSBarry Smith b->free_a = PETSC_FALSE; 1648e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 1649ab93d7beSBarry Smith } 165049b5e25fSSatish Balay 165149b5e25fSSatish Balay b->bs2 = bs2; 16526c6c5352SBarry Smith b->nz = 0; 1653b32cb4a7SJed Brown b->maxnz = nz; 1654f4259b30SLisandro Dalcin b->inew = NULL; 1655f4259b30SLisandro Dalcin b->jnew = NULL; 1656f4259b30SLisandro Dalcin b->anew = NULL; 1657f4259b30SLisandro Dalcin b->a2anew = NULL; 16581a3463dfSHong Zhang b->permute = PETSC_FALSE; 1659cb7b82ddSBarry Smith 1660cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 1661cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 16629566063dSJacob Faibussowitsch if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 16633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1664c464158bSHong Zhang } 1665153ea458SHong Zhang 1666d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B, PetscInt bs, const PetscInt ii[], const PetscInt jj[], const PetscScalar V[]) 1667d71ae5a4SJacob Faibussowitsch { 16680cd7f59aSBarry Smith PetscInt i, j, m, nz, anz, nz_max = 0, *nnz; 1669f4259b30SLisandro Dalcin PetscScalar *values = NULL; 167038f409ebSLisandro Dalcin PetscBool roworiented = ((Mat_SeqSBAIJ *)B->data)->roworiented; 16710cd7f59aSBarry Smith 167238f409ebSLisandro Dalcin PetscFunctionBegin; 167308401ef6SPierre Jolivet PetscCheck(bs >= 1, PetscObjectComm((PetscObject)B), PETSC_ERR_ARG_OUTOFRANGE, "Invalid block size specified, must be positive but it is %" PetscInt_FMT, bs); 16749566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->rmap, bs)); 16759566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->cmap, bs)); 16769566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 16779566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 16789566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 167938f409ebSLisandro Dalcin m = B->rmap->n / bs; 168038f409ebSLisandro Dalcin 1681aed4548fSBarry Smith PetscCheck(!ii[0], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "ii[0] must be 0 but it is %" PetscInt_FMT, ii[0]); 16829566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 168338f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 168438f409ebSLisandro Dalcin nz = ii[i + 1] - ii[i]; 168508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 16860cd7f59aSBarry Smith anz = 0; 16870cd7f59aSBarry Smith for (j = 0; j < nz; j++) { 16880cd7f59aSBarry Smith /* count only values on the diagonal or above */ 16890cd7f59aSBarry Smith if (jj[ii[i] + j] >= i) { 16900cd7f59aSBarry Smith anz = nz - j; 16910cd7f59aSBarry Smith break; 16920cd7f59aSBarry Smith } 16930cd7f59aSBarry Smith } 16940cd7f59aSBarry Smith nz_max = PetscMax(nz_max, anz); 16950cd7f59aSBarry Smith nnz[i] = anz; 169638f409ebSLisandro Dalcin } 16979566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 16989566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 169938f409ebSLisandro Dalcin 170038f409ebSLisandro Dalcin values = (PetscScalar *)V; 170148a46eb9SPierre Jolivet if (!values) PetscCall(PetscCalloc1(bs * bs * nz_max, &values)); 170238f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 170338f409ebSLisandro Dalcin PetscInt ncols = ii[i + 1] - ii[i]; 170438f409ebSLisandro Dalcin const PetscInt *icols = jj + ii[i]; 170538f409ebSLisandro Dalcin if (!roworiented || bs == 1) { 170638f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * ii[i]) : 0); 17079566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, ncols, icols, svals, INSERT_VALUES)); 170838f409ebSLisandro Dalcin } else { 170938f409ebSLisandro Dalcin for (j = 0; j < ncols; j++) { 171038f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * (ii[i] + j)) : 0); 17119566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, 1, &icols[j], svals, INSERT_VALUES)); 171238f409ebSLisandro Dalcin } 171338f409ebSLisandro Dalcin } 171438f409ebSLisandro Dalcin } 17159566063dSJacob Faibussowitsch if (!V) PetscCall(PetscFree(values)); 17169566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 17179566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 17189566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 17193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 172038f409ebSLisandro Dalcin } 172138f409ebSLisandro Dalcin 1722db4efbfdSBarry Smith /* 1723db4efbfdSBarry Smith This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization 1724db4efbfdSBarry Smith */ 1725d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B, PetscBool natural) 1726d71ae5a4SJacob Faibussowitsch { 1727ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 1728db4efbfdSBarry Smith PetscInt bs = B->rmap->bs; 1729db4efbfdSBarry Smith 1730db4efbfdSBarry Smith PetscFunctionBegin; 17319566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 1732db4efbfdSBarry Smith if (flg) bs = 8; 1733db4efbfdSBarry Smith 1734db4efbfdSBarry Smith if (!natural) { 1735db4efbfdSBarry Smith switch (bs) { 1736d71ae5a4SJacob Faibussowitsch case 1: 1737d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace; 1738d71ae5a4SJacob Faibussowitsch break; 1739d71ae5a4SJacob Faibussowitsch case 2: 1740d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2; 1741d71ae5a4SJacob Faibussowitsch break; 1742d71ae5a4SJacob Faibussowitsch case 3: 1743d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3; 1744d71ae5a4SJacob Faibussowitsch break; 1745d71ae5a4SJacob Faibussowitsch case 4: 1746d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4; 1747d71ae5a4SJacob Faibussowitsch break; 1748d71ae5a4SJacob Faibussowitsch case 5: 1749d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5; 1750d71ae5a4SJacob Faibussowitsch break; 1751d71ae5a4SJacob Faibussowitsch case 6: 1752d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6; 1753d71ae5a4SJacob Faibussowitsch break; 1754d71ae5a4SJacob Faibussowitsch case 7: 1755d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7; 1756d71ae5a4SJacob Faibussowitsch break; 1757d71ae5a4SJacob Faibussowitsch default: 1758d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N; 1759d71ae5a4SJacob Faibussowitsch break; 1760db4efbfdSBarry Smith } 1761db4efbfdSBarry Smith } else { 1762db4efbfdSBarry Smith switch (bs) { 1763d71ae5a4SJacob Faibussowitsch case 1: 1764d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace; 1765d71ae5a4SJacob Faibussowitsch break; 1766d71ae5a4SJacob Faibussowitsch case 2: 1767d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering; 1768d71ae5a4SJacob Faibussowitsch break; 1769d71ae5a4SJacob Faibussowitsch case 3: 1770d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering; 1771d71ae5a4SJacob Faibussowitsch break; 1772d71ae5a4SJacob Faibussowitsch case 4: 1773d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering; 1774d71ae5a4SJacob Faibussowitsch break; 1775d71ae5a4SJacob Faibussowitsch case 5: 1776d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering; 1777d71ae5a4SJacob Faibussowitsch break; 1778d71ae5a4SJacob Faibussowitsch case 6: 1779d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering; 1780d71ae5a4SJacob Faibussowitsch break; 1781d71ae5a4SJacob Faibussowitsch case 7: 1782d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering; 1783d71ae5a4SJacob Faibussowitsch break; 1784d71ae5a4SJacob Faibussowitsch default: 1785d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering; 1786d71ae5a4SJacob Faibussowitsch break; 1787db4efbfdSBarry Smith } 1788db4efbfdSBarry Smith } 17893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1790db4efbfdSBarry Smith } 1791db4efbfdSBarry Smith 1792cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType, MatReuse, Mat *); 1793cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType, MatReuse, Mat *); 1794d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatFactorGetSolverType_petsc(Mat A, MatSolverType *type) 1795d71ae5a4SJacob Faibussowitsch { 17964ac6704cSBarry Smith PetscFunctionBegin; 17974ac6704cSBarry Smith *type = MATSOLVERPETSC; 17983ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17994ac6704cSBarry Smith } 1800d769727bSBarry Smith 1801d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A, MatFactorType ftype, Mat *B) 1802d71ae5a4SJacob Faibussowitsch { 1803d0f46423SBarry Smith PetscInt n = A->rmap->n; 18045c9eb25fSBarry Smith 18055c9eb25fSBarry Smith PetscFunctionBegin; 18060e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX) 1807b94d7dedSBarry Smith PetscCheck(A->hermitian != PETSC_BOOL3_TRUE || A->symmetric == PETSC_BOOL3_TRUE || (ftype != MAT_FACTOR_CHOLESKY && ftype != MAT_FACTOR_ICC), PETSC_COMM_SELF, PETSC_ERR_SUP, "Hermitian CHOLESKY or ICC Factor is not supported"); 18080e92d65fSHong Zhang #endif 1809eb1ec7c1SStefano Zampini 18109566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 18119566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, n, n, n, n)); 18125c9eb25fSBarry Smith if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) { 18139566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATSEQSBAIJ)); 18149566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*B, A->rmap->bs, MAT_SKIP_ALLOCATION, NULL)); 181526fbe8dcSKarl Rupp 18167b056e98SHong Zhang (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ; 1817c6d0d4f0SHong Zhang (*B)->ops->iccfactorsymbolic = MatICCFactorSymbolic_SeqSBAIJ; 18189566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_CHOLESKY])); 18199566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_ICC])); 1820e32f2f54SBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "Factor type not supported"); 182100c67f3bSHong Zhang 1822d5f3da31SBarry Smith (*B)->factortype = ftype; 1823f73b0415SBarry Smith (*B)->canuseordering = PETSC_TRUE; 18249566063dSJacob Faibussowitsch PetscCall(PetscFree((*B)->solvertype)); 18259566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &(*B)->solvertype)); 18269566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)*B, "MatFactorGetSolverType_C", MatFactorGetSolverType_petsc)); 18273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18285c9eb25fSBarry Smith } 18295c9eb25fSBarry Smith 18308397e458SBarry Smith /*@C 183111a5261eSBarry Smith MatSeqSBAIJGetArray - gives access to the array where the data for a `MATSEQSBAIJ` matrix is stored 18328397e458SBarry Smith 18338397e458SBarry Smith Not Collective 18348397e458SBarry Smith 18358397e458SBarry Smith Input Parameter: 183611a5261eSBarry Smith . mat - a `MATSEQSBAIJ` matrix 18378397e458SBarry Smith 18388397e458SBarry Smith Output Parameter: 18398397e458SBarry Smith . array - pointer to the data 18408397e458SBarry Smith 18418397e458SBarry Smith Level: intermediate 18428397e458SBarry Smith 184311a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatSeqSBAIJRestoreArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18448397e458SBarry Smith @*/ 1845d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJGetArray(Mat A, PetscScalar **array) 1846d71ae5a4SJacob Faibussowitsch { 18478397e458SBarry Smith PetscFunctionBegin; 1848cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJGetArray_C", (Mat, PetscScalar **), (A, array)); 18493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18508397e458SBarry Smith } 18518397e458SBarry Smith 18528397e458SBarry Smith /*@C 185311a5261eSBarry Smith MatSeqSBAIJRestoreArray - returns access to the array where the data for a `MATSEQSBAIJ` matrix is stored obtained by `MatSeqSBAIJGetArray()` 18548397e458SBarry Smith 18558397e458SBarry Smith Not Collective 18568397e458SBarry Smith 18578397e458SBarry Smith Input Parameters: 1858a2b725a8SWilliam Gropp + mat - a MATSEQSBAIJ matrix 1859a2b725a8SWilliam Gropp - array - pointer to the data 18608397e458SBarry Smith 18618397e458SBarry Smith Level: intermediate 18628397e458SBarry Smith 186311a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatSeqSBAIJGetArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18648397e458SBarry Smith @*/ 1865d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJRestoreArray(Mat A, PetscScalar **array) 1866d71ae5a4SJacob Faibussowitsch { 18678397e458SBarry Smith PetscFunctionBegin; 1868cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJRestoreArray_C", (Mat, PetscScalar **), (A, array)); 18693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18708397e458SBarry Smith } 18718397e458SBarry Smith 18720bad9183SKris Buschelman /*MC 1873fafad747SKris Buschelman MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices, 18740bad9183SKris Buschelman based on block compressed sparse row format. Only the upper triangular portion of the matrix is stored. 18750bad9183SKris Buschelman 1876828413b8SBarry Smith For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you 187711a5261eSBarry Smith can call `MatSetOption`(`Mat`, `MAT_HERMITIAN`). 1878828413b8SBarry Smith 18790bad9183SKris Buschelman Options Database Keys: 188011a5261eSBarry Smith . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to `MatSetFromOptions()` 18810bad9183SKris Buschelman 188295452b02SPatrick Sanan Notes: 188395452b02SPatrick Sanan By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not 188411a5261eSBarry Smith stored and it is assumed they symmetric to the upper triangular). If you call `MatSetOption`(`Mat`,`MAT_IGNORE_LOWER_TRIANGULAR`,`PETSC_FALSE`) or use 188571dad5bbSBarry Smith the options database -mat_ignore_lower_triangular false it will generate an error if you try to set a value in the lower triangular portion. 188671dad5bbSBarry Smith 1887476417e5SBarry Smith The number of rows in the matrix must be less than or equal to the number of columns 188871dad5bbSBarry Smith 18890bad9183SKris Buschelman Level: beginner 18900bad9183SKris Buschelman 189111a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreateSeqSBAIJ()`, `MatType`, `MATMPISBAIJ` 18920bad9183SKris Buschelman M*/ 1893d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B) 1894d71ae5a4SJacob Faibussowitsch { 1895a23d5eceSKris Buschelman Mat_SeqSBAIJ *b; 189613f74950SBarry Smith PetscMPIInt size; 1897ace3abfcSBarry Smith PetscBool no_unroll = PETSC_FALSE, no_inode = PETSC_FALSE; 1898a23d5eceSKris Buschelman 1899a23d5eceSKris Buschelman PetscFunctionBegin; 19009566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 190108401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Comm must be of size 1"); 1902a23d5eceSKris Buschelman 19034dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 1904a23d5eceSKris Buschelman B->data = (void *)b; 19059566063dSJacob Faibussowitsch PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps))); 190626fbe8dcSKarl Rupp 1907a23d5eceSKris Buschelman B->ops->destroy = MatDestroy_SeqSBAIJ; 1908a23d5eceSKris Buschelman B->ops->view = MatView_SeqSBAIJ; 1909f4259b30SLisandro Dalcin b->row = NULL; 1910f4259b30SLisandro Dalcin b->icol = NULL; 1911a23d5eceSKris Buschelman b->reallocs = 0; 1912f4259b30SLisandro Dalcin b->saved_values = NULL; 19130def2e27SBarry Smith b->inode.limit = 5; 19140def2e27SBarry Smith b->inode.max_limit = 5; 1915a23d5eceSKris Buschelman 1916a23d5eceSKris Buschelman b->roworiented = PETSC_TRUE; 1917a23d5eceSKris Buschelman b->nonew = 0; 1918f4259b30SLisandro Dalcin b->diag = NULL; 1919f4259b30SLisandro Dalcin b->solve_work = NULL; 1920f4259b30SLisandro Dalcin b->mult_work = NULL; 1921f4259b30SLisandro Dalcin B->spptr = NULL; 1922f2cbd3d5SJed Brown B->info.nz_unneeded = (PetscReal)b->maxnz * b->bs2; 1923a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 1924a23d5eceSKris Buschelman 1925f4259b30SLisandro Dalcin b->inew = NULL; 1926f4259b30SLisandro Dalcin b->jnew = NULL; 1927f4259b30SLisandro Dalcin b->anew = NULL; 1928f4259b30SLisandro Dalcin b->a2anew = NULL; 1929a23d5eceSKris Buschelman b->permute = PETSC_FALSE; 1930a23d5eceSKris Buschelman 193171dad5bbSBarry Smith b->ignore_ltriangular = PETSC_TRUE; 193226fbe8dcSKarl Rupp 19339566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_ignore_lower_triangular", &b->ignore_ltriangular, NULL)); 1934941593c8SHong Zhang 1935f5edf698SHong Zhang b->getrow_utriangular = PETSC_FALSE; 193626fbe8dcSKarl Rupp 19379566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_getrow_uppertriangular", &b->getrow_utriangular, NULL)); 1938f5edf698SHong Zhang 19399566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJGetArray_C", MatSeqSBAIJGetArray_SeqSBAIJ)); 19409566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJRestoreArray_C", MatSeqSBAIJRestoreArray_SeqSBAIJ)); 19419566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqSBAIJ)); 19429566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqSBAIJ)); 19439566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetColumnIndices_C", MatSeqSBAIJSetColumnIndices_SeqSBAIJ)); 19449566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqaij_C", MatConvert_SeqSBAIJ_SeqAIJ)); 19459566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqbaij_C", MatConvert_SeqSBAIJ_SeqBAIJ)); 19469566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocation_C", MatSeqSBAIJSetPreallocation_SeqSBAIJ)); 19479566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocationCSR_C", MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ)); 19486214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 19499566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_elemental_C", MatConvert_SeqSBAIJ_Elemental)); 19506214f412SHong Zhang #endif 1951d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 19529566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_scalapack_C", MatConvert_SBAIJ_ScaLAPACK)); 1953d24d4204SJose E. Roman #endif 195423ce1328SBarry Smith 1955b94d7dedSBarry Smith B->symmetry_eternal = PETSC_TRUE; 1956b94d7dedSBarry Smith B->structural_symmetry_eternal = PETSC_TRUE; 1957b94d7dedSBarry Smith B->symmetric = PETSC_BOOL3_TRUE; 1958b94d7dedSBarry Smith B->structurally_symmetric = PETSC_BOOL3_TRUE; 1959eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 1960b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_FALSE; 1961eb1ec7c1SStefano Zampini #else 1962b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_TRUE; 1963eb1ec7c1SStefano Zampini #endif 196413647f61SHong Zhang 19659566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQSBAIJ)); 19660def2e27SBarry Smith 1967d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)B), ((PetscObject)B)->prefix, "Options for SEQSBAIJ matrix", "Mat"); 19689566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_unroll", "Do not optimize for inodes (slower)", NULL, no_unroll, &no_unroll, NULL)); 196948a46eb9SPierre Jolivet if (no_unroll) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_unroll\n")); 19709566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_inode", "Do not optimize for inodes (slower)", NULL, no_inode, &no_inode, NULL)); 19719566063dSJacob Faibussowitsch if (no_inode) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_inode\n")); 19729566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-mat_inode_limit", "Do not use inodes larger then this value", NULL, b->inode.limit, &b->inode.limit, NULL)); 1973d0609cedSBarry Smith PetscOptionsEnd(); 1974ace3abfcSBarry Smith b->inode.use = (PetscBool)(!(no_unroll || no_inode)); 19750def2e27SBarry Smith if (b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit; 19763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1977a23d5eceSKris Buschelman } 1978a23d5eceSKris Buschelman 1979a23d5eceSKris Buschelman /*@C 1980a23d5eceSKris Buschelman MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block 198111a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 1982a23d5eceSKris Buschelman user should preallocate the matrix storage by setting the parameter nz 1983a23d5eceSKris Buschelman (or the array nnz). By setting these parameters accurately, performance 1984a23d5eceSKris Buschelman during matrix assembly can be increased by more than a factor of 50. 1985a23d5eceSKris Buschelman 1986c3339decSBarry Smith Collective 1987a23d5eceSKris Buschelman 1988a23d5eceSKris Buschelman Input Parameters: 19891c4f3114SJed Brown + B - the symmetric matrix 199011a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 199111a5261eSBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()` 1992a23d5eceSKris Buschelman . nz - number of block nonzeros per block row (same for all rows) 1993a23d5eceSKris Buschelman - nnz - array containing the number of block nonzeros in the upper triangular plus 19940298fd71SBarry Smith diagonal portion of each block (possibly different for each block row) or NULL 1995a23d5eceSKris Buschelman 1996a23d5eceSKris Buschelman Options Database Keys: 1997a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 1998a23d5eceSKris Buschelman block calculations (much slower) 1999a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use (only works if a negative bs is passed in 2000a23d5eceSKris Buschelman 2001a23d5eceSKris Buschelman Level: intermediate 2002a23d5eceSKris Buschelman 2003a23d5eceSKris Buschelman Notes: 2004a23d5eceSKris Buschelman Specify the preallocated storage with either nz or nnz (not both). 200511a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 2006651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2007a23d5eceSKris Buschelman 200811a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 2009aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 2010aa95bbe8SBarry Smith You can also run with the option -info and look for messages with the string 2011aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 2012aa95bbe8SBarry Smith 201349a6f317SBarry Smith If the nnz parameter is given then the nz parameter is ignored 201449a6f317SBarry Smith 2015651615e1SBarry Smith .seealso: [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2016a23d5eceSKris Buschelman @*/ 2017d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 2018d71ae5a4SJacob Faibussowitsch { 2019a23d5eceSKris Buschelman PetscFunctionBegin; 20206ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 20216ba663aaSJed Brown PetscValidType(B, 1); 20226ba663aaSJed Brown PetscValidLogicalCollectiveInt(B, bs, 2); 2023cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocation_C", (Mat, PetscInt, PetscInt, const PetscInt[]), (B, bs, nz, nnz)); 20243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2025a23d5eceSKris Buschelman } 202649b5e25fSSatish Balay 202738f409ebSLisandro Dalcin /*@C 202811a5261eSBarry Smith MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in `MATSEQSBAIJ` format using the given nonzero structure and (optional) numerical values 202938f409ebSLisandro Dalcin 203038f409ebSLisandro Dalcin Input Parameters: 20311c4f3114SJed Brown + B - the matrix 2032eab78319SHong Zhang . bs - size of block, the blocks are ALWAYS square. 203338f409ebSLisandro Dalcin . i - the indices into j for the start of each local row (starts with zero) 203438f409ebSLisandro Dalcin . j - the column indices for each local row (starts with zero) these must be sorted for each row 203538f409ebSLisandro Dalcin - v - optional values in the matrix 203638f409ebSLisandro Dalcin 2037664954b6SBarry Smith Level: advanced 203838f409ebSLisandro Dalcin 203938f409ebSLisandro Dalcin Notes: 204011a5261eSBarry Smith The order of the entries in values is specified by the `MatOption` `MAT_ROW_ORIENTED`. For example, C programs 204111a5261eSBarry Smith may want to use the default `MAT_ROW_ORIENTED` = `PETSC_TRUE` and use an array v[nnz][bs][bs] where the second index is 204238f409ebSLisandro Dalcin over rows within a block and the last index is over columns within a block row. Fortran programs will likely set 204311a5261eSBarry Smith `MAT_ROW_ORIENTED` = `PETSC_FALSE` and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a 204438f409ebSLisandro Dalcin block column and the second index is over columns within a block. 204538f409ebSLisandro Dalcin 204650c5228eSBarry Smith Any entries below the diagonal are ignored 20470cd7f59aSBarry Smith 20480cd7f59aSBarry Smith Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries 20490cd7f59aSBarry Smith and usually the numerical values as well 2050664954b6SBarry Smith 205111a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqSBAIJ()`, `MatSetValuesBlocked()`, `MatSeqSBAIJSetPreallocation()`, `MATSEQSBAIJ` 205238f409ebSLisandro Dalcin @*/ 2053d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B, PetscInt bs, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 2054d71ae5a4SJacob Faibussowitsch { 205538f409ebSLisandro Dalcin PetscFunctionBegin; 205638f409ebSLisandro Dalcin PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 205738f409ebSLisandro Dalcin PetscValidType(B, 1); 205838f409ebSLisandro Dalcin PetscValidLogicalCollectiveInt(B, bs, 2); 2059cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocationCSR_C", (Mat, PetscInt, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, bs, i, j, v)); 20603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 206138f409ebSLisandro Dalcin } 206238f409ebSLisandro Dalcin 2063c464158bSHong Zhang /*@C 2064c464158bSHong Zhang MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in block AIJ (block 206511a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 2066c464158bSHong Zhang user should preallocate the matrix storage by setting the parameter nz 2067c464158bSHong Zhang (or the array nnz). By setting these parameters accurately, performance 2068c464158bSHong Zhang during matrix assembly can be increased by more than a factor of 50. 206949b5e25fSSatish Balay 2070d083f849SBarry Smith Collective 2071c464158bSHong Zhang 2072c464158bSHong Zhang Input Parameters: 207311a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 207411a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 2075bb7ae925SBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs() 2076c464158bSHong Zhang . m - number of rows, or number of columns 2077c464158bSHong Zhang . nz - number of block nonzeros per block row (same for all rows) 2078744e8345SSatish Balay - nnz - array containing the number of block nonzeros in the upper triangular plus 20790298fd71SBarry Smith diagonal portion of each block (possibly different for each block row) or NULL 2080c464158bSHong Zhang 2081c464158bSHong Zhang Output Parameter: 2082c464158bSHong Zhang . A - the symmetric matrix 2083c464158bSHong Zhang 2084c464158bSHong Zhang Options Database Keys: 2085a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2086c464158bSHong Zhang block calculations (much slower) 2087a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use 2088c464158bSHong Zhang 2089c464158bSHong Zhang Level: intermediate 2090c464158bSHong Zhang 209111a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 2092f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 209311a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 2094175b88e8SBarry Smith 2095c464158bSHong Zhang Notes: 20966d6d819aSHong Zhang The number of rows and columns must be divisible by blocksize. 20976d6d819aSHong Zhang This matrix type does not support complex Hermitian operation. 2098c464158bSHong Zhang 2099c464158bSHong Zhang Specify the preallocated storage with either nz or nnz (not both). 210011a5261eSBarry Smith Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory 2101651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2102c464158bSHong Zhang 210349a6f317SBarry Smith If the nnz parameter is given then the nz parameter is ignored 210449a6f317SBarry Smith 2105651615e1SBarry Smith .seealso: [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2106c464158bSHong Zhang @*/ 2107d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 2108d71ae5a4SJacob Faibussowitsch { 2109c464158bSHong Zhang PetscFunctionBegin; 21109566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 21119566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 21129566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQSBAIJ)); 21139566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*A, bs, nz, (PetscInt *)nnz)); 21143ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 211549b5e25fSSatish Balay } 211649b5e25fSSatish Balay 2117d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 2118d71ae5a4SJacob Faibussowitsch { 211949b5e25fSSatish Balay Mat C; 212049b5e25fSSatish Balay Mat_SeqSBAIJ *c, *a = (Mat_SeqSBAIJ *)A->data; 2121b40805acSSatish Balay PetscInt i, mbs = a->mbs, nz = a->nz, bs2 = a->bs2; 212249b5e25fSSatish Balay 212349b5e25fSSatish Balay PetscFunctionBegin; 212408401ef6SPierre Jolivet PetscCheck(a->i[mbs] == nz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Corrupt matrix"); 212549b5e25fSSatish Balay 2126f4259b30SLisandro Dalcin *B = NULL; 21279566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 21289566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->rmap->N, A->cmap->n, A->rmap->N, A->cmap->n)); 21299566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, A)); 21309566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATSEQSBAIJ)); 2131692f9cbeSHong Zhang c = (Mat_SeqSBAIJ *)C->data; 2132692f9cbeSHong Zhang 2133273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2134d5f3da31SBarry Smith C->factortype = A->factortype; 2135f4259b30SLisandro Dalcin c->row = NULL; 2136f4259b30SLisandro Dalcin c->icol = NULL; 2137f4259b30SLisandro Dalcin c->saved_values = NULL; 2138a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 213949b5e25fSSatish Balay C->assembled = PETSC_TRUE; 214049b5e25fSSatish Balay 21419566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 21429566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 214349b5e25fSSatish Balay c->bs2 = a->bs2; 214449b5e25fSSatish Balay c->mbs = a->mbs; 214549b5e25fSSatish Balay c->nbs = a->nbs; 214649b5e25fSSatish Balay 2147c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2148c760cd28SBarry Smith c->imax = a->imax; 2149c760cd28SBarry Smith c->ilen = a->ilen; 2150c760cd28SBarry Smith c->free_imax_ilen = PETSC_FALSE; 2151c760cd28SBarry Smith } else { 21529566063dSJacob Faibussowitsch PetscCall(PetscMalloc2((mbs + 1), &c->imax, (mbs + 1), &c->ilen)); 215349b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 215449b5e25fSSatish Balay c->imax[i] = a->imax[i]; 215549b5e25fSSatish Balay c->ilen[i] = a->ilen[i]; 215649b5e25fSSatish Balay } 2157c760cd28SBarry Smith c->free_imax_ilen = PETSC_TRUE; 2158c760cd28SBarry Smith } 215949b5e25fSSatish Balay 216049b5e25fSSatish Balay /* allocate the matrix space */ 21614da8f245SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 21629566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2 * nz, &c->a)); 216344e1c64aSLisandro Dalcin c->i = a->i; 216444e1c64aSLisandro Dalcin c->j = a->j; 21654da8f245SBarry Smith c->singlemalloc = PETSC_FALSE; 216644e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21674da8f245SBarry Smith c->free_ij = PETSC_FALSE; 21684da8f245SBarry Smith c->parent = A; 21699566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)A)); 21709566063dSJacob Faibussowitsch PetscCall(MatSetOption(A, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21719566063dSJacob Faibussowitsch PetscCall(MatSetOption(C, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21724da8f245SBarry Smith } else { 21739566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &c->a, nz, &c->j, mbs + 1, &c->i)); 21749566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, mbs + 1)); 21754da8f245SBarry Smith c->singlemalloc = PETSC_TRUE; 217644e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21774da8f245SBarry Smith c->free_ij = PETSC_TRUE; 21784da8f245SBarry Smith } 217949b5e25fSSatish Balay if (mbs > 0) { 218048a46eb9SPierre Jolivet if (cpvalues != MAT_SHARE_NONZERO_PATTERN) PetscCall(PetscArraycpy(c->j, a->j, nz)); 218149b5e25fSSatish Balay if (cpvalues == MAT_COPY_VALUES) { 21829566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, a->a, bs2 * nz)); 218349b5e25fSSatish Balay } else { 21849566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, bs2 * nz)); 218549b5e25fSSatish Balay } 2186a1c3900fSBarry Smith if (a->jshort) { 218744e1c64aSLisandro Dalcin /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */ 218844e1c64aSLisandro Dalcin /* if the parent matrix is reassembled, this child matrix will never notice */ 21899566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &c->jshort)); 21909566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->jshort, a->jshort, nz)); 219126fbe8dcSKarl Rupp 21924da8f245SBarry Smith c->free_jshort = PETSC_TRUE; 21934da8f245SBarry Smith } 2194a1c3900fSBarry Smith } 219549b5e25fSSatish Balay 219649b5e25fSSatish Balay c->roworiented = a->roworiented; 219749b5e25fSSatish Balay c->nonew = a->nonew; 219849b5e25fSSatish Balay 219949b5e25fSSatish Balay if (a->diag) { 2200c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2201c760cd28SBarry Smith c->diag = a->diag; 2202c760cd28SBarry Smith c->free_diag = PETSC_FALSE; 2203c760cd28SBarry Smith } else { 22049566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mbs, &c->diag)); 220526fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) c->diag[i] = a->diag[i]; 2206c760cd28SBarry Smith c->free_diag = PETSC_TRUE; 2207c760cd28SBarry Smith } 220844e1c64aSLisandro Dalcin } 22096c6c5352SBarry Smith c->nz = a->nz; 2210f2cbd3d5SJed Brown c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 2211f4259b30SLisandro Dalcin c->solve_work = NULL; 2212f4259b30SLisandro Dalcin c->mult_work = NULL; 221326fbe8dcSKarl Rupp 221449b5e25fSSatish Balay *B = C; 22159566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 22163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 221749b5e25fSSatish Balay } 221849b5e25fSSatish Balay 2219618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */ 2220618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary 2221618cc2edSLisandro Dalcin 2222d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqSBAIJ(Mat mat, PetscViewer viewer) 2223d71ae5a4SJacob Faibussowitsch { 22247f489da9SVaclav Hapla PetscBool isbinary; 22252f480046SShri Abhyankar 22262f480046SShri Abhyankar PetscFunctionBegin; 22279566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 222828b400f6SJacob Faibussowitsch PetscCheck(isbinary, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)mat)->type_name); 22299566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqSBAIJ_Binary(mat, viewer)); 22303ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22312f480046SShri Abhyankar } 22322f480046SShri Abhyankar 2233c75a6043SHong Zhang /*@ 223411a5261eSBarry Smith MatCreateSeqSBAIJWithArrays - Creates an sequential `MATSEQSBAIJ` matrix using matrix elements 2235c75a6043SHong Zhang (upper triangular entries in CSR format) provided by the user. 2236c75a6043SHong Zhang 2237d083f849SBarry Smith Collective 2238c75a6043SHong Zhang 2239c75a6043SHong Zhang Input Parameters: 2240c75a6043SHong Zhang + comm - must be an MPI communicator of size 1 2241c75a6043SHong Zhang . bs - size of block 2242c75a6043SHong Zhang . m - number of rows 2243c75a6043SHong Zhang . n - number of columns 2244483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that row block row of the matrix 2245c75a6043SHong Zhang . j - column indices 2246c75a6043SHong Zhang - a - matrix values 2247c75a6043SHong Zhang 2248c75a6043SHong Zhang Output Parameter: 2249c75a6043SHong Zhang . mat - the matrix 2250c75a6043SHong Zhang 2251dfb205c3SBarry Smith Level: advanced 2252c75a6043SHong Zhang 2253c75a6043SHong Zhang Notes: 2254c75a6043SHong Zhang The i, j, and a arrays are not copied by this routine, the user must free these arrays 2255c75a6043SHong Zhang once the matrix is destroyed 2256c75a6043SHong Zhang 2257c75a6043SHong Zhang You cannot set new nonzero locations into this matrix, that will generate an error. 2258c75a6043SHong Zhang 2259c75a6043SHong Zhang The i and j indices are 0 based 2260c75a6043SHong Zhang 226111a5261eSBarry Smith When block size is greater than 1 the matrix values must be stored using the SBAIJ storage format (see the SBAIJ source code to determine this). For block size of 1 2262dfb205c3SBarry Smith it is the regular CSR format excluding the lower triangular elements. 2263dfb205c3SBarry Smith 226411a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSBAIJ()`, `MatCreateSeqSBAIJ()` 2265c75a6043SHong Zhang @*/ 2266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 2267d71ae5a4SJacob Faibussowitsch { 2268c75a6043SHong Zhang PetscInt ii; 2269c75a6043SHong Zhang Mat_SeqSBAIJ *sbaij; 2270c75a6043SHong Zhang 2271c75a6043SHong Zhang PetscFunctionBegin; 227208401ef6SPierre Jolivet PetscCheck(bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "block size %" PetscInt_FMT " > 1 is not supported yet", bs); 2273aed4548fSBarry Smith PetscCheck(m == 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 2274c75a6043SHong Zhang 22759566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 22769566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 22779566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQSBAIJ)); 22789566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*mat, bs, MAT_SKIP_ALLOCATION, NULL)); 2279c75a6043SHong Zhang sbaij = (Mat_SeqSBAIJ *)(*mat)->data; 22809566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(m, &sbaij->imax, m, &sbaij->ilen)); 2281c75a6043SHong Zhang 2282c75a6043SHong Zhang sbaij->i = i; 2283c75a6043SHong Zhang sbaij->j = j; 2284c75a6043SHong Zhang sbaij->a = a; 228526fbe8dcSKarl Rupp 2286c75a6043SHong Zhang sbaij->singlemalloc = PETSC_FALSE; 2287c75a6043SHong Zhang sbaij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 2288e6b907acSBarry Smith sbaij->free_a = PETSC_FALSE; 2289e6b907acSBarry Smith sbaij->free_ij = PETSC_FALSE; 2290ddf7884eSMatthew Knepley sbaij->free_imax_ilen = PETSC_TRUE; 2291c75a6043SHong Zhang 2292c75a6043SHong Zhang for (ii = 0; ii < m; ii++) { 2293c75a6043SHong Zhang sbaij->ilen[ii] = sbaij->imax[ii] = i[ii + 1] - i[ii]; 22946bdcaf15SBarry Smith PetscCheck(i[ii + 1] >= i[ii], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 2295c75a6043SHong Zhang } 229676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 2297c75a6043SHong Zhang for (ii = 0; ii < sbaij->i[m]; ii++) { 22986bdcaf15SBarry Smith PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 22996bdcaf15SBarry Smith PetscCheck(j[ii] < n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index too large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 2300c75a6043SHong Zhang } 230176bd3646SJed Brown } 2302c75a6043SHong Zhang 23039566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 23049566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 23053ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2306c75a6043SHong Zhang } 2307d06b337dSHong Zhang 2308d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 2309d71ae5a4SJacob Faibussowitsch { 231059f5e6ceSHong Zhang PetscFunctionBegin; 23119566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm, inmat, n, scall, outmat)); 23123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 231359f5e6ceSHong Zhang } 2314