149b5e25fSSatish Balay /* 2a1373b80SHong Zhang Defines the basic matrix operations for the SBAIJ (compressed row) 349b5e25fSSatish Balay matrix storage format. 449b5e25fSSatish Balay */ 5c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/ 6c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 7c6db04a5SJed Brown #include <petscblaslapack.h> 849b5e25fSSatish Balay 9c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1070dcbbb9SBarry Smith #define USESHORT 11c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1270dcbbb9SBarry Smith 1326cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1426cec326SBarry Smith #define TYPE SBAIJ 1526cec326SBarry Smith #define TYPE_SBAIJ 1626cec326SBarry Smith #define TYPE_BS 1726cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1826cec326SBarry Smith #undef TYPE_BS 1926cec326SBarry Smith #define TYPE_BS _BS 2026cec326SBarry Smith #define TYPE_BS_ON 2126cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 2226cec326SBarry Smith #undef TYPE_BS 2326cec326SBarry Smith #undef TYPE_SBAIJ 2426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 2526cec326SBarry Smith #undef TYPE 2626cec326SBarry Smith #undef TYPE_BS_ON 2726cec326SBarry Smith 286214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 29cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 306214f412SHong Zhang #endif 31d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 32d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 33d24d4204SJose E. 
Roman #endif 3428d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat, MatType, MatReuse, Mat *); 35b5b17502SBarry Smith 3649b5e25fSSatish Balay /* 3749b5e25fSSatish Balay Checks for missing diagonals 3849b5e25fSSatish Balay */ 39ba38deedSJacob Faibussowitsch static PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A, PetscBool *missing, PetscInt *dd) 40d71ae5a4SJacob Faibussowitsch { 41045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 427734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 4349b5e25fSSatish Balay 4449b5e25fSSatish Balay PetscFunctionBegin; 459566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(A)); 462af78befSBarry Smith *missing = PETSC_FALSE; 477734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 48358d2f5dSShri Abhyankar *missing = PETSC_TRUE; 49358d2f5dSShri Abhyankar if (dd) *dd = 0; 509566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 51358d2f5dSShri Abhyankar } else { 52358d2f5dSShri Abhyankar diag = a->diag; 5349b5e25fSSatish Balay for (i = 0; i < a->mbs; i++) { 547734d3b5SMatthew G. 
Knepley if (diag[i] >= ii[i + 1]) { 552af78befSBarry Smith *missing = PETSC_TRUE; 562af78befSBarry Smith if (dd) *dd = i; 572af78befSBarry Smith break; 582af78befSBarry Smith } 5949b5e25fSSatish Balay } 60358d2f5dSShri Abhyankar } 613ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6249b5e25fSSatish Balay } 6349b5e25fSSatish Balay 64d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A) 65d71ae5a4SJacob Faibussowitsch { 66045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 6748dd3d27SHong Zhang PetscInt i, j; 6849b5e25fSSatish Balay 6949b5e25fSSatish Balay PetscFunctionBegin; 7009f38230SBarry Smith if (!a->diag) { 719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->mbs, &a->diag)); 72c760cd28SBarry Smith a->free_diag = PETSC_TRUE; 7309f38230SBarry Smith } 7448dd3d27SHong Zhang for (i = 0; i < a->mbs; i++) { 7548dd3d27SHong Zhang a->diag[i] = a->i[i + 1]; 7648dd3d27SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 7748dd3d27SHong Zhang if (a->j[j] == i) { 7848dd3d27SHong Zhang a->diag[i] = j; 7948dd3d27SHong Zhang break; 8048dd3d27SHong Zhang } 8148dd3d27SHong Zhang } 8248dd3d27SHong Zhang } 833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8449b5e25fSSatish Balay } 8549b5e25fSSatish Balay 86d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *inia[], const PetscInt *inja[], PetscBool *done) 87d71ae5a4SJacob Faibussowitsch { 88a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 892462f5fdSStefano Zampini PetscInt i, j, n = a->mbs, nz = a->i[n], *tia, *tja, bs = A->rmap->bs, k, l, cnt; 902462f5fdSStefano Zampini PetscInt **ia = (PetscInt **)inia, **ja = (PetscInt **)inja; 9149b5e25fSSatish Balay 9249b5e25fSSatish Balay PetscFunctionBegin; 93d3e5a4abSHong Zhang *nn = n; 943ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 
952462f5fdSStefano Zampini if (symmetric) { 969566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(n, a->i, a->j, PETSC_FALSE, 0, 0, &tia, &tja)); 972462f5fdSStefano Zampini nz = tia[n]; 982462f5fdSStefano Zampini } else { 999371c9d4SSatish Balay tia = a->i; 1009371c9d4SSatish Balay tja = a->j; 1012462f5fdSStefano Zampini } 1022462f5fdSStefano Zampini 1032462f5fdSStefano Zampini if (!blockcompressed && bs > 1) { 1042462f5fdSStefano Zampini (*nn) *= bs; 1058f7157efSSatish Balay /* malloc & create the natural set of indices */ 1069566063dSJacob Faibussowitsch PetscCall(PetscMalloc1((n + 1) * bs, ia)); 1072462f5fdSStefano Zampini if (n) { 1082462f5fdSStefano Zampini (*ia)[0] = oshift; 109ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[j] = (tia[1] - tia[0]) * bs + (*ia)[j - 1]; 1102462f5fdSStefano Zampini } 1112462f5fdSStefano Zampini 1122462f5fdSStefano Zampini for (i = 1; i < n; i++) { 1132462f5fdSStefano Zampini (*ia)[i * bs] = (tia[i] - tia[i - 1]) * bs + (*ia)[i * bs - 1]; 114ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[i * bs + j] = (tia[i + 1] - tia[i]) * bs + (*ia)[i * bs + j - 1]; 1152462f5fdSStefano Zampini } 116ad540459SPierre Jolivet if (n) (*ia)[n * bs] = (tia[n] - tia[n - 1]) * bs + (*ia)[n * bs - 1]; 1172462f5fdSStefano Zampini 1182462f5fdSStefano Zampini if (inja) { 1199566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz * bs * bs, ja)); 1202462f5fdSStefano Zampini cnt = 0; 1212462f5fdSStefano Zampini for (i = 0; i < n; i++) { 1228f7157efSSatish Balay for (j = 0; j < bs; j++) { 1232462f5fdSStefano Zampini for (k = tia[i]; k < tia[i + 1]; k++) { 124ad540459SPierre Jolivet for (l = 0; l < bs; l++) (*ja)[cnt++] = bs * tja[k] + l; 1258f7157efSSatish Balay } 1268f7157efSSatish Balay } 1278f7157efSSatish Balay } 1288f7157efSSatish Balay } 1292462f5fdSStefano Zampini 1302462f5fdSStefano Zampini if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */ 1319566063dSJacob Faibussowitsch 
PetscCall(PetscFree(tia)); 1329566063dSJacob Faibussowitsch PetscCall(PetscFree(tja)); 1332462f5fdSStefano Zampini } 1342462f5fdSStefano Zampini } else if (oshift == 1) { 1352462f5fdSStefano Zampini if (symmetric) { 1362462f5fdSStefano Zampini nz = tia[A->rmap->n / bs]; 1372462f5fdSStefano Zampini /* add 1 to i and j indices */ 1382462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) tia[i] = tia[i] + 1; 1392462f5fdSStefano Zampini *ia = tia; 1402462f5fdSStefano Zampini if (ja) { 1412462f5fdSStefano Zampini for (i = 0; i < nz; i++) tja[i] = tja[i] + 1; 1422462f5fdSStefano Zampini *ja = tja; 1432462f5fdSStefano Zampini } 1442462f5fdSStefano Zampini } else { 1452462f5fdSStefano Zampini nz = a->i[A->rmap->n / bs]; 1462462f5fdSStefano Zampini /* malloc space and add 1 to i and j indices */ 1479566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n / bs + 1, ia)); 1482462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) (*ia)[i] = a->i[i] + 1; 1492462f5fdSStefano Zampini if (ja) { 1509566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, ja)); 1512462f5fdSStefano Zampini for (i = 0; i < nz; i++) (*ja)[i] = a->j[i] + 1; 1522462f5fdSStefano Zampini } 1532462f5fdSStefano Zampini } 1542462f5fdSStefano Zampini } else { 1552462f5fdSStefano Zampini *ia = tia; 1562462f5fdSStefano Zampini if (ja) *ja = tja; 157a6ece127SHong Zhang } 1583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 15949b5e25fSSatish Balay } 16049b5e25fSSatish Balay 161d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 162d71ae5a4SJacob Faibussowitsch { 16349b5e25fSSatish Balay PetscFunctionBegin; 1643ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 1652462f5fdSStefano Zampini if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) { 
1669566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 1679566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 168a6ece127SHong Zhang } 1693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17049b5e25fSSatish Balay } 17149b5e25fSSatish Balay 172d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqSBAIJ(Mat A) 173d71ae5a4SJacob Faibussowitsch { 17449b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 17549b5e25fSSatish Balay 17649b5e25fSSatish Balay PetscFunctionBegin; 177b4e2f619SBarry Smith if (A->hash_active) { 178b4e2f619SBarry Smith PetscInt bs; 179e3c72094SPierre Jolivet A->ops[0] = a->cops; 180b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 181b4e2f619SBarry Smith PetscCall(MatGetBlockSize(A, &bs)); 182b4e2f619SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&a->bht)); 183b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 184b4e2f619SBarry Smith PetscCall(PetscFree(a->bdnz)); 185b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 186b4e2f619SBarry Smith } 1873ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->N, a->nz)); 1889566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 1899566063dSJacob Faibussowitsch if (a->free_diag) PetscCall(PetscFree(a->diag)); 1909566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1919566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1929566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 1939566063dSJacob Faibussowitsch PetscCall(PetscFree(a->idiag)); 1949566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inode.size)); 1959566063dSJacob Faibussowitsch if (a->free_imax_ilen) PetscCall(PetscFree2(a->imax, a->ilen)); 1969566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 1979566063dSJacob Faibussowitsch PetscCall(PetscFree(a->sor_work)); 1989566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solves_work)); 
1999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->mult_work)); 2009566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 2019566063dSJacob Faibussowitsch if (a->free_jshort) PetscCall(PetscFree(a->jshort)); 2029566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inew)); 2039566063dSJacob Faibussowitsch PetscCall(MatDestroy(&a->parent)); 2049566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 205901853e0SKris Buschelman 2069566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 2072e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJGetArray_C", NULL)); 2082e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJRestoreArray_C", NULL)); 2099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 2109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 2119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetColumnIndices_C", NULL)); 2129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqaij_C", NULL)); 2139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqbaij_C", NULL)); 2149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocation_C", NULL)); 2159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocationCSR_C", NULL)); 2166214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_elemental_C", NULL)); 2186214f412SHong Zhang #endif 219d24d4204SJose E. 
Roman #if defined(PETSC_HAVE_SCALAPACK) 2209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_scalapack_C", NULL)); 221d24d4204SJose E. Roman #endif 2222e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 2233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22449b5e25fSSatish Balay } 22549b5e25fSSatish Balay 226ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetOption_SeqSBAIJ(Mat A, MatOption op, PetscBool flg) 227d71ae5a4SJacob Faibussowitsch { 228045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 229eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 230eb1ec7c1SStefano Zampini PetscInt bs; 231eb1ec7c1SStefano Zampini #endif 23249b5e25fSSatish Balay 23349b5e25fSSatish Balay PetscFunctionBegin; 234eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 2359566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 236eb1ec7c1SStefano Zampini #endif 2374d9d31abSKris Buschelman switch (op) { 238d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 239d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 240d71ae5a4SJacob Faibussowitsch break; 241d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 242d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 243d71ae5a4SJacob Faibussowitsch break; 244d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 245d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 246d71ae5a4SJacob Faibussowitsch break; 247d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 248d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 249d71ae5a4SJacob Faibussowitsch break; 250d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 251d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 
-2 : 0); 252d71ae5a4SJacob Faibussowitsch break; 253d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 254d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 255d71ae5a4SJacob Faibussowitsch break; 2568c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 2574d9d31abSKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 2584d9d31abSKris Buschelman case MAT_USE_HASH_TABLE: 259d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 260d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 261d71ae5a4SJacob Faibussowitsch break; 2629a4540c5SBarry Smith case MAT_HERMITIAN: 263eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 264eb1ec7c1SStefano Zampini if (flg) { /* disable transpose ops */ 26508401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for Hermitian with block size greater than 1"); 266eb1ec7c1SStefano Zampini A->ops->multtranspose = NULL; 267eb1ec7c1SStefano Zampini A->ops->multtransposeadd = NULL; 268b94d7dedSBarry Smith A->symmetric = PETSC_BOOL3_FALSE; 269eb1ec7c1SStefano Zampini } 2700f2140c7SStefano Zampini #endif 271eeffb40dSHong Zhang break; 27277e54ba9SKris Buschelman case MAT_SYMMETRIC: 273eb1ec7c1SStefano Zampini case MAT_SPD: 274eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 275eb1ec7c1SStefano Zampini if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */ 276eb1ec7c1SStefano Zampini A->ops->multtranspose = A->ops->mult; 277eb1ec7c1SStefano Zampini A->ops->multtransposeadd = A->ops->multadd; 278eb1ec7c1SStefano Zampini } 279eb1ec7c1SStefano Zampini #endif 280eb1ec7c1SStefano Zampini break; 281eb1ec7c1SStefano Zampini /* These options are handled directly by MatSetOption() */ 28277e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 2839a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 284b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 285672ba085SHong Zhang case MAT_STRUCTURE_ONLY: 
286b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 2874dcd73b1SHong Zhang /* These options are handled directly by MatSetOption() */ 288290bbb0aSBarry Smith break; 289d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_LOWER_TRIANGULAR: 290d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 291d71ae5a4SJacob Faibussowitsch break; 292d71ae5a4SJacob Faibussowitsch case MAT_ERROR_LOWER_TRIANGULAR: 293d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 294d71ae5a4SJacob Faibussowitsch break; 295d71ae5a4SJacob Faibussowitsch case MAT_GETROW_UPPERTRIANGULAR: 296d71ae5a4SJacob Faibussowitsch a->getrow_utriangular = flg; 297d71ae5a4SJacob Faibussowitsch break; 298d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 299d71ae5a4SJacob Faibussowitsch break; 300d71ae5a4SJacob Faibussowitsch default: 301d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 30249b5e25fSSatish Balay } 3033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 30449b5e25fSSatish Balay } 30549b5e25fSSatish Balay 306d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 307d71ae5a4SJacob Faibussowitsch { 30849b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 30949b5e25fSSatish Balay 31049b5e25fSSatish Balay PetscFunctionBegin; 31108401ef6SPierre Jolivet PetscCheck(!A || a->getrow_utriangular, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatGetRow is not supported for SBAIJ matrix format. 
Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()"); 31252768537SHong Zhang 313f5edf698SHong Zhang /* Get the upper triangular part of the row */ 3149566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqBAIJ_private(A, row, nz, idx, v, a->i, a->j, a->a)); 3153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 31649b5e25fSSatish Balay } 31749b5e25fSSatish Balay 318d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 319d71ae5a4SJacob Faibussowitsch { 32049b5e25fSSatish Balay PetscFunctionBegin; 3219566063dSJacob Faibussowitsch if (idx) PetscCall(PetscFree(*idx)); 3229566063dSJacob Faibussowitsch if (v) PetscCall(PetscFree(*v)); 3233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 32449b5e25fSSatish Balay } 32549b5e25fSSatish Balay 326ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A) 327d71ae5a4SJacob Faibussowitsch { 328f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 329f5edf698SHong Zhang 330f5edf698SHong Zhang PetscFunctionBegin; 331f5edf698SHong Zhang a->getrow_utriangular = PETSC_TRUE; 3323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 333f5edf698SHong Zhang } 334a323099bSStefano Zampini 335ba38deedSJacob Faibussowitsch static PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A) 336d71ae5a4SJacob Faibussowitsch { 337f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 338f5edf698SHong Zhang 339f5edf698SHong Zhang PetscFunctionBegin; 340f5edf698SHong Zhang a->getrow_utriangular = PETSC_FALSE; 3413ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 342f5edf698SHong Zhang } 343f5edf698SHong Zhang 344ba38deedSJacob Faibussowitsch static PetscErrorCode MatTranspose_SeqSBAIJ(Mat A, MatReuse reuse, Mat *B) 345d71ae5a4SJacob 
Faibussowitsch { 34649b5e25fSSatish Balay PetscFunctionBegin; 3477fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 348cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 3499566063dSJacob Faibussowitsch PetscCall(MatDuplicate(A, MAT_COPY_VALUES, B)); 350cf37664fSBarry Smith } else if (reuse == MAT_REUSE_MATRIX) { 3519566063dSJacob Faibussowitsch PetscCall(MatCopy(A, *B, SAME_NONZERO_PATTERN)); 352fc4dec0aSBarry Smith } 3533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 35449b5e25fSSatish Balay } 35549b5e25fSSatish Balay 356ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A, PetscViewer viewer) 357d71ae5a4SJacob Faibussowitsch { 35849b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 359d0f46423SBarry Smith PetscInt i, j, bs = A->rmap->bs, k, l, bs2 = a->bs2; 360f3ef73ceSBarry Smith PetscViewerFormat format; 361121deb67SSatish Balay PetscInt *diag; 362b3a0534dSBarry Smith const char *matname; 36349b5e25fSSatish Balay 36449b5e25fSSatish Balay PetscFunctionBegin; 3659566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 366456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 3679566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " block size is %" PetscInt_FMT "\n", bs)); 368fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_MATLAB) { 369d2507d54SMatthew Knepley Mat aij; 370ade3a672SBarry Smith 371d5f3da31SBarry Smith if (A->factortype && bs > 1) { 3729566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "Warning: matrix is factored with bs>1. 
MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n")); 3733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 37470d5e725SHong Zhang } 3759566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &aij)); 37623a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 37723a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)aij, matname)); 37823a3927dSBarry Smith PetscCall(MatView_SeqAIJ(aij, viewer)); 3799566063dSJacob Faibussowitsch PetscCall(MatDestroy(&aij)); 380fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 381b3a0534dSBarry Smith Mat B; 382b3a0534dSBarry Smith 383b3a0534dSBarry Smith PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 384b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 385b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 386b3a0534dSBarry Smith PetscCall(MatView_SeqAIJ(B, viewer)); 387b3a0534dSBarry Smith PetscCall(MatDestroy(&B)); 388c1490034SHong Zhang } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) { 3893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 39049b5e25fSSatish Balay } else { 3919566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 3922c990fa1SHong Zhang if (A->factortype) { /* for factored matrix */ 39308401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "matrix is factored with bs>1. 
Not implemented yet"); 3942c990fa1SHong Zhang 395121deb67SSatish Balay diag = a->diag; 396121deb67SSatish Balay for (i = 0; i < a->mbs; i++) { /* for row block i */ 3979566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 3982c990fa1SHong Zhang /* diagonal entry */ 3992c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 4002c990fa1SHong Zhang if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) { 4019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), (double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 4022c990fa1SHong Zhang } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) { 4039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), -(double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 4042c990fa1SHong Zhang } else { 4059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]))); 4062c990fa1SHong Zhang } 4072c990fa1SHong Zhang #else 4089566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)(1.0 / a->a[diag[i]]))); 4092c990fa1SHong Zhang #endif 4102c990fa1SHong Zhang /* off-diagonal entries */ 4112c990fa1SHong Zhang for (k = a->i[i]; k < a->i[i + 1] - 1; k++) { 4122c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 413ca0704adSBarry Smith if (PetscImaginaryPart(a->a[k]) > 0.0) { 4149566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), (double)PetscImaginaryPart(a->a[k]))); 415ca0704adSBarry Smith } else if (PetscImaginaryPart(a->a[k]) < 0.0) { 4169566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) 
", bs * a->j[k], (double)PetscRealPart(a->a[k]), -(double)PetscImaginaryPart(a->a[k]))); 4172c990fa1SHong Zhang } else { 4189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k], (double)PetscRealPart(a->a[k]))); 4192c990fa1SHong Zhang } 4202c990fa1SHong Zhang #else 4219566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[k], (double)a->a[k])); 4222c990fa1SHong Zhang #endif 4232c990fa1SHong Zhang } 4249566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 4252c990fa1SHong Zhang } 4262c990fa1SHong Zhang 4272c990fa1SHong Zhang } else { /* for non-factored matrix */ 4280c74a584SJed Brown for (i = 0; i < a->mbs; i++) { /* for row block i */ 4290c74a584SJed Brown for (j = 0; j < bs; j++) { /* for row bs*i + j */ 4309566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i * bs + j)); 4310c74a584SJed Brown for (k = a->i[i]; k < a->i[i + 1]; k++) { /* for column block */ 4320c74a584SJed Brown for (l = 0; l < bs; l++) { /* for column */ 43349b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 43449b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) > 0.0) { 4359371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), (double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 43649b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) < 0.0) { 4379371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), -(double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 43849b5e25fSSatish Balay } else { 4399566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k 
+ l * bs + j]))); 44049b5e25fSSatish Balay } 44149b5e25fSSatish Balay #else 4429566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)a->a[bs2 * k + l * bs + j])); 44349b5e25fSSatish Balay #endif 44449b5e25fSSatish Balay } 44549b5e25fSSatish Balay } 4469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 44749b5e25fSSatish Balay } 44849b5e25fSSatish Balay } 4492c990fa1SHong Zhang } 4509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 45149b5e25fSSatish Balay } 4529566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 4533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45449b5e25fSSatish Balay } 45549b5e25fSSatish Balay 4569804daf3SBarry Smith #include <petscdraw.h> 457d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 458d71ae5a4SJacob Faibussowitsch { 45949b5e25fSSatish Balay Mat A = (Mat)Aa; 46049b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 461d0f46423SBarry Smith PetscInt row, i, j, k, l, mbs = a->mbs, color, bs = A->rmap->bs, bs2 = a->bs2; 46249b5e25fSSatish Balay PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 46349b5e25fSSatish Balay MatScalar *aa; 464b0a32e0cSBarry Smith PetscViewer viewer; 46549b5e25fSSatish Balay 46649b5e25fSSatish Balay PetscFunctionBegin; 4679566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 4689566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 46949b5e25fSSatish Balay 47049b5e25fSSatish Balay /* loop over matrix elements drawing boxes */ 471383922c3SLisandro Dalcin 472d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 4739566063dSJacob Faibussowitsch PetscCall(PetscDrawString(draw, .3 * (xl + xr), .3 * (yl + yr), PETSC_DRAW_BLACK, "symmetric")); 474383922c3SLisandro Dalcin /* Blue for negative, Cyan for 
zero and Red for positive */ 475b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 47649b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 47749b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4789371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4799371c9d4SSatish Balay y_r = y_l + 1.0; 4809371c9d4SSatish Balay x_l = a->j[j] * bs; 4819371c9d4SSatish Balay x_r = x_l + 1.0; 48249b5e25fSSatish Balay aa = a->a + j * bs2; 48349b5e25fSSatish Balay for (k = 0; k < bs; k++) { 48449b5e25fSSatish Balay for (l = 0; l < bs; l++) { 48549b5e25fSSatish Balay if (PetscRealPart(*aa++) >= 0.) continue; 4869566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 48749b5e25fSSatish Balay } 48849b5e25fSSatish Balay } 48949b5e25fSSatish Balay } 49049b5e25fSSatish Balay } 491b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 49249b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 49349b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4949371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4959371c9d4SSatish Balay y_r = y_l + 1.0; 4969371c9d4SSatish Balay x_l = a->j[j] * bs; 4979371c9d4SSatish Balay x_r = x_l + 1.0; 49849b5e25fSSatish Balay aa = a->a + j * bs2; 49949b5e25fSSatish Balay for (k = 0; k < bs; k++) { 50049b5e25fSSatish Balay for (l = 0; l < bs; l++) { 50149b5e25fSSatish Balay if (PetscRealPart(*aa++) != 0.) 
continue; 5029566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 50349b5e25fSSatish Balay } 50449b5e25fSSatish Balay } 50549b5e25fSSatish Balay } 50649b5e25fSSatish Balay } 507b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 50849b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 50949b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 5109371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 5119371c9d4SSatish Balay y_r = y_l + 1.0; 5129371c9d4SSatish Balay x_l = a->j[j] * bs; 5139371c9d4SSatish Balay x_r = x_l + 1.0; 51449b5e25fSSatish Balay aa = a->a + j * bs2; 51549b5e25fSSatish Balay for (k = 0; k < bs; k++) { 51649b5e25fSSatish Balay for (l = 0; l < bs; l++) { 51749b5e25fSSatish Balay if (PetscRealPart(*aa++) <= 0.) continue; 5189566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 51949b5e25fSSatish Balay } 52049b5e25fSSatish Balay } 52149b5e25fSSatish Balay } 52249b5e25fSSatish Balay } 523d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 5243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52549b5e25fSSatish Balay } 52649b5e25fSSatish Balay 527d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A, PetscViewer viewer) 528d71ae5a4SJacob Faibussowitsch { 52949b5e25fSSatish Balay PetscReal xl, yl, xr, yr, w, h; 530b0a32e0cSBarry Smith PetscDraw draw; 531ace3abfcSBarry Smith PetscBool isnull; 53249b5e25fSSatish Balay 53349b5e25fSSatish Balay PetscFunctionBegin; 5349566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 5359566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 5363ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 53749b5e25fSSatish Balay 5389371c9d4SSatish Balay xr = A->rmap->N; 5399371c9d4SSatish Balay yr = A->rmap->N; 5409371c9d4SSatish Balay h = yr / 10.0; 
5419371c9d4SSatish Balay w = xr / 10.0; 5429371c9d4SSatish Balay xr += w; 5439371c9d4SSatish Balay yr += h; 5449371c9d4SSatish Balay xl = -w; 5459371c9d4SSatish Balay yl = -h; 5469566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 5479566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 5489566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqSBAIJ_Draw_Zoom, A)); 5499566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 5509566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 5513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55249b5e25fSSatish Balay } 55349b5e25fSSatish Balay 554618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */ 555618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary 556618cc2edSLisandro Dalcin 557d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ(Mat A, PetscViewer viewer) 558d71ae5a4SJacob Faibussowitsch { 559618cc2edSLisandro Dalcin PetscBool iascii, isbinary, isdraw; 56049b5e25fSSatish Balay 56149b5e25fSSatish Balay PetscFunctionBegin; 5629566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 5639566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 5649566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 56532077d6dSBarry Smith if (iascii) { 5669566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_ASCII(A, viewer)); 567618cc2edSLisandro Dalcin } else if (isbinary) { 5689566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Binary(A, viewer)); 56949b5e25fSSatish Balay } else if (isdraw) { 5709566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Draw(A, viewer)); 57149b5e25fSSatish Balay } else { 572a5e6ed63SBarry Smith Mat 
B; 573ade3a672SBarry Smith const char *matname; 5749566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 57523a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 57623a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 5779566063dSJacob Faibussowitsch PetscCall(MatView(B, viewer)); 5789566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 57949b5e25fSSatish Balay } 5803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 58149b5e25fSSatish Balay } 58249b5e25fSSatish Balay 583d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 584d71ae5a4SJacob Faibussowitsch { 585045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 58613f74950SBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 58713f74950SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 588d0f46423SBarry Smith PetscInt brow, bcol, ridx, cidx, bs = A->rmap->bs, bs2 = a->bs2; 58997e567efSBarry Smith MatScalar *ap, *aa = a->a; 59049b5e25fSSatish Balay 59149b5e25fSSatish Balay PetscFunctionBegin; 59249b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over rows */ 5939371c9d4SSatish Balay row = im[k]; 5949371c9d4SSatish Balay brow = row / bs; 5959371c9d4SSatish Balay if (row < 0) { 5969371c9d4SSatish Balay v += n; 5979371c9d4SSatish Balay continue; 5989371c9d4SSatish Balay } /* negative row */ 59954c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 6009371c9d4SSatish Balay rp = aj + ai[brow]; 6019371c9d4SSatish Balay ap = aa + bs2 * ai[brow]; 60249b5e25fSSatish Balay nrow = ailen[brow]; 60349b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over columns */ 6049371c9d4SSatish Balay if (in[l] < 
0) { 6059371c9d4SSatish Balay v++; 6069371c9d4SSatish Balay continue; 6079371c9d4SSatish Balay } /* negative column */ 60854c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 60949b5e25fSSatish Balay col = in[l]; 61049b5e25fSSatish Balay bcol = col / bs; 61149b5e25fSSatish Balay cidx = col % bs; 61249b5e25fSSatish Balay ridx = row % bs; 61349b5e25fSSatish Balay high = nrow; 61449b5e25fSSatish Balay low = 0; /* assume unsorted */ 61549b5e25fSSatish Balay while (high - low > 5) { 61649b5e25fSSatish Balay t = (low + high) / 2; 61749b5e25fSSatish Balay if (rp[t] > bcol) high = t; 61849b5e25fSSatish Balay else low = t; 61949b5e25fSSatish Balay } 62049b5e25fSSatish Balay for (i = low; i < high; i++) { 62149b5e25fSSatish Balay if (rp[i] > bcol) break; 62249b5e25fSSatish Balay if (rp[i] == bcol) { 62349b5e25fSSatish Balay *v++ = ap[bs2 * i + bs * cidx + ridx]; 62449b5e25fSSatish Balay goto finished; 62549b5e25fSSatish Balay } 62649b5e25fSSatish Balay } 62797e567efSBarry Smith *v++ = 0.0; 62849b5e25fSSatish Balay finished:; 62949b5e25fSSatish Balay } 63049b5e25fSSatish Balay } 6313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 63249b5e25fSSatish Balay } 63349b5e25fSSatish Balay 634ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqSBAIJ(Mat A, IS rowp, IS colp, Mat *B) 635d71ae5a4SJacob Faibussowitsch { 636dc29a518SPierre Jolivet Mat C; 637dc29a518SPierre Jolivet 638dc29a518SPierre Jolivet PetscFunctionBegin; 6399566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQBAIJ, MAT_INITIAL_MATRIX, &C)); 6409566063dSJacob Faibussowitsch PetscCall(MatPermute(C, rowp, colp, B)); 6419566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 64248a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatConvert(*B, MATSEQSBAIJ, MAT_INPLACE_MATRIX, B)); 6433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 
644dc29a518SPierre Jolivet } 64549b5e25fSSatish Balay 646d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 647d71ae5a4SJacob Faibussowitsch { 6480880e062SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 649e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, jj, row, nrow, i, col, l, rmax, N, lastcol = -1; 65013f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 651d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs2 = a->bs2, bs = A->rmap->bs, stepval; 652ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 653dd6ea824SBarry Smith const PetscScalar *value = v; 654f15d580aSBarry Smith MatScalar *ap, *aa = a->a, *bap; 6550880e062SHong Zhang 65649b5e25fSSatish Balay PetscFunctionBegin; 65726fbe8dcSKarl Rupp if (roworiented) stepval = (n - 1) * bs; 65826fbe8dcSKarl Rupp else stepval = (m - 1) * bs; 65926fbe8dcSKarl Rupp 6600880e062SHong Zhang for (k = 0; k < m; k++) { /* loop over added rows */ 6610880e062SHong Zhang row = im[k]; 6620880e062SHong Zhang if (row < 0) continue; 6636bdcaf15SBarry Smith PetscCheck(row < a->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index row too large %" PetscInt_FMT " max %" PetscInt_FMT, row, a->mbs - 1); 6640880e062SHong Zhang rp = aj + ai[row]; 6650880e062SHong Zhang ap = aa + bs2 * ai[row]; 6660880e062SHong Zhang rmax = imax[row]; 6670880e062SHong Zhang nrow = ailen[row]; 6680880e062SHong Zhang low = 0; 669818f2c47SBarry Smith high = nrow; 6700880e062SHong Zhang for (l = 0; l < n; l++) { /* loop over added columns */ 6710880e062SHong Zhang if (in[l] < 0) continue; 6720880e062SHong Zhang col = in[l]; 6736bdcaf15SBarry Smith PetscCheck(col < a->nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index column too large %" PetscInt_FMT " max %" PetscInt_FMT, col, a->nbs - 1); 674b98bf0e1SJed Brown if (col < row) { 67526fbe8dcSKarl Rupp if 
(a->ignore_ltriangular) continue; /* ignore lower triangular block */ 67626fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 677b98bf0e1SJed Brown } 67826fbe8dcSKarl Rupp if (roworiented) value = v + k * (stepval + bs) * bs + l * bs; 67926fbe8dcSKarl Rupp else value = v + l * (stepval + bs) * bs + k * bs; 68026fbe8dcSKarl Rupp 68126fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 68226fbe8dcSKarl Rupp else high = nrow; 68326fbe8dcSKarl Rupp 684e2ee6c50SBarry Smith lastcol = col; 6850880e062SHong Zhang while (high - low > 7) { 6860880e062SHong Zhang t = (low + high) / 2; 6870880e062SHong Zhang if (rp[t] > col) high = t; 6880880e062SHong Zhang else low = t; 6890880e062SHong Zhang } 6900880e062SHong Zhang for (i = low; i < high; i++) { 6910880e062SHong Zhang if (rp[i] > col) break; 6920880e062SHong Zhang if (rp[i] == col) { 6930880e062SHong Zhang bap = ap + bs2 * i; 6940880e062SHong Zhang if (roworiented) { 6950880e062SHong Zhang if (is == ADD_VALUES) { 6960880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 697ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] += *value++; 6980880e062SHong Zhang } 6990880e062SHong Zhang } else { 7000880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 701ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7020880e062SHong Zhang } 7030880e062SHong Zhang } 7040880e062SHong Zhang } else { 7050880e062SHong Zhang if (is == ADD_VALUES) { 7060880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 707ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ += *value++; 7080880e062SHong Zhang } 7090880e062SHong Zhang } else { 7100880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 711ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 
7120880e062SHong Zhang } 7130880e062SHong Zhang } 7140880e062SHong Zhang } 7150880e062SHong Zhang goto noinsert2; 7160880e062SHong Zhang } 7170880e062SHong Zhang } 7180880e062SHong Zhang if (nonew == 1) goto noinsert2; 71908401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new block index nonzero block (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 720fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 7219371c9d4SSatish Balay N = nrow++ - 1; 7229371c9d4SSatish Balay high++; 7230880e062SHong Zhang /* shift up all the later entries in this row */ 7249566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 7259566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 7269566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 7270880e062SHong Zhang rp[i] = col; 7280880e062SHong Zhang bap = ap + bs2 * i; 7290880e062SHong Zhang if (roworiented) { 7300880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 731ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7320880e062SHong Zhang } 7330880e062SHong Zhang } else { 7340880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 735ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7360880e062SHong Zhang } 7370880e062SHong Zhang } 7380880e062SHong Zhang noinsert2:; 7390880e062SHong Zhang low = i; 7400880e062SHong Zhang } 7410880e062SHong Zhang ailen[row] = nrow; 7420880e062SHong Zhang } 7433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 74449b5e25fSSatish Balay } 74549b5e25fSSatish Balay 746ba38deedSJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A, MatAssemblyType mode) 747d71ae5a4SJacob Faibussowitsch { 74849b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 
7498f8f2f0dSBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 750d0f46423SBarry Smith PetscInt m = A->rmap->N, *ip, N, *ailen = a->ilen; 75113f74950SBarry Smith PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 75249b5e25fSSatish Balay MatScalar *aa = a->a, *ap; 75349b5e25fSSatish Balay 75449b5e25fSSatish Balay PetscFunctionBegin; 755d32568d8SPierre Jolivet if (mode == MAT_FLUSH_ASSEMBLY || (A->was_assembled && A->ass_nonzerostate == A->nonzerostate)) PetscFunctionReturn(PETSC_SUCCESS); 75649b5e25fSSatish Balay 75749b5e25fSSatish Balay if (m) rmax = ailen[0]; 75849b5e25fSSatish Balay for (i = 1; i < mbs; i++) { 75949b5e25fSSatish Balay /* move each row back by the amount of empty slots (fshift) before it*/ 76049b5e25fSSatish Balay fshift += imax[i - 1] - ailen[i - 1]; 76149b5e25fSSatish Balay rmax = PetscMax(rmax, ailen[i]); 76249b5e25fSSatish Balay if (fshift) { 763580bdb30SBarry Smith ip = aj + ai[i]; 764580bdb30SBarry Smith ap = aa + bs2 * ai[i]; 76549b5e25fSSatish Balay N = ailen[i]; 7669566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 7679566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2 * N)); 76849b5e25fSSatish Balay } 76949b5e25fSSatish Balay ai[i] = ai[i - 1] + ailen[i - 1]; 77049b5e25fSSatish Balay } 77149b5e25fSSatish Balay if (mbs) { 77249b5e25fSSatish Balay fshift += imax[mbs - 1] - ailen[mbs - 1]; 77349b5e25fSSatish Balay ai[mbs] = ai[mbs - 1] + ailen[mbs - 1]; 77449b5e25fSSatish Balay } 77549b5e25fSSatish Balay /* reset ilen and imax for each row */ 776ad540459SPierre Jolivet for (i = 0; i < mbs; i++) ailen[i] = imax[i] = ai[i + 1] - ai[i]; 7776c6c5352SBarry Smith a->nz = ai[mbs]; 77849b5e25fSSatish Balay 779b424e231SHong Zhang /* diagonals may have moved, reset it */ 7801baa6e33SBarry Smith if (a->diag) PetscCall(PetscArraycpy(a->diag, ai, mbs)); 781aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in 
matrix: %" PetscInt_FMT " X %" PetscInt_FMT " block size %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, A->rmap->bs, fshift * bs2); 78226fbe8dcSKarl Rupp 7839566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT ", block size %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->rmap->N, A->rmap->bs, fshift * bs2, a->nz * bs2)); 7849566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues is %" PetscInt_FMT "\n", a->reallocs)); 7859566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Most nonzeros blocks in any row is %" PetscInt_FMT "\n", rmax)); 78626fbe8dcSKarl Rupp 7878e58a170SBarry Smith A->info.mallocs += a->reallocs; 78849b5e25fSSatish Balay a->reallocs = 0; 78949b5e25fSSatish Balay A->info.nz_unneeded = (PetscReal)fshift * bs2; 790061b2667SBarry Smith a->idiagvalid = PETSC_FALSE; 7914dcd73b1SHong Zhang a->rmax = rmax; 79238702af4SBarry Smith 79338702af4SBarry Smith if (A->cmap->n < 65536 && A->cmap->bs == 1) { 79444e1c64aSLisandro Dalcin if (a->jshort && a->free_jshort) { 79517803ae8SHong Zhang /* when matrix data structure is changed, previous jshort must be replaced */ 7969566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jshort)); 79717803ae8SHong Zhang } 7989566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->i[A->rmap->n], &a->jshort)); 79938702af4SBarry Smith for (i = 0; i < a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i]; 80038702af4SBarry Smith A->ops->mult = MatMult_SeqSBAIJ_1_ushort; 80141f059aeSBarry Smith A->ops->sor = MatSOR_SeqSBAIJ_ushort; 8024da8f245SBarry Smith a->free_jshort = PETSC_TRUE; 80338702af4SBarry Smith } 8043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 80549b5e25fSSatish Balay } 80649b5e25fSSatish Balay 80749b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks). 808da81f932SPierre Jolivet Any a(i,j) with i>j input by user is ignored. 
80949b5e25fSSatish Balay */ 81049b5e25fSSatish Balay 811d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 812d71ae5a4SJacob Faibussowitsch { 81349b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 814e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N, lastcol = -1; 81513f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen, roworiented = a->roworiented; 816d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs = A->rmap->bs, brow, bcol; 81713f74950SBarry Smith PetscInt ridx, cidx, bs2 = a->bs2; 81849b5e25fSSatish Balay MatScalar *ap, value, *aa = a->a, *bap; 81949b5e25fSSatish Balay 82049b5e25fSSatish Balay PetscFunctionBegin; 82149b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over added rows */ 82249b5e25fSSatish Balay row = im[k]; /* row number */ 82349b5e25fSSatish Balay brow = row / bs; /* block row number */ 82449b5e25fSSatish Balay if (row < 0) continue; 8256bdcaf15SBarry Smith PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 82649b5e25fSSatish Balay rp = aj + ai[brow]; /*ptr to beginning of column value of the row block*/ 82749b5e25fSSatish Balay ap = aa + bs2 * ai[brow]; /*ptr to beginning of element value of the row block*/ 82849b5e25fSSatish Balay rmax = imax[brow]; /* maximum space allocated for this row */ 82949b5e25fSSatish Balay nrow = ailen[brow]; /* actual length of this row */ 83049b5e25fSSatish Balay low = 0; 8318509e838SStefano Zampini high = nrow; 83249b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over added columns */ 83349b5e25fSSatish Balay if (in[l] < 0) continue; 8346bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, 
in[l], A->cmap->N - 1); 83549b5e25fSSatish Balay col = in[l]; 83649b5e25fSSatish Balay bcol = col / bs; /* block col number */ 83749b5e25fSSatish Balay 838941593c8SHong Zhang if (brow > bcol) { 83926fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular values */ 84026fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 841941593c8SHong Zhang } 842f4989cb3SHong Zhang 8439371c9d4SSatish Balay ridx = row % bs; 8449371c9d4SSatish Balay cidx = col % bs; /*row and col index inside the block */ 8458549e402SHong Zhang if ((brow == bcol && ridx <= cidx) || (brow < bcol)) { 84649b5e25fSSatish Balay /* element value a(k,l) */ 84726fbe8dcSKarl Rupp if (roworiented) value = v[l + k * n]; 84826fbe8dcSKarl Rupp else value = v[k + l * m]; 84949b5e25fSSatish Balay 85049b5e25fSSatish Balay /* move pointer bap to a(k,l) quickly and add/insert value */ 85126fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 8528509e838SStefano Zampini else high = nrow; 8538509e838SStefano Zampini 854e2ee6c50SBarry Smith lastcol = col; 85549b5e25fSSatish Balay while (high - low > 7) { 85649b5e25fSSatish Balay t = (low + high) / 2; 85749b5e25fSSatish Balay if (rp[t] > bcol) high = t; 85849b5e25fSSatish Balay else low = t; 85949b5e25fSSatish Balay } 86049b5e25fSSatish Balay for (i = low; i < high; i++) { 86149b5e25fSSatish Balay if (rp[i] > bcol) break; 86249b5e25fSSatish Balay if (rp[i] == bcol) { 86349b5e25fSSatish Balay bap = ap + bs2 * i + bs * cidx + ridx; 86449b5e25fSSatish Balay if (is == ADD_VALUES) *bap += value; 86549b5e25fSSatish Balay else *bap = value; 8668549e402SHong Zhang /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 8678549e402SHong Zhang if (brow == bcol && ridx < cidx) { 8688549e402SHong Zhang bap = ap + bs2 * i + bs * ridx + cidx; 8698549e402SHong 
Zhang if (is == ADD_VALUES) *bap += value; 8708549e402SHong Zhang else *bap = value; 8718549e402SHong Zhang } 87249b5e25fSSatish Balay goto noinsert1; 87349b5e25fSSatish Balay } 87449b5e25fSSatish Balay } 87549b5e25fSSatish Balay 87649b5e25fSSatish Balay if (nonew == 1) goto noinsert1; 87708401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 878fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, brow, bcol, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 87949b5e25fSSatish Balay 8809371c9d4SSatish Balay N = nrow++ - 1; 8819371c9d4SSatish Balay high++; 88249b5e25fSSatish Balay /* shift up all the later entries in this row */ 8839566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 8849566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 8859566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 88649b5e25fSSatish Balay rp[i] = bcol; 88749b5e25fSSatish Balay ap[bs2 * i + bs * cidx + ridx] = value; 8888509e838SStefano Zampini /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 889ad540459SPierre Jolivet if (brow == bcol && ridx < cidx) ap[bs2 * i + bs * ridx + cidx] = value; 890e56f5c9eSBarry Smith A->nonzerostate++; 89149b5e25fSSatish Balay noinsert1:; 89249b5e25fSSatish Balay low = i; 8938549e402SHong Zhang } 89449b5e25fSSatish Balay } /* end of loop over added columns */ 89549b5e25fSSatish Balay ailen[brow] = nrow; 89649b5e25fSSatish Balay } /* end of loop over added rows */ 8973ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 89849b5e25fSSatish Balay } 89949b5e25fSSatish Balay 900ba38deedSJacob Faibussowitsch static PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA, IS row, const MatFactorInfo *info) 901d71ae5a4SJacob Faibussowitsch { 9024ccecd49SHong Zhang Mat_SeqSBAIJ *a = 
(Mat_SeqSBAIJ *)inA->data; 90349b5e25fSSatish Balay Mat outA; 904ace3abfcSBarry Smith PetscBool row_identity; 90549b5e25fSSatish Balay 90649b5e25fSSatish Balay PetscFunctionBegin; 90708401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 is supported for in-place icc"); 9089566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 90928b400f6SJacob Faibussowitsch PetscCheck(row_identity, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix reordering is not supported"); 91008401ef6SPierre Jolivet PetscCheck(inA->rmap->bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix block size %" PetscInt_FMT " is not supported", inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! */ 911c84f5b01SHong Zhang 91249b5e25fSSatish Balay outA = inA; 913d5f3da31SBarry Smith inA->factortype = MAT_FACTOR_ICC; 9149566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 9159566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 91649b5e25fSSatish Balay 9179566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(inA)); 9189566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetNumericFactorization_inplace(inA, row_identity)); 91949b5e25fSSatish Balay 9209566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 9219566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 922c84f5b01SHong Zhang a->row = row; 9239566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 9249566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 925c84f5b01SHong Zhang a->col = row; 926c84f5b01SHong Zhang 927c84f5b01SHong Zhang /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */ 9289566063dSJacob Faibussowitsch if (a->icol) PetscCall(ISInvertPermutation(row, PETSC_DECIDE, &a->icol)); 92949b5e25fSSatish Balay 930aa624791SPierre Jolivet if (!a->solve_work) PetscCall(PetscMalloc1(inA->rmap->N + 
inA->rmap->bs, &a->solve_work)); 93149b5e25fSSatish Balay 9329566063dSJacob Faibussowitsch PetscCall(MatCholeskyFactorNumeric(outA, inA, info)); 9333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 93449b5e25fSSatish Balay } 935950f1e5bSHong Zhang 936ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat, PetscInt *indices) 937d71ae5a4SJacob Faibussowitsch { 938045c9aa0SHong Zhang Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)mat->data; 93913f74950SBarry Smith PetscInt i, nz, n; 94049b5e25fSSatish Balay 94149b5e25fSSatish Balay PetscFunctionBegin; 9426c6c5352SBarry Smith nz = baij->maxnz; 943d0f46423SBarry Smith n = mat->cmap->n; 94426fbe8dcSKarl Rupp for (i = 0; i < nz; i++) baij->j[i] = indices[i]; 94526fbe8dcSKarl Rupp 9466c6c5352SBarry Smith baij->nz = nz; 94726fbe8dcSKarl Rupp for (i = 0; i < n; i++) baij->ilen[i] = baij->imax[i]; 94826fbe8dcSKarl Rupp 9499566063dSJacob Faibussowitsch PetscCall(MatSetOption(mat, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 9503ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 95149b5e25fSSatish Balay } 95249b5e25fSSatish Balay 95349b5e25fSSatish Balay /*@ 95419585528SSatish Balay MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows 95511a5261eSBarry Smith in a `MATSEQSBAIJ` matrix. 95649b5e25fSSatish Balay 95749b5e25fSSatish Balay Input Parameters: 95811a5261eSBarry Smith + mat - the `MATSEQSBAIJ` matrix 95949b5e25fSSatish Balay - indices - the column indices 96049b5e25fSSatish Balay 96149b5e25fSSatish Balay Level: advanced 96249b5e25fSSatish Balay 96349b5e25fSSatish Balay Notes: 96449b5e25fSSatish Balay This can be called if you have precomputed the nonzero structure of the 96549b5e25fSSatish Balay matrix and want to provide it to the matrix object to improve the performance 96611a5261eSBarry Smith of the `MatSetValues()` operation. 
96749b5e25fSSatish Balay 96849b5e25fSSatish Balay You MUST have set the correct numbers of nonzeros per row in the call to 96911a5261eSBarry Smith `MatCreateSeqSBAIJ()`, and the columns indices MUST be sorted. 97049b5e25fSSatish Balay 9712ef1f0ffSBarry Smith MUST be called before any calls to `MatSetValues()` 97249b5e25fSSatish Balay 9731cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ` 97449b5e25fSSatish Balay @*/ 975d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat, PetscInt *indices) 976d71ae5a4SJacob Faibussowitsch { 97749b5e25fSSatish Balay PetscFunctionBegin; 9780700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 9794f572ea9SToby Isaac PetscAssertPointer(indices, 2); 980cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqSBAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 9813ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 98249b5e25fSSatish Balay } 98349b5e25fSSatish Balay 984ba38deedSJacob Faibussowitsch static PetscErrorCode MatCopy_SeqSBAIJ(Mat A, Mat B, MatStructure str) 985d71ae5a4SJacob Faibussowitsch { 9864c7a3774SStefano Zampini PetscBool isbaij; 9873c896bc6SHong Zhang 9883c896bc6SHong Zhang PetscFunctionBegin; 9899566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &isbaij, MATSEQSBAIJ, MATMPISBAIJ, "")); 99028b400f6SJacob Faibussowitsch PetscCheck(isbaij, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Not for matrix type %s", ((PetscObject)B)->type_name); 9914c7a3774SStefano Zampini /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. 
*/ 9924c7a3774SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 9933c896bc6SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 9943c896bc6SHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 9953c896bc6SHong Zhang 99608401ef6SPierre Jolivet PetscCheck(a->i[a->mbs] == b->i[b->mbs], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different"); 99708401ef6SPierre Jolivet PetscCheck(a->mbs == b->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of rows in two matrices are different"); 99808401ef6SPierre Jolivet PetscCheck(a->bs2 == b->bs2, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different block size"); 9999566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, a->a, a->bs2 * a->i[a->mbs])); 10009566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 10013c896bc6SHong Zhang } else { 10029566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(A)); 10039566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 10049566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(A)); 10053c896bc6SHong Zhang } 10063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10073c896bc6SHong Zhang } 10083c896bc6SHong Zhang 1009d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1010d71ae5a4SJacob Faibussowitsch { 1011a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 10125fd66863SKarl Rupp 1013a6ece127SHong Zhang PetscFunctionBegin; 1014a6ece127SHong Zhang *array = a->a; 10153ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1016a6ece127SHong Zhang } 1017a6ece127SHong Zhang 1018d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1019d71ae5a4SJacob Faibussowitsch { 1020a6ece127SHong Zhang PetscFunctionBegin; 1021cda14afcSprj- *array = NULL; 10223ba16761SJacob Faibussowitsch 
PetscFunctionReturn(PETSC_SUCCESS); 1023a6ece127SHong Zhang } 1024a6ece127SHong Zhang 1025d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y, Mat X, PetscInt *nnz) 1026d71ae5a4SJacob Faibussowitsch { 1027b264fe52SHong Zhang PetscInt bs = Y->rmap->bs, mbs = Y->rmap->N / bs; 102852768537SHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data; 102952768537SHong Zhang Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ *)Y->data; 103052768537SHong Zhang 103152768537SHong Zhang PetscFunctionBegin; 103252768537SHong Zhang /* Set the number of nonzeros in the new matrix */ 10339566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(mbs, x->i, x->j, y->i, y->j, nnz)); 10343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 103552768537SHong Zhang } 103652768537SHong Zhang 1037ba38deedSJacob Faibussowitsch static PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 1038d71ae5a4SJacob Faibussowitsch { 103942ee4b1aSHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data, *y = (Mat_SeqSBAIJ *)Y->data; 104031ce2d13SHong Zhang PetscInt bs = Y->rmap->bs, bs2 = bs * bs; 1041e838b9e7SJed Brown PetscBLASInt one = 1; 104242ee4b1aSHong Zhang 104342ee4b1aSHong Zhang PetscFunctionBegin; 1044134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 1045134adf20SPierre Jolivet PetscBool e = x->nz == y->nz && x->mbs == y->mbs ? 
PETSC_TRUE : PETSC_FALSE; 1046134adf20SPierre Jolivet if (e) { 10479566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, x->mbs + 1, &e)); 1048134adf20SPierre Jolivet if (e) { 10499566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, x->i[x->mbs], &e)); 1050134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 1051134adf20SPierre Jolivet } 1052134adf20SPierre Jolivet } 105354c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 1054134adf20SPierre Jolivet } 105542ee4b1aSHong Zhang if (str == SAME_NONZERO_PATTERN) { 1056f4df32b1SMatthew Knepley PetscScalar alpha = a; 1057c5df96a5SBarry Smith PetscBLASInt bnz; 10589566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz * bs2, &bnz)); 1059792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, x->a, &one, y->a, &one)); 10609566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 1061ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 10629566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_TRUE)); 10639566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 10649566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_FALSE)); 106542ee4b1aSHong Zhang } else { 106652768537SHong Zhang Mat B; 106752768537SHong Zhang PetscInt *nnz; 106854c59aa7SJacob Faibussowitsch PetscCheck(bs == X->rmap->bs, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Matrices must have same block size"); 10699566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(X)); 10709566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(Y)); 10719566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 10729566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 10739566063dSJacob Faibussowitsch 
PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 10749566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, Y->rmap->n, Y->cmap->n, Y->rmap->N, Y->cmap->N)); 10759566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, Y, Y)); 10769566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 10779566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqSBAIJ(Y, X, nnz)); 10789566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 107952768537SHong Zhang 10809566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 108152768537SHong Zhang 10829566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 10839566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 10849566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(X)); 10859566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(Y)); 108642ee4b1aSHong Zhang } 10873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 108842ee4b1aSHong Zhang } 108942ee4b1aSHong Zhang 1090ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1091d71ae5a4SJacob Faibussowitsch { 1092efcf0fc3SBarry Smith PetscFunctionBegin; 1093efcf0fc3SBarry Smith *flg = PETSC_TRUE; 10943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1095efcf0fc3SBarry Smith } 1096efcf0fc3SBarry Smith 1097ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A, PetscBool *flg) 1098d71ae5a4SJacob Faibussowitsch { 1099efcf0fc3SBarry Smith PetscFunctionBegin; 1100efcf0fc3SBarry Smith *flg = PETSC_TRUE; 11013ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1102efcf0fc3SBarry Smith } 1103efcf0fc3SBarry Smith 1104ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1105d71ae5a4SJacob Faibussowitsch { 
1106efcf0fc3SBarry Smith PetscFunctionBegin; 1107efcf0fc3SBarry Smith *flg = PETSC_FALSE; 11083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1109efcf0fc3SBarry Smith } 1110efcf0fc3SBarry Smith 1111ba38deedSJacob Faibussowitsch static PetscErrorCode MatConjugate_SeqSBAIJ(Mat A) 1112d71ae5a4SJacob Faibussowitsch { 11132726fb6dSPierre Jolivet #if defined(PETSC_USE_COMPLEX) 11142726fb6dSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11152726fb6dSPierre Jolivet PetscInt i, nz = a->bs2 * a->i[a->mbs]; 11162726fb6dSPierre Jolivet MatScalar *aa = a->a; 11172726fb6dSPierre Jolivet 11182726fb6dSPierre Jolivet PetscFunctionBegin; 11192726fb6dSPierre Jolivet for (i = 0; i < nz; i++) aa[i] = PetscConj(aa[i]); 11202726fb6dSPierre Jolivet #else 11212726fb6dSPierre Jolivet PetscFunctionBegin; 11222726fb6dSPierre Jolivet #endif 11233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11242726fb6dSPierre Jolivet } 11252726fb6dSPierre Jolivet 1126ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqSBAIJ(Mat A) 1127d71ae5a4SJacob Faibussowitsch { 112899cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 112999cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1130dd6ea824SBarry Smith MatScalar *aa = a->a; 113199cafbc1SBarry Smith 113299cafbc1SBarry Smith PetscFunctionBegin; 113399cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 113599cafbc1SBarry Smith } 113699cafbc1SBarry Smith 1137ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A) 1138d71ae5a4SJacob Faibussowitsch { 113999cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 114099cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1141dd6ea824SBarry Smith MatScalar *aa = a->a; 114299cafbc1SBarry Smith 114399cafbc1SBarry Smith PetscFunctionBegin; 114499cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = 
PetscImaginaryPart(aa[i]); 11453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 114699cafbc1SBarry Smith } 114799cafbc1SBarry Smith 1148ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A, PetscInt is_n, const PetscInt is_idx[], PetscScalar diag, Vec x, Vec b) 1149d71ae5a4SJacob Faibussowitsch { 11503bededecSBarry Smith Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)A->data; 11513bededecSBarry Smith PetscInt i, j, k, count; 11523bededecSBarry Smith PetscInt bs = A->rmap->bs, bs2 = baij->bs2, row, col; 11533bededecSBarry Smith PetscScalar zero = 0.0; 11543bededecSBarry Smith MatScalar *aa; 11553bededecSBarry Smith const PetscScalar *xx; 11563bededecSBarry Smith PetscScalar *bb; 115756777dd2SBarry Smith PetscBool *zeroed, vecs = PETSC_FALSE; 11583bededecSBarry Smith 11593bededecSBarry Smith PetscFunctionBegin; 11603bededecSBarry Smith /* fix right hand side if needed */ 11613bededecSBarry Smith if (x && b) { 11629566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 11639566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 116456777dd2SBarry Smith vecs = PETSC_TRUE; 11653bededecSBarry Smith } 11663bededecSBarry Smith 11673bededecSBarry Smith /* zero the columns */ 11689566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 11693bededecSBarry Smith for (i = 0; i < is_n; i++) { 1170aed4548fSBarry Smith PetscCheck(is_idx[i] >= 0 && is_idx[i] < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", is_idx[i]); 11713bededecSBarry Smith zeroed[is_idx[i]] = PETSC_TRUE; 11723bededecSBarry Smith } 117356777dd2SBarry Smith if (vecs) { 117456777dd2SBarry Smith for (i = 0; i < A->rmap->N; i++) { 117556777dd2SBarry Smith row = i / bs; 117656777dd2SBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 117756777dd2SBarry Smith for (k = 0; k < bs; k++) { 117856777dd2SBarry Smith col = bs * baij->j[j] + k; 117956777dd2SBarry Smith if (col <= i) continue; 
118056777dd2SBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 118126fbe8dcSKarl Rupp if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0] * xx[col]; 118226fbe8dcSKarl Rupp if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0] * xx[i]; 118356777dd2SBarry Smith } 118456777dd2SBarry Smith } 118556777dd2SBarry Smith } 118626fbe8dcSKarl Rupp for (i = 0; i < is_n; i++) bb[is_idx[i]] = diag * xx[is_idx[i]]; 118756777dd2SBarry Smith } 118856777dd2SBarry Smith 11893bededecSBarry Smith for (i = 0; i < A->rmap->N; i++) { 11903bededecSBarry Smith if (!zeroed[i]) { 11913bededecSBarry Smith row = i / bs; 11923bededecSBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 11933bededecSBarry Smith for (k = 0; k < bs; k++) { 11943bededecSBarry Smith col = bs * baij->j[j] + k; 11953bededecSBarry Smith if (zeroed[col]) { 11963bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 11973bededecSBarry Smith aa[0] = 0.0; 11983bededecSBarry Smith } 11993bededecSBarry Smith } 12003bededecSBarry Smith } 12013bededecSBarry Smith } 12023bededecSBarry Smith } 12039566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 120456777dd2SBarry Smith if (vecs) { 12059566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 12069566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 120756777dd2SBarry Smith } 12083bededecSBarry Smith 12093bededecSBarry Smith /* zero the rows */ 12103bededecSBarry Smith for (i = 0; i < is_n; i++) { 12113bededecSBarry Smith row = is_idx[i]; 12123bededecSBarry Smith count = (baij->i[row / bs + 1] - baij->i[row / bs]) * bs; 12133bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + baij->i[row / bs] * bs2 + (row % bs); 12143bededecSBarry Smith for (k = 0; k < count; k++) { 12153bededecSBarry Smith aa[0] = zero; 12163bededecSBarry Smith aa += bs; 12173bededecSBarry Smith } 1218dbbe0bcdSBarry Smith if (diag != 0.0) PetscUseTypeMethod(A, setvalues, 1, &row, 1, &row, &diag, INSERT_VALUES); 12193bededecSBarry 
Smith } 12209566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqSBAIJ(A, MAT_FINAL_ASSEMBLY)); 12213ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12223bededecSBarry Smith } 12233bededecSBarry Smith 1224ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqSBAIJ(Mat Y, PetscScalar a) 1225d71ae5a4SJacob Faibussowitsch { 12267d68702bSBarry Smith Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)Y->data; 12277d68702bSBarry Smith 12287d68702bSBarry Smith PetscFunctionBegin; 122948a46eb9SPierre Jolivet if (!Y->preallocated || !aij->nz) PetscCall(MatSeqSBAIJSetPreallocation(Y, Y->rmap->bs, 1, NULL)); 12309566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(Y, a)); 12313ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12327d68702bSBarry Smith } 12337d68702bSBarry Smith 123417ea310bSPierre Jolivet PetscErrorCode MatEliminateZeros_SeqSBAIJ(Mat A, PetscBool keep) 123517ea310bSPierre Jolivet { 123617ea310bSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 123717ea310bSPierre Jolivet PetscInt fshift = 0, fshift_prev = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax, j, k; 123817ea310bSPierre Jolivet PetscInt m = A->rmap->N, *ailen = a->ilen; 123917ea310bSPierre Jolivet PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 124017ea310bSPierre Jolivet MatScalar *aa = a->a, *ap; 124117ea310bSPierre Jolivet PetscBool zero; 124217ea310bSPierre Jolivet 124317ea310bSPierre Jolivet PetscFunctionBegin; 124417ea310bSPierre Jolivet PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 124517ea310bSPierre Jolivet if (m) rmax = ailen[0]; 124617ea310bSPierre Jolivet for (i = 1; i <= mbs; i++) { 124717ea310bSPierre Jolivet for (k = ai[i - 1]; k < ai[i]; k++) { 124817ea310bSPierre Jolivet zero = PETSC_TRUE; 124917ea310bSPierre Jolivet ap = aa + bs2 * k; 125017ea310bSPierre Jolivet for (j = 0; j < bs2 && zero; j++) { 125117ea310bSPierre Jolivet if (ap[j] != 0.0) zero = PETSC_FALSE; 
125217ea310bSPierre Jolivet } 125317ea310bSPierre Jolivet if (zero && (aj[k] != i - 1 || !keep)) fshift++; 125417ea310bSPierre Jolivet else { 125517ea310bSPierre Jolivet if (zero && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal block at row %" PetscInt_FMT "\n", i - 1)); 125617ea310bSPierre Jolivet aj[k - fshift] = aj[k]; 125717ea310bSPierre Jolivet PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2)); 125817ea310bSPierre Jolivet } 125917ea310bSPierre Jolivet } 126017ea310bSPierre Jolivet ai[i - 1] -= fshift_prev; 126117ea310bSPierre Jolivet fshift_prev = fshift; 126217ea310bSPierre Jolivet ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 126317ea310bSPierre Jolivet a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0); 126417ea310bSPierre Jolivet rmax = PetscMax(rmax, ailen[i - 1]); 126517ea310bSPierre Jolivet } 126617ea310bSPierre Jolivet if (fshift) { 126717ea310bSPierre Jolivet if (mbs) { 126817ea310bSPierre Jolivet ai[mbs] -= fshift; 126917ea310bSPierre Jolivet a->nz = ai[mbs]; 127017ea310bSPierre Jolivet } 127117ea310bSPierre Jolivet PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 127217ea310bSPierre Jolivet A->nonzerostate++; 127317ea310bSPierre Jolivet A->info.nz_unneeded += (PetscReal)fshift; 127417ea310bSPierre Jolivet a->rmax = rmax; 127517ea310bSPierre Jolivet PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 127617ea310bSPierre Jolivet PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 127717ea310bSPierre Jolivet } 127817ea310bSPierre Jolivet PetscFunctionReturn(PETSC_SUCCESS); 127917ea310bSPierre Jolivet } 128017ea310bSPierre Jolivet 12813964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ, 128249b5e25fSSatish Balay MatGetRow_SeqSBAIJ, 128349b5e25fSSatish Balay MatRestoreRow_SeqSBAIJ, 128449b5e25fSSatish Balay MatMult_SeqSBAIJ_N, 128597304618SKris Buschelman /* 4*/ 
MatMultAdd_SeqSBAIJ_N, 1286431c96f7SBarry Smith MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */ 1287e005ede5SBarry Smith MatMultAdd_SeqSBAIJ_N, 1288f4259b30SLisandro Dalcin NULL, 1289f4259b30SLisandro Dalcin NULL, 1290f4259b30SLisandro Dalcin NULL, 1291f4259b30SLisandro Dalcin /* 10*/ NULL, 1292f4259b30SLisandro Dalcin NULL, 1293c078aec8SLisandro Dalcin MatCholeskyFactor_SeqSBAIJ, 129441f059aeSBarry Smith MatSOR_SeqSBAIJ, 129549b5e25fSSatish Balay MatTranspose_SeqSBAIJ, 129697304618SKris Buschelman /* 15*/ MatGetInfo_SeqSBAIJ, 129749b5e25fSSatish Balay MatEqual_SeqSBAIJ, 129849b5e25fSSatish Balay MatGetDiagonal_SeqSBAIJ, 129949b5e25fSSatish Balay MatDiagonalScale_SeqSBAIJ, 130049b5e25fSSatish Balay MatNorm_SeqSBAIJ, 1301f4259b30SLisandro Dalcin /* 20*/ NULL, 130249b5e25fSSatish Balay MatAssemblyEnd_SeqSBAIJ, 130349b5e25fSSatish Balay MatSetOption_SeqSBAIJ, 130449b5e25fSSatish Balay MatZeroEntries_SeqSBAIJ, 1305f4259b30SLisandro Dalcin /* 24*/ NULL, 1306f4259b30SLisandro Dalcin NULL, 1307f4259b30SLisandro Dalcin NULL, 1308f4259b30SLisandro Dalcin NULL, 1309f4259b30SLisandro Dalcin NULL, 131026cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 1311f4259b30SLisandro Dalcin NULL, 1312f4259b30SLisandro Dalcin NULL, 1313f4259b30SLisandro Dalcin NULL, 1314f4259b30SLisandro Dalcin NULL, 1315d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqSBAIJ, 1316f4259b30SLisandro Dalcin NULL, 1317f4259b30SLisandro Dalcin NULL, 1318f4259b30SLisandro Dalcin NULL, 1319c84f5b01SHong Zhang MatICCFactor_SeqSBAIJ, 1320d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqSBAIJ, 13217dae84e0SHong Zhang MatCreateSubMatrices_SeqSBAIJ, 132249b5e25fSSatish Balay MatIncreaseOverlap_SeqSBAIJ, 132349b5e25fSSatish Balay MatGetValues_SeqSBAIJ, 13243c896bc6SHong Zhang MatCopy_SeqSBAIJ, 1325f4259b30SLisandro Dalcin /* 44*/ NULL, 132649b5e25fSSatish Balay MatScale_SeqSBAIJ, 13277d68702bSBarry Smith MatShift_SeqSBAIJ, 1328f4259b30SLisandro Dalcin NULL, 13293bededecSBarry Smith 
MatZeroRowsColumns_SeqSBAIJ, 1330f4259b30SLisandro Dalcin /* 49*/ NULL, 133149b5e25fSSatish Balay MatGetRowIJ_SeqSBAIJ, 133249b5e25fSSatish Balay MatRestoreRowIJ_SeqSBAIJ, 1333f4259b30SLisandro Dalcin NULL, 1334f4259b30SLisandro Dalcin NULL, 1335f4259b30SLisandro Dalcin /* 54*/ NULL, 1336f4259b30SLisandro Dalcin NULL, 1337f4259b30SLisandro Dalcin NULL, 1338dc29a518SPierre Jolivet MatPermute_SeqSBAIJ, 133949b5e25fSSatish Balay MatSetValuesBlocked_SeqSBAIJ, 13407dae84e0SHong Zhang /* 59*/ MatCreateSubMatrix_SeqSBAIJ, 1341f4259b30SLisandro Dalcin NULL, 1342f4259b30SLisandro Dalcin NULL, 1343f4259b30SLisandro Dalcin NULL, 1344f4259b30SLisandro Dalcin NULL, 1345f4259b30SLisandro Dalcin /* 64*/ NULL, 1346f4259b30SLisandro Dalcin NULL, 1347f4259b30SLisandro Dalcin NULL, 1348f4259b30SLisandro Dalcin NULL, 1349f4259b30SLisandro Dalcin NULL, 1350d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqSBAIJ, 1351f4259b30SLisandro Dalcin NULL, 135228d58a37SPierre Jolivet MatConvert_MPISBAIJ_Basic, 1353f4259b30SLisandro Dalcin NULL, 1354f4259b30SLisandro Dalcin NULL, 1355f4259b30SLisandro Dalcin /* 74*/ NULL, 1356f4259b30SLisandro Dalcin NULL, 1357f4259b30SLisandro Dalcin NULL, 1358f4259b30SLisandro Dalcin NULL, 1359f4259b30SLisandro Dalcin NULL, 1360f4259b30SLisandro Dalcin /* 79*/ NULL, 1361f4259b30SLisandro Dalcin NULL, 1362f4259b30SLisandro Dalcin NULL, 136397304618SKris Buschelman MatGetInertia_SeqSBAIJ, 13645bba2384SShri Abhyankar MatLoad_SeqSBAIJ, 1365d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqSBAIJ, 1366865e5f61SKris Buschelman MatIsHermitian_SeqSBAIJ, 1367efcf0fc3SBarry Smith MatIsStructurallySymmetric_SeqSBAIJ, 1368f4259b30SLisandro Dalcin NULL, 1369f4259b30SLisandro Dalcin NULL, 1370f4259b30SLisandro Dalcin /* 89*/ NULL, 1371f4259b30SLisandro Dalcin NULL, 1372f4259b30SLisandro Dalcin NULL, 1373f4259b30SLisandro Dalcin NULL, 1374f4259b30SLisandro Dalcin NULL, 1375f4259b30SLisandro Dalcin /* 94*/ NULL, 1376f4259b30SLisandro Dalcin NULL, 1377f4259b30SLisandro Dalcin 
NULL, 1378f4259b30SLisandro Dalcin NULL, 1379f4259b30SLisandro Dalcin NULL, 1380f4259b30SLisandro Dalcin /* 99*/ NULL, 1381f4259b30SLisandro Dalcin NULL, 1382f4259b30SLisandro Dalcin NULL, 13832726fb6dSPierre Jolivet MatConjugate_SeqSBAIJ, 1384f4259b30SLisandro Dalcin NULL, 1385f4259b30SLisandro Dalcin /*104*/ NULL, 138699cafbc1SBarry Smith MatRealPart_SeqSBAIJ, 1387f5edf698SHong Zhang MatImaginaryPart_SeqSBAIJ, 1388f5edf698SHong Zhang MatGetRowUpperTriangular_SeqSBAIJ, 13892af78befSBarry Smith MatRestoreRowUpperTriangular_SeqSBAIJ, 1390f4259b30SLisandro Dalcin /*109*/ NULL, 1391f4259b30SLisandro Dalcin NULL, 1392f4259b30SLisandro Dalcin NULL, 1393f4259b30SLisandro Dalcin NULL, 1394547795f9SHong Zhang MatMissingDiagonal_SeqSBAIJ, 1395f4259b30SLisandro Dalcin /*114*/ NULL, 1396f4259b30SLisandro Dalcin NULL, 1397f4259b30SLisandro Dalcin NULL, 1398f4259b30SLisandro Dalcin NULL, 1399f4259b30SLisandro Dalcin NULL, 1400f4259b30SLisandro Dalcin /*119*/ NULL, 1401f4259b30SLisandro Dalcin NULL, 1402f4259b30SLisandro Dalcin NULL, 1403f4259b30SLisandro Dalcin NULL, 1404f4259b30SLisandro Dalcin NULL, 1405f4259b30SLisandro Dalcin /*124*/ NULL, 1406f4259b30SLisandro Dalcin NULL, 1407f4259b30SLisandro Dalcin NULL, 1408f4259b30SLisandro Dalcin NULL, 1409f4259b30SLisandro Dalcin NULL, 1410f4259b30SLisandro Dalcin /*129*/ NULL, 1411f4259b30SLisandro Dalcin NULL, 1412f4259b30SLisandro Dalcin NULL, 1413f4259b30SLisandro Dalcin NULL, 1414f4259b30SLisandro Dalcin NULL, 1415f4259b30SLisandro Dalcin /*134*/ NULL, 1416f4259b30SLisandro Dalcin NULL, 1417f4259b30SLisandro Dalcin NULL, 1418f4259b30SLisandro Dalcin NULL, 1419f4259b30SLisandro Dalcin NULL, 142046533700Sstefano_zampini /*139*/ MatSetBlockSizes_Default, 1421f4259b30SLisandro Dalcin NULL, 1422f4259b30SLisandro Dalcin NULL, 1423f4259b30SLisandro Dalcin NULL, 1424f4259b30SLisandro Dalcin NULL, 1425d70f29a3SPierre Jolivet /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ, 1426d70f29a3SPierre Jolivet NULL, 1427d70f29a3SPierre Jolivet 
NULL, 142899a7f59eSMark Adams NULL, 142999a7f59eSMark Adams NULL, 14307fb60732SBarry Smith NULL, 1431dec0b466SHong Zhang /*150*/ NULL, 1432*eede4a3fSMark Adams MatEliminateZeros_SeqSBAIJ, 1433*eede4a3fSMark Adams NULL}; 1434be1d678aSKris Buschelman 1435ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat) 1436d71ae5a4SJacob Faibussowitsch { 14374afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1438d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 143949b5e25fSSatish Balay 144049b5e25fSSatish Balay PetscFunctionBegin; 144108401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 144249b5e25fSSatish Balay 144349b5e25fSSatish Balay /* allocate space for values if not already there */ 144448a46eb9SPierre Jolivet if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); 144549b5e25fSSatish Balay 144649b5e25fSSatish Balay /* copy values over */ 14479566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 14483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 144949b5e25fSSatish Balay } 145049b5e25fSSatish Balay 1451ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat) 1452d71ae5a4SJacob Faibussowitsch { 14534afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1454d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 145549b5e25fSSatish Balay 145649b5e25fSSatish Balay PetscFunctionBegin; 145708401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 145828b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 145949b5e25fSSatish Balay 146049b5e25fSSatish Balay /* copy values over 
*/ 14619566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 14623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 146349b5e25fSSatish Balay } 146449b5e25fSSatish Balay 1465f9663b93SPierre Jolivet static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 1466d71ae5a4SJacob Faibussowitsch { 1467c464158bSHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 14684dcd73b1SHong Zhang PetscInt i, mbs, nbs, bs2; 14692576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, flg = PETSC_FALSE, realalloc = PETSC_FALSE; 147049b5e25fSSatish Balay 1471b4e2f619SBarry Smith PetscFunctionBegin; 1472ad79cf63SBarry Smith if (B->hash_active) { 1473ad79cf63SBarry Smith PetscInt bs; 1474aea10558SJacob Faibussowitsch B->ops[0] = b->cops; 1475ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 1476ad79cf63SBarry Smith PetscCall(MatGetBlockSize(B, &bs)); 1477ad79cf63SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&b->bht)); 1478ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 1479ad79cf63SBarry Smith PetscCall(PetscFree(b->bdnz)); 1480ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 1481ad79cf63SBarry Smith } 14822576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 1483db4efbfdSBarry Smith 14849566063dSJacob Faibussowitsch PetscCall(MatSetBlockSize(B, PetscAbs(bs))); 14859566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 14869566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 148708401ef6SPierre Jolivet PetscCheck(B->rmap->N <= B->cmap->N, PETSC_COMM_SELF, PETSC_ERR_SUP, "SEQSBAIJ matrix cannot have more rows %" PetscInt_FMT " than columns %" PetscInt_FMT, B->rmap->N, B->cmap->N); 14889566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 1489899cda47SBarry Smith 149021940c7eSstefano_zampini B->preallocated = PETSC_TRUE; 149121940c7eSstefano_zampini 1492d0f46423SBarry Smith mbs = B->rmap->N / bs; 
14934dcd73b1SHong Zhang nbs = B->cmap->n / bs; 149449b5e25fSSatish Balay bs2 = bs * bs; 149549b5e25fSSatish Balay 1496aed4548fSBarry Smith PetscCheck(mbs * bs == B->rmap->N && nbs * bs == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Number rows, cols must be divisible by blocksize"); 149749b5e25fSSatish Balay 1498ab93d7beSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 1499ab93d7beSBarry Smith skipallocation = PETSC_TRUE; 1500ab93d7beSBarry Smith nz = 0; 1501ab93d7beSBarry Smith } 1502ab93d7beSBarry Smith 1503435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3; 150408401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 150549b5e25fSSatish Balay if (nnz) { 150649b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 150708401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 150808401ef6SPierre Jolivet PetscCheck(nnz[i] <= nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than block row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " block rowlength %" PetscInt_FMT, i, nnz[i], nbs); 150949b5e25fSSatish Balay } 151049b5e25fSSatish Balay } 151149b5e25fSSatish Balay 1512db4efbfdSBarry Smith B->ops->mult = MatMult_SeqSBAIJ_N; 1513db4efbfdSBarry Smith B->ops->multadd = MatMultAdd_SeqSBAIJ_N; 1514db4efbfdSBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_N; 1515db4efbfdSBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N; 151626fbe8dcSKarl Rupp 15179566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 151849b5e25fSSatish Balay if (!flg) { 151949b5e25fSSatish Balay switch (bs) { 152049b5e25fSSatish Balay case 1: 152149b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_1; 152249b5e25fSSatish Balay B->ops->multadd 
= MatMultAdd_SeqSBAIJ_1; 1523431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_1; 1524431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1; 152549b5e25fSSatish Balay break; 152649b5e25fSSatish Balay case 2: 152749b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_2; 152849b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_2; 1529431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_2; 1530431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2; 153149b5e25fSSatish Balay break; 153249b5e25fSSatish Balay case 3: 153349b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_3; 153449b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_3; 1535431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_3; 1536431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3; 153749b5e25fSSatish Balay break; 153849b5e25fSSatish Balay case 4: 153949b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_4; 154049b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_4; 1541431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_4; 1542431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4; 154349b5e25fSSatish Balay break; 154449b5e25fSSatish Balay case 5: 154549b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_5; 154649b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_5; 1547431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_5; 1548431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5; 154949b5e25fSSatish Balay break; 155049b5e25fSSatish Balay case 6: 155149b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_6; 155249b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_6; 1553431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_6; 1554431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6; 155549b5e25fSSatish Balay break; 155649b5e25fSSatish Balay case 7: 1557de53e5efSHong Zhang B->ops->mult = MatMult_SeqSBAIJ_7; 
155849b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_7; 1559431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_7; 1560431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7; 156149b5e25fSSatish Balay break; 156249b5e25fSSatish Balay } 156349b5e25fSSatish Balay } 156449b5e25fSSatish Balay 156549b5e25fSSatish Balay b->mbs = mbs; 15664dcd73b1SHong Zhang b->nbs = nbs; 1567ab93d7beSBarry Smith if (!skipallocation) { 15682ee49352SLisandro Dalcin if (!b->imax) { 15699566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mbs, &b->imax, mbs, &b->ilen)); 157026fbe8dcSKarl Rupp 1571c760cd28SBarry Smith b->free_imax_ilen = PETSC_TRUE; 15722ee49352SLisandro Dalcin } 157349b5e25fSSatish Balay if (!nnz) { 1574435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 157549b5e25fSSatish Balay else if (nz <= 0) nz = 1; 15765d2a9ed1SStefano Zampini nz = PetscMin(nbs, nz); 157726fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->imax[i] = nz; 15789566063dSJacob Faibussowitsch PetscCall(PetscIntMultError(nz, mbs, &nz)); 157949b5e25fSSatish Balay } else { 1580c73702f5SBarry Smith PetscInt64 nz64 = 0; 15819371c9d4SSatish Balay for (i = 0; i < mbs; i++) { 15829371c9d4SSatish Balay b->imax[i] = nnz[i]; 15839371c9d4SSatish Balay nz64 += nnz[i]; 15849371c9d4SSatish Balay } 15859566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 158649b5e25fSSatish Balay } 15872ee49352SLisandro Dalcin /* b->ilen will count nonzeros in each block row so far. 
*/ 158826fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->ilen[i] = 0; 15896c6c5352SBarry Smith /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */ 159049b5e25fSSatish Balay 159149b5e25fSSatish Balay /* allocate the matrix space */ 15929566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 15939566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &b->a, nz, &b->j, B->rmap->N + 1, &b->i)); 15949566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->a, nz * bs2)); 15959566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->j, nz)); 159626fbe8dcSKarl Rupp 159749b5e25fSSatish Balay b->singlemalloc = PETSC_TRUE; 159849b5e25fSSatish Balay 159949b5e25fSSatish Balay /* pointer to beginning of each row */ 1600e60cf9a0SBarry Smith b->i[0] = 0; 160126fbe8dcSKarl Rupp for (i = 1; i < mbs + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 160226fbe8dcSKarl Rupp 1603e6b907acSBarry Smith b->free_a = PETSC_TRUE; 1604e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 1605e811da20SHong Zhang } else { 1606e6b907acSBarry Smith b->free_a = PETSC_FALSE; 1607e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 1608ab93d7beSBarry Smith } 160949b5e25fSSatish Balay 161049b5e25fSSatish Balay b->bs2 = bs2; 16116c6c5352SBarry Smith b->nz = 0; 1612b32cb4a7SJed Brown b->maxnz = nz; 1613f4259b30SLisandro Dalcin b->inew = NULL; 1614f4259b30SLisandro Dalcin b->jnew = NULL; 1615f4259b30SLisandro Dalcin b->anew = NULL; 1616f4259b30SLisandro Dalcin b->a2anew = NULL; 16171a3463dfSHong Zhang b->permute = PETSC_FALSE; 1618cb7b82ddSBarry Smith 1619cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 1620cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 16219566063dSJacob Faibussowitsch if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 16223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1623c464158bSHong Zhang } 1624153ea458SHong Zhang 1625ba38deedSJacob Faibussowitsch static PetscErrorCode 
MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B, PetscInt bs, const PetscInt ii[], const PetscInt jj[], const PetscScalar V[]) 1626d71ae5a4SJacob Faibussowitsch { 16270cd7f59aSBarry Smith PetscInt i, j, m, nz, anz, nz_max = 0, *nnz; 1628f4259b30SLisandro Dalcin PetscScalar *values = NULL; 162938f409ebSLisandro Dalcin PetscBool roworiented = ((Mat_SeqSBAIJ *)B->data)->roworiented; 16300cd7f59aSBarry Smith 163138f409ebSLisandro Dalcin PetscFunctionBegin; 163208401ef6SPierre Jolivet PetscCheck(bs >= 1, PetscObjectComm((PetscObject)B), PETSC_ERR_ARG_OUTOFRANGE, "Invalid block size specified, must be positive but it is %" PetscInt_FMT, bs); 16339566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->rmap, bs)); 16349566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->cmap, bs)); 16359566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 16369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 16379566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 163838f409ebSLisandro Dalcin m = B->rmap->n / bs; 163938f409ebSLisandro Dalcin 1640aed4548fSBarry Smith PetscCheck(!ii[0], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "ii[0] must be 0 but it is %" PetscInt_FMT, ii[0]); 16419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 164238f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 164338f409ebSLisandro Dalcin nz = ii[i + 1] - ii[i]; 164408401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 16450cd7f59aSBarry Smith anz = 0; 16460cd7f59aSBarry Smith for (j = 0; j < nz; j++) { 16470cd7f59aSBarry Smith /* count only values on the diagonal or above */ 16480cd7f59aSBarry Smith if (jj[ii[i] + j] >= i) { 16490cd7f59aSBarry Smith anz = nz - j; 16500cd7f59aSBarry Smith break; 16510cd7f59aSBarry Smith } 16520cd7f59aSBarry Smith } 16530cd7f59aSBarry Smith nz_max = PetscMax(nz_max, anz); 
16540cd7f59aSBarry Smith nnz[i] = anz; 165538f409ebSLisandro Dalcin } 16569566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 16579566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 165838f409ebSLisandro Dalcin 165938f409ebSLisandro Dalcin values = (PetscScalar *)V; 166048a46eb9SPierre Jolivet if (!values) PetscCall(PetscCalloc1(bs * bs * nz_max, &values)); 166138f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 166238f409ebSLisandro Dalcin PetscInt ncols = ii[i + 1] - ii[i]; 166338f409ebSLisandro Dalcin const PetscInt *icols = jj + ii[i]; 166438f409ebSLisandro Dalcin if (!roworiented || bs == 1) { 166538f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * ii[i]) : 0); 16669566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, ncols, icols, svals, INSERT_VALUES)); 166738f409ebSLisandro Dalcin } else { 166838f409ebSLisandro Dalcin for (j = 0; j < ncols; j++) { 166938f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? 
(bs * bs * (ii[i] + j)) : 0); 16709566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, 1, &icols[j], svals, INSERT_VALUES)); 167138f409ebSLisandro Dalcin } 167238f409ebSLisandro Dalcin } 167338f409ebSLisandro Dalcin } 16749566063dSJacob Faibussowitsch if (!V) PetscCall(PetscFree(values)); 16759566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 16769566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 16779566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 16783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 167938f409ebSLisandro Dalcin } 168038f409ebSLisandro Dalcin 1681db4efbfdSBarry Smith /* 1682db4efbfdSBarry Smith This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization 1683db4efbfdSBarry Smith */ 1684d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B, PetscBool natural) 1685d71ae5a4SJacob Faibussowitsch { 1686ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 1687db4efbfdSBarry Smith PetscInt bs = B->rmap->bs; 1688db4efbfdSBarry Smith 1689db4efbfdSBarry Smith PetscFunctionBegin; 16909566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 1691db4efbfdSBarry Smith if (flg) bs = 8; 1692db4efbfdSBarry Smith 1693db4efbfdSBarry Smith if (!natural) { 1694db4efbfdSBarry Smith switch (bs) { 1695d71ae5a4SJacob Faibussowitsch case 1: 1696d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace; 1697d71ae5a4SJacob Faibussowitsch break; 1698d71ae5a4SJacob Faibussowitsch case 2: 1699d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2; 1700d71ae5a4SJacob Faibussowitsch break; 1701d71ae5a4SJacob Faibussowitsch case 3: 1702d71ae5a4SJacob Faibussowitsch 
B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3; 1703d71ae5a4SJacob Faibussowitsch break; 1704d71ae5a4SJacob Faibussowitsch case 4: 1705d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4; 1706d71ae5a4SJacob Faibussowitsch break; 1707d71ae5a4SJacob Faibussowitsch case 5: 1708d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5; 1709d71ae5a4SJacob Faibussowitsch break; 1710d71ae5a4SJacob Faibussowitsch case 6: 1711d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6; 1712d71ae5a4SJacob Faibussowitsch break; 1713d71ae5a4SJacob Faibussowitsch case 7: 1714d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7; 1715d71ae5a4SJacob Faibussowitsch break; 1716d71ae5a4SJacob Faibussowitsch default: 1717d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N; 1718d71ae5a4SJacob Faibussowitsch break; 1719db4efbfdSBarry Smith } 1720db4efbfdSBarry Smith } else { 1721db4efbfdSBarry Smith switch (bs) { 1722d71ae5a4SJacob Faibussowitsch case 1: 1723d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace; 1724d71ae5a4SJacob Faibussowitsch break; 1725d71ae5a4SJacob Faibussowitsch case 2: 1726d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering; 1727d71ae5a4SJacob Faibussowitsch break; 1728d71ae5a4SJacob Faibussowitsch case 3: 1729d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering; 1730d71ae5a4SJacob Faibussowitsch break; 1731d71ae5a4SJacob Faibussowitsch case 4: 1732d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering; 1733d71ae5a4SJacob Faibussowitsch break; 1734d71ae5a4SJacob Faibussowitsch case 5: 
1735d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering; 1736d71ae5a4SJacob Faibussowitsch break; 1737d71ae5a4SJacob Faibussowitsch case 6: 1738d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering; 1739d71ae5a4SJacob Faibussowitsch break; 1740d71ae5a4SJacob Faibussowitsch case 7: 1741d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering; 1742d71ae5a4SJacob Faibussowitsch break; 1743d71ae5a4SJacob Faibussowitsch default: 1744d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering; 1745d71ae5a4SJacob Faibussowitsch break; 1746db4efbfdSBarry Smith } 1747db4efbfdSBarry Smith } 17483ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1749db4efbfdSBarry Smith } 1750db4efbfdSBarry Smith 1751cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType, MatReuse, Mat *); 1752cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType, MatReuse, Mat *); 1753d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatFactorGetSolverType_petsc(Mat A, MatSolverType *type) 1754d71ae5a4SJacob Faibussowitsch { 17554ac6704cSBarry Smith PetscFunctionBegin; 17564ac6704cSBarry Smith *type = MATSOLVERPETSC; 17573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17584ac6704cSBarry Smith } 1759d769727bSBarry Smith 1760d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A, MatFactorType ftype, Mat *B) 1761d71ae5a4SJacob Faibussowitsch { 1762d0f46423SBarry Smith PetscInt n = A->rmap->n; 17635c9eb25fSBarry Smith 17645c9eb25fSBarry Smith PetscFunctionBegin; 17650e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX) 176603e5aca4SStefano Zampini if ((ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) && A->hermitian == PETSC_BOOL3_TRUE && 
A->symmetric != PETSC_BOOL3_TRUE) { 176703e5aca4SStefano Zampini PetscCall(PetscInfo(A, "Hermitian MAT_FACTOR_CHOLESKY or MAT_FACTOR_ICC are not supported. Use MAT_FACTOR_LU instead.\n")); 176803e5aca4SStefano Zampini *B = NULL; 176903e5aca4SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS); 177003e5aca4SStefano Zampini } 17710e92d65fSHong Zhang #endif 1772eb1ec7c1SStefano Zampini 17739566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 17749566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, n, n, n, n)); 17755c9eb25fSBarry Smith if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) { 17769566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATSEQSBAIJ)); 17779566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*B, A->rmap->bs, MAT_SKIP_ALLOCATION, NULL)); 177826fbe8dcSKarl Rupp 17797b056e98SHong Zhang (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ; 1780c6d0d4f0SHong Zhang (*B)->ops->iccfactorsymbolic = MatICCFactorSymbolic_SeqSBAIJ; 17819566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_CHOLESKY])); 17829566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_ICC])); 1783e32f2f54SBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "Factor type not supported"); 178400c67f3bSHong Zhang 1785d5f3da31SBarry Smith (*B)->factortype = ftype; 1786f73b0415SBarry Smith (*B)->canuseordering = PETSC_TRUE; 17879566063dSJacob Faibussowitsch PetscCall(PetscFree((*B)->solvertype)); 17889566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &(*B)->solvertype)); 17899566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)*B, "MatFactorGetSolverType_C", MatFactorGetSolverType_petsc)); 17903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17915c9eb25fSBarry Smith } 17925c9eb25fSBarry Smith 
17938397e458SBarry Smith /*@C 17942ef1f0ffSBarry Smith MatSeqSBAIJGetArray - gives access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored 17958397e458SBarry Smith 17968397e458SBarry Smith Not Collective 17978397e458SBarry Smith 17988397e458SBarry Smith Input Parameter: 1799fe59aa6dSJacob Faibussowitsch . A - a `MATSEQSBAIJ` matrix 18008397e458SBarry Smith 18018397e458SBarry Smith Output Parameter: 18028397e458SBarry Smith . array - pointer to the data 18038397e458SBarry Smith 18048397e458SBarry Smith Level: intermediate 18058397e458SBarry Smith 18061cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJRestoreArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18078397e458SBarry Smith @*/ 1808d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJGetArray(Mat A, PetscScalar **array) 1809d71ae5a4SJacob Faibussowitsch { 18108397e458SBarry Smith PetscFunctionBegin; 1811cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJGetArray_C", (Mat, PetscScalar **), (A, array)); 18123ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18138397e458SBarry Smith } 18148397e458SBarry Smith 18158397e458SBarry Smith /*@C 18162ef1f0ffSBarry Smith MatSeqSBAIJRestoreArray - returns access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored obtained by `MatSeqSBAIJGetArray()` 18178397e458SBarry Smith 18188397e458SBarry Smith Not Collective 18198397e458SBarry Smith 18208397e458SBarry Smith Input Parameters: 1821fe59aa6dSJacob Faibussowitsch + A - a `MATSEQSBAIJ` matrix 1822a2b725a8SWilliam Gropp - array - pointer to the data 18238397e458SBarry Smith 18248397e458SBarry Smith Level: intermediate 18258397e458SBarry Smith 18261cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJGetArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18278397e458SBarry Smith @*/ 1828d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJRestoreArray(Mat A, PetscScalar **array) 
1829d71ae5a4SJacob Faibussowitsch { 18308397e458SBarry Smith PetscFunctionBegin; 1831cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJRestoreArray_C", (Mat, PetscScalar **), (A, array)); 18323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18338397e458SBarry Smith } 18348397e458SBarry Smith 18350bad9183SKris Buschelman /*MC 1836fafad747SKris Buschelman MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices, 18370bad9183SKris Buschelman based on block compressed sparse row format. Only the upper triangular portion of the matrix is stored. 18380bad9183SKris Buschelman 1839828413b8SBarry Smith For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you 184011a5261eSBarry Smith can call `MatSetOption`(`Mat`, `MAT_HERMITIAN`). 1841828413b8SBarry Smith 18422ef1f0ffSBarry Smith Options Database Key: 184311a5261eSBarry Smith . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to `MatSetFromOptions()` 18440bad9183SKris Buschelman 18452ef1f0ffSBarry Smith Level: beginner 18462ef1f0ffSBarry Smith 184795452b02SPatrick Sanan Notes: 184895452b02SPatrick Sanan By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not 184911a5261eSBarry Smith stored and it is assumed they symmetric to the upper triangular). If you call `MatSetOption`(`Mat`,`MAT_IGNORE_LOWER_TRIANGULAR`,`PETSC_FALSE`) or use 18502ef1f0ffSBarry Smith the options database `-mat_ignore_lower_triangular` false it will generate an error if you try to set a value in the lower triangular portion. 
185171dad5bbSBarry Smith 1852476417e5SBarry Smith The number of rows in the matrix must be less than or equal to the number of columns 185371dad5bbSBarry Smith 18541cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ()`, `MatType`, `MATMPISBAIJ` 18550bad9183SKris Buschelman M*/ 1856d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B) 1857d71ae5a4SJacob Faibussowitsch { 1858a23d5eceSKris Buschelman Mat_SeqSBAIJ *b; 185913f74950SBarry Smith PetscMPIInt size; 1860ace3abfcSBarry Smith PetscBool no_unroll = PETSC_FALSE, no_inode = PETSC_FALSE; 1861a23d5eceSKris Buschelman 1862a23d5eceSKris Buschelman PetscFunctionBegin; 18639566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 186408401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Comm must be of size 1"); 1865a23d5eceSKris Buschelman 18664dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 1867a23d5eceSKris Buschelman B->data = (void *)b; 1868aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 186926fbe8dcSKarl Rupp 1870a23d5eceSKris Buschelman B->ops->destroy = MatDestroy_SeqSBAIJ; 1871a23d5eceSKris Buschelman B->ops->view = MatView_SeqSBAIJ; 1872f4259b30SLisandro Dalcin b->row = NULL; 1873f4259b30SLisandro Dalcin b->icol = NULL; 1874a23d5eceSKris Buschelman b->reallocs = 0; 1875f4259b30SLisandro Dalcin b->saved_values = NULL; 18760def2e27SBarry Smith b->inode.limit = 5; 18770def2e27SBarry Smith b->inode.max_limit = 5; 1878a23d5eceSKris Buschelman 1879a23d5eceSKris Buschelman b->roworiented = PETSC_TRUE; 1880a23d5eceSKris Buschelman b->nonew = 0; 1881f4259b30SLisandro Dalcin b->diag = NULL; 1882f4259b30SLisandro Dalcin b->solve_work = NULL; 1883f4259b30SLisandro Dalcin b->mult_work = NULL; 1884f4259b30SLisandro Dalcin B->spptr = NULL; 1885f2cbd3d5SJed Brown B->info.nz_unneeded = (PetscReal)b->maxnz * b->bs2; 1886a9817697SBarry Smith b->keepnonzeropattern = 
PETSC_FALSE; 1887a23d5eceSKris Buschelman 1888f4259b30SLisandro Dalcin b->inew = NULL; 1889f4259b30SLisandro Dalcin b->jnew = NULL; 1890f4259b30SLisandro Dalcin b->anew = NULL; 1891f4259b30SLisandro Dalcin b->a2anew = NULL; 1892a23d5eceSKris Buschelman b->permute = PETSC_FALSE; 1893a23d5eceSKris Buschelman 189471dad5bbSBarry Smith b->ignore_ltriangular = PETSC_TRUE; 189526fbe8dcSKarl Rupp 18969566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_ignore_lower_triangular", &b->ignore_ltriangular, NULL)); 1897941593c8SHong Zhang 1898f5edf698SHong Zhang b->getrow_utriangular = PETSC_FALSE; 189926fbe8dcSKarl Rupp 19009566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_getrow_uppertriangular", &b->getrow_utriangular, NULL)); 1901f5edf698SHong Zhang 19029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJGetArray_C", MatSeqSBAIJGetArray_SeqSBAIJ)); 19039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJRestoreArray_C", MatSeqSBAIJRestoreArray_SeqSBAIJ)); 19049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqSBAIJ)); 19059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqSBAIJ)); 19069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetColumnIndices_C", MatSeqSBAIJSetColumnIndices_SeqSBAIJ)); 19079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqaij_C", MatConvert_SeqSBAIJ_SeqAIJ)); 19089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqbaij_C", MatConvert_SeqSBAIJ_SeqBAIJ)); 19099566063dSJacob Faibussowitsch 
PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocation_C", MatSeqSBAIJSetPreallocation_SeqSBAIJ)); 19109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocationCSR_C", MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ)); 19116214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 19129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_elemental_C", MatConvert_SeqSBAIJ_Elemental)); 19136214f412SHong Zhang #endif 1914d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 19159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_scalapack_C", MatConvert_SBAIJ_ScaLAPACK)); 1916d24d4204SJose E. Roman #endif 191723ce1328SBarry Smith 1918b94d7dedSBarry Smith B->symmetry_eternal = PETSC_TRUE; 1919b94d7dedSBarry Smith B->structural_symmetry_eternal = PETSC_TRUE; 1920b94d7dedSBarry Smith B->symmetric = PETSC_BOOL3_TRUE; 1921b94d7dedSBarry Smith B->structurally_symmetric = PETSC_BOOL3_TRUE; 1922eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 1923b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_FALSE; 1924eb1ec7c1SStefano Zampini #else 1925b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_TRUE; 1926eb1ec7c1SStefano Zampini #endif 192713647f61SHong Zhang 19289566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQSBAIJ)); 19290def2e27SBarry Smith 1930d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)B), ((PetscObject)B)->prefix, "Options for SEQSBAIJ matrix", "Mat"); 19319566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_unroll", "Do not optimize for inodes (slower)", NULL, no_unroll, &no_unroll, NULL)); 193248a46eb9SPierre Jolivet if (no_unroll) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_unroll\n")); 19339566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_inode", "Do not optimize for inodes (slower)", 
NULL, no_inode, &no_inode, NULL)); 19349566063dSJacob Faibussowitsch if (no_inode) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_inode\n")); 19359566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-mat_inode_limit", "Do not use inodes larger then this value", NULL, b->inode.limit, &b->inode.limit, NULL)); 1936d0609cedSBarry Smith PetscOptionsEnd(); 1937ace3abfcSBarry Smith b->inode.use = (PetscBool)(!(no_unroll || no_inode)); 19380def2e27SBarry Smith if (b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit; 19393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1940a23d5eceSKris Buschelman } 1941a23d5eceSKris Buschelman 1942a23d5eceSKris Buschelman /*@C 1943a23d5eceSKris Buschelman MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block 194411a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 194520f4b53cSBarry Smith user should preallocate the matrix storage by setting the parameter `nz` 194620f4b53cSBarry Smith (or the array `nnz`). 1947a23d5eceSKris Buschelman 1948c3339decSBarry Smith Collective 1949a23d5eceSKris Buschelman 1950a23d5eceSKris Buschelman Input Parameters: 19511c4f3114SJed Brown + B - the symmetric matrix 195211a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 195311a5261eSBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()` 1954a23d5eceSKris Buschelman . 
nz - number of block nonzeros per block row (same for all rows)
- nnz - array containing the number of block nonzeros in the upper triangular plus
        diagonal portion of each block (possibly different for each block row) or `NULL`

  Options Database Keys:
+ -mat_no_unroll  - uses code that does not unroll the loops in the
                    block calculations (much slower)
- -mat_block_size - size of the blocks to use (only works if a negative bs is passed in)

  Level: intermediate

  Notes:
  Specify the preallocated storage with either `nz` or `nnz` (not both).
  Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
  allocation. See [Sparse Matrices](sec_matsparse) for details.

  You can call `MatGetInfo()` to get information on how effective the preallocation was;
  for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
  You can also run with the option `-info` and look for messages with the string
  malloc in them to see if additional memory allocation was needed.
1974aa95bbe8SBarry Smith 19752ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 197649a6f317SBarry Smith 19771cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 1978a23d5eceSKris Buschelman @*/ 1979d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 1980d71ae5a4SJacob Faibussowitsch { 1981a23d5eceSKris Buschelman PetscFunctionBegin; 19826ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 19836ba663aaSJed Brown PetscValidType(B, 1); 19846ba663aaSJed Brown PetscValidLogicalCollectiveInt(B, bs, 2); 1985cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocation_C", (Mat, PetscInt, PetscInt, const PetscInt[]), (B, bs, nz, nnz)); 19863ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1987a23d5eceSKris Buschelman } 198849b5e25fSSatish Balay 198938f409ebSLisandro Dalcin /*@C 199011a5261eSBarry Smith MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in `MATSEQSBAIJ` format using the given nonzero structure and (optional) numerical values 199138f409ebSLisandro Dalcin 199238f409ebSLisandro Dalcin Input Parameters: 19931c4f3114SJed Brown + B - the matrix 1994eab78319SHong Zhang . bs - size of block, the blocks are ALWAYS square. 199538f409ebSLisandro Dalcin . i - the indices into j for the start of each local row (starts with zero) 199638f409ebSLisandro Dalcin . j - the column indices for each local row (starts with zero) these must be sorted for each row 199738f409ebSLisandro Dalcin - v - optional values in the matrix 199838f409ebSLisandro Dalcin 1999664954b6SBarry Smith Level: advanced 200038f409ebSLisandro Dalcin 200138f409ebSLisandro Dalcin Notes: 200211a5261eSBarry Smith The order of the entries in values is specified by the `MatOption` `MAT_ROW_ORIENTED`. 
For example, C programs 200311a5261eSBarry Smith may want to use the default `MAT_ROW_ORIENTED` = `PETSC_TRUE` and use an array v[nnz][bs][bs] where the second index is 200438f409ebSLisandro Dalcin over rows within a block and the last index is over columns within a block row. Fortran programs will likely set 200511a5261eSBarry Smith `MAT_ROW_ORIENTED` = `PETSC_FALSE` and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a 200638f409ebSLisandro Dalcin block column and the second index is over columns within a block. 200738f409ebSLisandro Dalcin 200850c5228eSBarry Smith Any entries below the diagonal are ignored 20090cd7f59aSBarry Smith 20100cd7f59aSBarry Smith Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries 20110cd7f59aSBarry Smith and usually the numerical values as well 2012664954b6SBarry Smith 2013fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqSBAIJ()`, `MatSetValuesBlocked()`, `MatSeqSBAIJSetPreallocation()` 201438f409ebSLisandro Dalcin @*/ 2015d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B, PetscInt bs, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 2016d71ae5a4SJacob Faibussowitsch { 201738f409ebSLisandro Dalcin PetscFunctionBegin; 201838f409ebSLisandro Dalcin PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 201938f409ebSLisandro Dalcin PetscValidType(B, 1); 202038f409ebSLisandro Dalcin PetscValidLogicalCollectiveInt(B, bs, 2); 2021cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocationCSR_C", (Mat, PetscInt, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, bs, i, j, v)); 20223ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202338f409ebSLisandro Dalcin } 202438f409ebSLisandro Dalcin 2025c464158bSHong Zhang /*@C 20262ef1f0ffSBarry Smith MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in (block 202711a5261eSBarry 
  compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the
  user should preallocate the matrix storage by setting the parameter `nz`
  (or the array `nnz`).

  Collective

  Input Parameters:
+ comm - MPI communicator, set to `PETSC_COMM_SELF`
. bs   - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row
         blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()`
. m    - number of rows
. n    - number of columns
. nz   - number of block nonzeros per block row (same for all rows)
- nnz  - array containing the number of block nonzeros in the upper triangular plus
         diagonal portion of each block (possibly different for each block row) or `NULL`

  Output Parameter:
. A - the symmetric matrix

  Options Database Keys:
+ -mat_no_unroll  - uses code that does not unroll the loops in the
                    block calculations (much slower)
- -mat_block_size - size of the blocks to use

  Level: intermediate

  Notes:
  It is recommended that one use `MatCreateFromOptions()` or the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`,
  MatXXXXSetPreallocation() paradigm instead of this routine directly.
205611a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 2057175b88e8SBarry Smith 20586d6d819aSHong Zhang The number of rows and columns must be divisible by blocksize. 20596d6d819aSHong Zhang This matrix type does not support complex Hermitian operation. 2060c464158bSHong Zhang 20612ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 20622ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 2063651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2064c464158bSHong Zhang 20652ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 206649a6f317SBarry Smith 20671cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2068c464158bSHong Zhang @*/ 2069d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 2070d71ae5a4SJacob Faibussowitsch { 2071c464158bSHong Zhang PetscFunctionBegin; 20729566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 20739566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 20749566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQSBAIJ)); 20759566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*A, bs, nz, (PetscInt *)nnz)); 20763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 207749b5e25fSSatish Balay } 207849b5e25fSSatish Balay 2079d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 2080d71ae5a4SJacob Faibussowitsch { 208149b5e25fSSatish Balay Mat C; 208249b5e25fSSatish Balay Mat_SeqSBAIJ *c, *a = (Mat_SeqSBAIJ *)A->data; 2083b40805acSSatish Balay PetscInt i, mbs = a->mbs, nz = a->nz, bs2 = a->bs2; 208449b5e25fSSatish 
Balay 208549b5e25fSSatish Balay PetscFunctionBegin; 208631fe6a7dSBarry Smith PetscCheck(A->assembled, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 208708401ef6SPierre Jolivet PetscCheck(a->i[mbs] == nz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Corrupt matrix"); 208849b5e25fSSatish Balay 2089f4259b30SLisandro Dalcin *B = NULL; 20909566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 20919566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->rmap->N, A->cmap->n, A->rmap->N, A->cmap->n)); 20929566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, A)); 20939566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATSEQSBAIJ)); 2094692f9cbeSHong Zhang c = (Mat_SeqSBAIJ *)C->data; 2095692f9cbeSHong Zhang 2096273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2097d5f3da31SBarry Smith C->factortype = A->factortype; 2098f4259b30SLisandro Dalcin c->row = NULL; 2099f4259b30SLisandro Dalcin c->icol = NULL; 2100f4259b30SLisandro Dalcin c->saved_values = NULL; 2101a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 210249b5e25fSSatish Balay C->assembled = PETSC_TRUE; 210349b5e25fSSatish Balay 21049566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 21059566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 210649b5e25fSSatish Balay c->bs2 = a->bs2; 210749b5e25fSSatish Balay c->mbs = a->mbs; 210849b5e25fSSatish Balay c->nbs = a->nbs; 210949b5e25fSSatish Balay 2110c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2111c760cd28SBarry Smith c->imax = a->imax; 2112c760cd28SBarry Smith c->ilen = a->ilen; 2113c760cd28SBarry Smith c->free_imax_ilen = PETSC_FALSE; 2114c760cd28SBarry Smith } else { 21159566063dSJacob Faibussowitsch PetscCall(PetscMalloc2((mbs + 1), &c->imax, (mbs + 1), &c->ilen)); 211649b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 211749b5e25fSSatish Balay c->imax[i] = a->imax[i]; 
211849b5e25fSSatish Balay c->ilen[i] = a->ilen[i]; 211949b5e25fSSatish Balay } 2120c760cd28SBarry Smith c->free_imax_ilen = PETSC_TRUE; 2121c760cd28SBarry Smith } 212249b5e25fSSatish Balay 212349b5e25fSSatish Balay /* allocate the matrix space */ 21244da8f245SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 21259566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2 * nz, &c->a)); 212644e1c64aSLisandro Dalcin c->i = a->i; 212744e1c64aSLisandro Dalcin c->j = a->j; 21284da8f245SBarry Smith c->singlemalloc = PETSC_FALSE; 212944e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21304da8f245SBarry Smith c->free_ij = PETSC_FALSE; 21314da8f245SBarry Smith c->parent = A; 21329566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)A)); 21339566063dSJacob Faibussowitsch PetscCall(MatSetOption(A, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21349566063dSJacob Faibussowitsch PetscCall(MatSetOption(C, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21354da8f245SBarry Smith } else { 21369566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &c->a, nz, &c->j, mbs + 1, &c->i)); 21379566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, mbs + 1)); 21384da8f245SBarry Smith c->singlemalloc = PETSC_TRUE; 213944e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21404da8f245SBarry Smith c->free_ij = PETSC_TRUE; 21414da8f245SBarry Smith } 214249b5e25fSSatish Balay if (mbs > 0) { 214348a46eb9SPierre Jolivet if (cpvalues != MAT_SHARE_NONZERO_PATTERN) PetscCall(PetscArraycpy(c->j, a->j, nz)); 214449b5e25fSSatish Balay if (cpvalues == MAT_COPY_VALUES) { 21459566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, a->a, bs2 * nz)); 214649b5e25fSSatish Balay } else { 21479566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, bs2 * nz)); 214849b5e25fSSatish Balay } 2149a1c3900fSBarry Smith if (a->jshort) { 215044e1c64aSLisandro Dalcin /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */ 215144e1c64aSLisandro Dalcin /* if the parent 
matrix is reassembled, this child matrix will never notice */ 21529566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &c->jshort)); 21539566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->jshort, a->jshort, nz)); 215426fbe8dcSKarl Rupp 21554da8f245SBarry Smith c->free_jshort = PETSC_TRUE; 21564da8f245SBarry Smith } 2157a1c3900fSBarry Smith } 215849b5e25fSSatish Balay 215949b5e25fSSatish Balay c->roworiented = a->roworiented; 216049b5e25fSSatish Balay c->nonew = a->nonew; 216149b5e25fSSatish Balay 216249b5e25fSSatish Balay if (a->diag) { 2163c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2164c760cd28SBarry Smith c->diag = a->diag; 2165c760cd28SBarry Smith c->free_diag = PETSC_FALSE; 2166c760cd28SBarry Smith } else { 21679566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mbs, &c->diag)); 216826fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) c->diag[i] = a->diag[i]; 2169c760cd28SBarry Smith c->free_diag = PETSC_TRUE; 2170c760cd28SBarry Smith } 217144e1c64aSLisandro Dalcin } 21726c6c5352SBarry Smith c->nz = a->nz; 2173f2cbd3d5SJed Brown c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 2174f4259b30SLisandro Dalcin c->solve_work = NULL; 2175f4259b30SLisandro Dalcin c->mult_work = NULL; 217626fbe8dcSKarl Rupp 217749b5e25fSSatish Balay *B = C; 21789566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 21793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 218049b5e25fSSatish Balay } 218149b5e25fSSatish Balay 2182618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */ 2183618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary 2184618cc2edSLisandro Dalcin 2185d71ae5a4SJacob Faibussowitsch /* MatLoad_SeqSBAIJ - loads mat from viewer. Only viewers whose type compares equal to PETSCVIEWERBINARY are accepted (any other type fails the PetscCheck below with PETSC_ERR_SUP); the read itself is delegated to MatLoad_SeqSBAIJ_Binary(), which the #define above maps to MatLoad_SeqBAIJ_Binary(). */ PetscErrorCode MatLoad_SeqSBAIJ(Mat mat, PetscViewer viewer) 2186d71ae5a4SJacob Faibussowitsch { 21877f489da9SVaclav Hapla PetscBool isbinary; 21882f480046SShri Abhyankar 21892f480046SShri Abhyankar PetscFunctionBegin;
21909566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 219128b400f6SJacob Faibussowitsch PetscCheck(isbinary, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)mat)->type_name); 21929566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqSBAIJ_Binary(mat, viewer)); 21933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 21942f480046SShri Abhyankar } 21952f480046SShri Abhyankar 2196c75a6043SHong Zhang /*@ 219711a5261eSBarry Smith MatCreateSeqSBAIJWithArrays - Creates a sequential `MATSEQSBAIJ` matrix using matrix elements 2198c75a6043SHong Zhang (upper triangular entries in CSR format) provided by the user. 2199c75a6043SHong Zhang 2200d083f849SBarry Smith Collective 2201c75a6043SHong Zhang 2202c75a6043SHong Zhang Input Parameters: 2203c75a6043SHong Zhang + comm - must be an MPI communicator of size 1 2204c75a6043SHong Zhang . bs - size of block (only 1 is currently accepted; any other value generates a `PETSC_ERR_SUP` error) 2205c75a6043SHong Zhang . m - number of rows 2206c75a6043SHong Zhang . n - number of columns 2207483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that block row of the matrix 2208c75a6043SHong Zhang . j - column indices 2209c75a6043SHong Zhang - a - matrix values 2210c75a6043SHong Zhang 2211c75a6043SHong Zhang Output Parameter: 2212c75a6043SHong Zhang . mat - the matrix 2213c75a6043SHong Zhang 2214dfb205c3SBarry Smith Level: advanced 2215c75a6043SHong Zhang 2216c75a6043SHong Zhang Notes: 22172ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine; the user must free these arrays 2218c75a6043SHong Zhang once the matrix is destroyed. 2219c75a6043SHong Zhang 2220c75a6043SHong Zhang You cannot set new nonzero locations into this matrix, that will generate an error.
2221c75a6043SHong Zhang 22222ef1f0ffSBarry Smith The `i` and `j` indices are 0-based. 2223c75a6043SHong Zhang 22242ef1f0ffSBarry Smith When block size is greater than 1 the matrix values must be stored using the `MATSBAIJ` storage format. For block size of 1 2225dfb205c3SBarry Smith it is the regular CSR format excluding the lower triangular elements. 2226dfb205c3SBarry Smith 22271cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSBAIJ()`, `MatCreateSeqSBAIJ()` 2228c75a6043SHong Zhang @*/ 2229d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 2230d71ae5a4SJacob Faibussowitsch { 2231c75a6043SHong Zhang PetscInt ii; 2232c75a6043SHong Zhang Mat_SeqSBAIJ *sbaij; 2233c75a6043SHong Zhang 2234c75a6043SHong Zhang PetscFunctionBegin; /* argument checks run before any object is created: only bs == 1 passes, and i[0] must be 0 unless m == 0 */ 223508401ef6SPierre Jolivet PetscCheck(bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "block size %" PetscInt_FMT " > 1 is not supported yet", bs); 2236aed4548fSBarry Smith PetscCheck(m == 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 2237c75a6043SHong Zhang 22389566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 22399566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 22409566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQSBAIJ)); /* preallocation is requested with MAT_SKIP_ALLOCATION; the caller's i, j and a arrays are attached directly below instead */ 22419566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*mat, bs, MAT_SKIP_ALLOCATION, NULL)); 2242c75a6043SHong Zhang sbaij = (Mat_SeqSBAIJ *)(*mat)->data; 22439566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(m, &sbaij->imax, m, &sbaij->ilen)); 2244c75a6043SHong Zhang 2245c75a6043SHong Zhang sbaij->i = i; 2246c75a6043SHong Zhang sbaij->j = j; 2247c75a6043SHong Zhang sbaij->a = a; 224826fbe8dcSKarl Rupp 2249c75a6043SHong Zhang sbaij->singlemalloc = PETSC_FALSE; 2250c75a6043SHong Zhang sbaij->nonew = -1; /* this indicates that inserting a new
value in the matrix that generates a new nonzero is an error */ /* free_a and free_ij are cleared for the caller-provided arrays; only the imax/ilen pair allocated above is flagged. NOTE(review): presumably these flags decide what the destroy routine frees -- confirm against MatDestroy_SeqSBAIJ() */ 2251e6b907acSBarry Smith sbaij->free_a = PETSC_FALSE; 2252e6b907acSBarry Smith sbaij->free_ij = PETSC_FALSE; 2253ddf7884eSMatthew Knepley sbaij->free_imax_ilen = PETSC_TRUE; 2254c75a6043SHong Zhang /* per-row lengths are the differences of consecutive entries of i; the negative-length check runs after the assignment */ 2255c75a6043SHong Zhang for (ii = 0; ii < m; ii++) { 2256c75a6043SHong Zhang sbaij->ilen[ii] = sbaij->imax[ii] = i[ii + 1] - i[ii]; 22576bdcaf15SBarry Smith PetscCheck(i[ii + 1] >= i[ii], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 2258c75a6043SHong Zhang } /* column indices are checked against [0, n) only when PetscDefined(USE_DEBUG) is true */ 225976bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 2260c75a6043SHong Zhang for (ii = 0; ii < sbaij->i[m]; ii++) { 22616bdcaf15SBarry Smith PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 22626bdcaf15SBarry Smith PetscCheck(j[ii] < n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index too large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 2263c75a6043SHong Zhang } 226476bd3646SJed Brown } 2265c75a6043SHong Zhang 22669566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 22679566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 22683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2269c75a6043SHong Zhang } 2270d06b337dSHong Zhang 2271d71ae5a4SJacob Faibussowitsch /* MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ - forwards every argument unchanged to MatCreateMPIMatConcatenateSeqMat_MPISBAIJ() and returns its result. */ PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 2272d71ae5a4SJacob Faibussowitsch { 227359f5e6ceSHong Zhang PetscFunctionBegin; 22749566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm, inmat, n, scall, outmat)); 22753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227659f5e6ceSHong Zhang } 2277