149b5e25fSSatish Balay 249b5e25fSSatish Balay /* 3a1373b80SHong Zhang Defines the basic matrix operations for the SBAIJ (compressed row) 449b5e25fSSatish Balay matrix storage format. 549b5e25fSSatish Balay */ 6c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 8c6db04a5SJed Brown #include <petscblaslapack.h> 949b5e25fSSatish Balay 10c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1170dcbbb9SBarry Smith #define USESHORT 12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1370dcbbb9SBarry Smith 1426cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1526cec326SBarry Smith #define TYPE SBAIJ 1626cec326SBarry Smith #define TYPE_SBAIJ 1726cec326SBarry Smith #define TYPE_BS 1826cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1926cec326SBarry Smith #undef TYPE_BS 2026cec326SBarry Smith #define TYPE_BS _BS 2126cec326SBarry Smith #define TYPE_BS_ON 2226cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 2326cec326SBarry Smith #undef TYPE_BS 2426cec326SBarry Smith #undef TYPE_SBAIJ 2526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 2626cec326SBarry Smith #undef TYPE 2726cec326SBarry Smith #undef TYPE_BS_ON 2826cec326SBarry Smith 296214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 30cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 316214f412SHong Zhang #endif 32d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 33d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 34d24d4204SJose E. Roman #endif 3528d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat, MatType, MatReuse, Mat *); 36b5b17502SBarry Smith 3749b5e25fSSatish Balay /* 3849b5e25fSSatish Balay Checks for missing diagonals 3949b5e25fSSatish Balay */ 40ba38deedSJacob Faibussowitsch static PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A, PetscBool *missing, PetscInt *dd) 41d71ae5a4SJacob Faibussowitsch { 42045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 437734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 4449b5e25fSSatish Balay 4549b5e25fSSatish Balay PetscFunctionBegin; 469566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(A)); 472af78befSBarry Smith *missing = PETSC_FALSE; 487734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 49358d2f5dSShri Abhyankar *missing = PETSC_TRUE; 50358d2f5dSShri Abhyankar if (dd) *dd = 0; 519566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 52358d2f5dSShri Abhyankar } else { 53358d2f5dSShri Abhyankar diag = a->diag; 5449b5e25fSSatish Balay for (i = 0; i < a->mbs; i++) { 557734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 562af78befSBarry Smith *missing = PETSC_TRUE; 572af78befSBarry Smith if (dd) *dd = i; 582af78befSBarry Smith break; 592af78befSBarry Smith } 6049b5e25fSSatish Balay } 61358d2f5dSShri Abhyankar } 623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6349b5e25fSSatish Balay } 6449b5e25fSSatish Balay 65d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A) 66d71ae5a4SJacob Faibussowitsch { 67045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 6848dd3d27SHong Zhang PetscInt i, j; 6949b5e25fSSatish Balay 7049b5e25fSSatish Balay PetscFunctionBegin; 7109f38230SBarry Smith if (!a->diag) { 729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->mbs, &a->diag)); 73c760cd28SBarry Smith a->free_diag = PETSC_TRUE; 7409f38230SBarry Smith } 7548dd3d27SHong Zhang for (i = 0; i < a->mbs; i++) { 7648dd3d27SHong Zhang a->diag[i] = a->i[i + 1]; 7748dd3d27SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 7848dd3d27SHong Zhang if (a->j[j] == i) { 7948dd3d27SHong Zhang a->diag[i] = j; 8048dd3d27SHong Zhang break; 8148dd3d27SHong Zhang } 8248dd3d27SHong Zhang } 8348dd3d27SHong Zhang } 843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8549b5e25fSSatish Balay } 8649b5e25fSSatish Balay 87d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *inia[], const PetscInt *inja[], PetscBool *done) 88d71ae5a4SJacob Faibussowitsch { 89a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 902462f5fdSStefano Zampini PetscInt i, j, n = a->mbs, nz = a->i[n], *tia, *tja, bs = A->rmap->bs, k, l, cnt; 912462f5fdSStefano Zampini PetscInt **ia = (PetscInt **)inia, **ja = (PetscInt **)inja; 9249b5e25fSSatish Balay 9349b5e25fSSatish Balay PetscFunctionBegin; 94d3e5a4abSHong Zhang *nn = n; 953ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 962462f5fdSStefano Zampini if (symmetric) { 979566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(n, a->i, a->j, PETSC_FALSE, 0, 0, &tia, &tja)); 982462f5fdSStefano Zampini nz = tia[n]; 992462f5fdSStefano Zampini } else { 1009371c9d4SSatish Balay tia = a->i; 1019371c9d4SSatish Balay tja = a->j; 1022462f5fdSStefano Zampini } 1032462f5fdSStefano Zampini 1042462f5fdSStefano Zampini if (!blockcompressed && bs > 1) { 1052462f5fdSStefano Zampini (*nn) *= bs; 1068f7157efSSatish Balay /* malloc & create the natural set of indices */ 1079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1((n + 1) * bs, ia)); 1082462f5fdSStefano Zampini if (n) { 1092462f5fdSStefano Zampini (*ia)[0] = oshift; 110ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[j] = (tia[1] - tia[0]) * bs + (*ia)[j - 1]; 1112462f5fdSStefano Zampini } 1122462f5fdSStefano Zampini 1132462f5fdSStefano Zampini for (i = 1; i < n; i++) { 1142462f5fdSStefano Zampini (*ia)[i * bs] = (tia[i] - tia[i - 1]) * bs + (*ia)[i * bs - 1]; 115ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[i * bs + j] = (tia[i + 1] - tia[i]) * bs + (*ia)[i * bs + j - 1]; 1162462f5fdSStefano Zampini } 117ad540459SPierre Jolivet if (n) (*ia)[n * bs] = (tia[n] - tia[n - 1]) * bs + (*ia)[n * bs - 1]; 1182462f5fdSStefano Zampini 1192462f5fdSStefano Zampini if (inja) { 1209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz * bs * bs, ja)); 1212462f5fdSStefano Zampini cnt = 0; 1222462f5fdSStefano Zampini for (i = 0; i < n; i++) { 1238f7157efSSatish Balay for (j = 0; j < bs; j++) { 1242462f5fdSStefano Zampini for (k = tia[i]; k < tia[i + 1]; k++) { 125ad540459SPierre Jolivet for (l = 0; l < bs; l++) (*ja)[cnt++] = bs * tja[k] + l; 1268f7157efSSatish Balay } 1278f7157efSSatish Balay } 1288f7157efSSatish Balay } 1298f7157efSSatish Balay } 1302462f5fdSStefano Zampini 1312462f5fdSStefano Zampini if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */ 1329566063dSJacob Faibussowitsch PetscCall(PetscFree(tia)); 1339566063dSJacob Faibussowitsch PetscCall(PetscFree(tja)); 1342462f5fdSStefano Zampini } 1352462f5fdSStefano Zampini } else if (oshift == 1) { 1362462f5fdSStefano Zampini if (symmetric) { 1372462f5fdSStefano Zampini nz = tia[A->rmap->n / bs]; 1382462f5fdSStefano Zampini /* add 1 to i and j indices */ 1392462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) tia[i] = tia[i] + 1; 1402462f5fdSStefano Zampini *ia = tia; 1412462f5fdSStefano Zampini if (ja) { 1422462f5fdSStefano Zampini for (i = 0; i < nz; i++) tja[i] = tja[i] + 1; 1432462f5fdSStefano Zampini *ja = tja; 1442462f5fdSStefano Zampini } 1452462f5fdSStefano Zampini } else { 1462462f5fdSStefano Zampini nz = a->i[A->rmap->n / bs]; 1472462f5fdSStefano Zampini /* malloc space and add 1 to i and j indices */ 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n / bs + 1, ia)); 1492462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) (*ia)[i] = a->i[i] + 1; 1502462f5fdSStefano Zampini if (ja) { 1519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, ja)); 1522462f5fdSStefano Zampini for (i = 0; i < nz; i++) (*ja)[i] = a->j[i] + 1; 1532462f5fdSStefano Zampini } 1542462f5fdSStefano Zampini } 1552462f5fdSStefano Zampini } else { 1562462f5fdSStefano Zampini *ia = tia; 1572462f5fdSStefano Zampini if (ja) *ja = tja; 158a6ece127SHong Zhang } 1593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16049b5e25fSSatish Balay } 16149b5e25fSSatish Balay 162d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 163d71ae5a4SJacob Faibussowitsch { 16449b5e25fSSatish Balay PetscFunctionBegin; 1653ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 1662462f5fdSStefano Zampini if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) { 1679566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 1689566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 169a6ece127SHong Zhang } 1703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17149b5e25fSSatish Balay } 17249b5e25fSSatish Balay 173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqSBAIJ(Mat A) 174d71ae5a4SJacob Faibussowitsch { 17549b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 17649b5e25fSSatish Balay 17749b5e25fSSatish Balay PetscFunctionBegin; 178b4e2f619SBarry Smith if (A->hash_active) { 179b4e2f619SBarry Smith PetscInt bs; 180e3c72094SPierre Jolivet A->ops[0] = a->cops; 181b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 182b4e2f619SBarry Smith PetscCall(MatGetBlockSize(A, &bs)); 183b4e2f619SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&a->bht)); 184b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 185b4e2f619SBarry Smith PetscCall(PetscFree(a->bdnz)); 186b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 187b4e2f619SBarry Smith } 1883ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->N, a->nz)); 1899566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 1909566063dSJacob Faibussowitsch if (a->free_diag) PetscCall(PetscFree(a->diag)); 1919566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1929566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1939566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 1949566063dSJacob Faibussowitsch PetscCall(PetscFree(a->idiag)); 1959566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inode.size)); 1969566063dSJacob Faibussowitsch if (a->free_imax_ilen) PetscCall(PetscFree2(a->imax, a->ilen)); 1979566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 1989566063dSJacob Faibussowitsch PetscCall(PetscFree(a->sor_work)); 1999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solves_work)); 2009566063dSJacob Faibussowitsch PetscCall(PetscFree(a->mult_work)); 2019566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 2029566063dSJacob Faibussowitsch if (a->free_jshort) PetscCall(PetscFree(a->jshort)); 2039566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inew)); 2049566063dSJacob Faibussowitsch PetscCall(MatDestroy(&a->parent)); 2059566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 206901853e0SKris Buschelman 2079566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 2082e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJGetArray_C", NULL)); 2092e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJRestoreArray_C", NULL)); 2109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 2119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 2129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetColumnIndices_C", NULL)); 2139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqaij_C", NULL)); 2149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqbaij_C", NULL)); 2159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocation_C", NULL)); 2169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocationCSR_C", NULL)); 2176214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_elemental_C", NULL)); 2196214f412SHong Zhang #endif 220d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 2219566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_scalapack_C", NULL)); 222d24d4204SJose E. Roman #endif 2232e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 2243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22549b5e25fSSatish Balay } 22649b5e25fSSatish Balay 227ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetOption_SeqSBAIJ(Mat A, MatOption op, PetscBool flg) 228d71ae5a4SJacob Faibussowitsch { 229045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 230eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 231eb1ec7c1SStefano Zampini PetscInt bs; 232eb1ec7c1SStefano Zampini #endif 23349b5e25fSSatish Balay 23449b5e25fSSatish Balay PetscFunctionBegin; 235eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 2369566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 237eb1ec7c1SStefano Zampini #endif 2384d9d31abSKris Buschelman switch (op) { 239d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 240d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 241d71ae5a4SJacob Faibussowitsch break; 242d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 243d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 244d71ae5a4SJacob Faibussowitsch break; 245d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 246d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 247d71ae5a4SJacob Faibussowitsch break; 248d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 249d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 250d71ae5a4SJacob Faibussowitsch break; 251d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 252d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 253d71ae5a4SJacob Faibussowitsch break; 254d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 255d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 256d71ae5a4SJacob Faibussowitsch break; 2578c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 2584d9d31abSKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 2594d9d31abSKris Buschelman case MAT_USE_HASH_TABLE: 260d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 261d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 262d71ae5a4SJacob Faibussowitsch break; 2639a4540c5SBarry Smith case MAT_HERMITIAN: 264eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 265eb1ec7c1SStefano Zampini if (flg) { /* disable transpose ops */ 26608401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for Hermitian with block size greater than 1"); 267eb1ec7c1SStefano Zampini A->ops->multtranspose = NULL; 268eb1ec7c1SStefano Zampini A->ops->multtransposeadd = NULL; 269b94d7dedSBarry Smith A->symmetric = PETSC_BOOL3_FALSE; 270eb1ec7c1SStefano Zampini } 2710f2140c7SStefano Zampini #endif 272eeffb40dSHong Zhang break; 27377e54ba9SKris Buschelman case MAT_SYMMETRIC: 274eb1ec7c1SStefano Zampini case MAT_SPD: 275eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 276eb1ec7c1SStefano Zampini if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */ 277eb1ec7c1SStefano Zampini A->ops->multtranspose = A->ops->mult; 278eb1ec7c1SStefano Zampini A->ops->multtransposeadd = A->ops->multadd; 279eb1ec7c1SStefano Zampini } 280eb1ec7c1SStefano Zampini #endif 281eb1ec7c1SStefano Zampini break; 282eb1ec7c1SStefano Zampini /* These options are handled directly by MatSetOption() */ 28377e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 2849a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 285b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 286672ba085SHong Zhang case MAT_STRUCTURE_ONLY: 287b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 2884dcd73b1SHong Zhang /* These options are handled directly by MatSetOption() */ 289290bbb0aSBarry Smith break; 290d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_LOWER_TRIANGULAR: 291d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 292d71ae5a4SJacob Faibussowitsch break; 293d71ae5a4SJacob Faibussowitsch case MAT_ERROR_LOWER_TRIANGULAR: 294d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 295d71ae5a4SJacob Faibussowitsch break; 296d71ae5a4SJacob Faibussowitsch case MAT_GETROW_UPPERTRIANGULAR: 297d71ae5a4SJacob Faibussowitsch a->getrow_utriangular = flg; 298d71ae5a4SJacob Faibussowitsch break; 299d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 300d71ae5a4SJacob Faibussowitsch break; 301d71ae5a4SJacob Faibussowitsch default: 302d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 30349b5e25fSSatish Balay } 3043ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 30549b5e25fSSatish Balay } 30649b5e25fSSatish Balay 307d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 308d71ae5a4SJacob Faibussowitsch { 30949b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 31049b5e25fSSatish Balay 31149b5e25fSSatish Balay PetscFunctionBegin; 31208401ef6SPierre Jolivet PetscCheck(!A || a->getrow_utriangular, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatGetRow is not supported for SBAIJ matrix format. Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()"); 31352768537SHong Zhang 314f5edf698SHong Zhang /* Get the upper triangular part of the row */ 3159566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqBAIJ_private(A, row, nz, idx, v, a->i, a->j, a->a)); 3163ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 31749b5e25fSSatish Balay } 31849b5e25fSSatish Balay 319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 320d71ae5a4SJacob Faibussowitsch { 32149b5e25fSSatish Balay PetscFunctionBegin; 322cb4a9cd9SHong Zhang if (nz) *nz = 0; 3239566063dSJacob Faibussowitsch if (idx) PetscCall(PetscFree(*idx)); 3249566063dSJacob Faibussowitsch if (v) PetscCall(PetscFree(*v)); 3253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 32649b5e25fSSatish Balay } 32749b5e25fSSatish Balay 328ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A) 329d71ae5a4SJacob Faibussowitsch { 330f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 331f5edf698SHong Zhang 332f5edf698SHong Zhang PetscFunctionBegin; 333f5edf698SHong Zhang a->getrow_utriangular = PETSC_TRUE; 3343ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 335f5edf698SHong Zhang } 336a323099bSStefano Zampini 337ba38deedSJacob Faibussowitsch static PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A) 338d71ae5a4SJacob Faibussowitsch { 339f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 340f5edf698SHong Zhang 341f5edf698SHong Zhang PetscFunctionBegin; 342f5edf698SHong Zhang a->getrow_utriangular = PETSC_FALSE; 3433ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 344f5edf698SHong Zhang } 345f5edf698SHong Zhang 346ba38deedSJacob Faibussowitsch static PetscErrorCode MatTranspose_SeqSBAIJ(Mat A, MatReuse reuse, Mat *B) 347d71ae5a4SJacob Faibussowitsch { 34849b5e25fSSatish Balay PetscFunctionBegin; 3497fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 350cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 3519566063dSJacob Faibussowitsch PetscCall(MatDuplicate(A, MAT_COPY_VALUES, B)); 352cf37664fSBarry Smith } else if (reuse == MAT_REUSE_MATRIX) { 3539566063dSJacob Faibussowitsch PetscCall(MatCopy(A, *B, SAME_NONZERO_PATTERN)); 354fc4dec0aSBarry Smith } 3553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 35649b5e25fSSatish Balay } 35749b5e25fSSatish Balay 358ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A, PetscViewer viewer) 359d71ae5a4SJacob Faibussowitsch { 36049b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 361d0f46423SBarry Smith PetscInt i, j, bs = A->rmap->bs, k, l, bs2 = a->bs2; 362f3ef73ceSBarry Smith PetscViewerFormat format; 363121deb67SSatish Balay PetscInt *diag; 364b3a0534dSBarry Smith const char *matname; 36549b5e25fSSatish Balay 36649b5e25fSSatish Balay PetscFunctionBegin; 3679566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 368456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 3699566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " block size is %" PetscInt_FMT "\n", bs)); 370fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_MATLAB) { 371d2507d54SMatthew Knepley Mat aij; 372ade3a672SBarry Smith 373d5f3da31SBarry Smith if (A->factortype && bs > 1) { 3749566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "Warning: matrix is factored with bs>1. MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n")); 3753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 37670d5e725SHong Zhang } 3779566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &aij)); 37823a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 37923a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)aij, matname)); 38023a3927dSBarry Smith PetscCall(MatView_SeqAIJ(aij, viewer)); 3819566063dSJacob Faibussowitsch PetscCall(MatDestroy(&aij)); 382fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 383b3a0534dSBarry Smith Mat B; 384b3a0534dSBarry Smith 385b3a0534dSBarry Smith PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 386b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 387b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 388b3a0534dSBarry Smith PetscCall(MatView_SeqAIJ(B, viewer)); 389b3a0534dSBarry Smith PetscCall(MatDestroy(&B)); 390c1490034SHong Zhang } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) { 3913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 39249b5e25fSSatish Balay } else { 3939566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 3942c990fa1SHong Zhang if (A->factortype) { /* for factored matrix */ 39508401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "matrix is factored with bs>1. Not implemented yet"); 3962c990fa1SHong Zhang 397121deb67SSatish Balay diag = a->diag; 398121deb67SSatish Balay for (i = 0; i < a->mbs; i++) { /* for row block i */ 3999566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 4002c990fa1SHong Zhang /* diagonal entry */ 4012c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 4022c990fa1SHong Zhang if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) { 4039566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), (double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 4042c990fa1SHong Zhang } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) { 4059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), -(double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 4062c990fa1SHong Zhang } else { 4079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]))); 4082c990fa1SHong Zhang } 4092c990fa1SHong Zhang #else 4109566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)(1.0 / a->a[diag[i]]))); 4112c990fa1SHong Zhang #endif 4122c990fa1SHong Zhang /* off-diagonal entries */ 4132c990fa1SHong Zhang for (k = a->i[i]; k < a->i[i + 1] - 1; k++) { 4142c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 415ca0704adSBarry Smith if (PetscImaginaryPart(a->a[k]) > 0.0) { 4169566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), (double)PetscImaginaryPart(a->a[k]))); 417ca0704adSBarry Smith } else if (PetscImaginaryPart(a->a[k]) < 0.0) { 4189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), -(double)PetscImaginaryPart(a->a[k]))); 4192c990fa1SHong Zhang } else { 4209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k], (double)PetscRealPart(a->a[k]))); 4212c990fa1SHong Zhang } 4222c990fa1SHong Zhang #else 4239566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[k], (double)a->a[k])); 4242c990fa1SHong Zhang #endif 4252c990fa1SHong Zhang } 4269566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 4272c990fa1SHong Zhang } 4282c990fa1SHong Zhang 4292c990fa1SHong Zhang } else { /* for non-factored matrix */ 4300c74a584SJed Brown for (i = 0; i < a->mbs; i++) { /* for row block i */ 4310c74a584SJed Brown for (j = 0; j < bs; j++) { /* for row bs*i + j */ 4329566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i * bs + j)); 4330c74a584SJed Brown for (k = a->i[i]; k < a->i[i + 1]; k++) { /* for column block */ 4340c74a584SJed Brown for (l = 0; l < bs; l++) { /* for column */ 43549b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 43649b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) > 0.0) { 4379371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), (double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 43849b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) < 0.0) { 4399371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), -(double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 44049b5e25fSSatish Balay } else { 4419566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]))); 44249b5e25fSSatish Balay } 44349b5e25fSSatish Balay #else 4449566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)a->a[bs2 * k + l * bs + j])); 44549b5e25fSSatish Balay #endif 44649b5e25fSSatish Balay } 44749b5e25fSSatish Balay } 4489566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 44949b5e25fSSatish Balay } 45049b5e25fSSatish Balay } 4512c990fa1SHong Zhang } 4529566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 45349b5e25fSSatish Balay } 4549566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 4553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45649b5e25fSSatish Balay } 45749b5e25fSSatish Balay 4589804daf3SBarry Smith #include <petscdraw.h> 459d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 460d71ae5a4SJacob Faibussowitsch { 46149b5e25fSSatish Balay Mat A = (Mat)Aa; 46249b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 463d0f46423SBarry Smith PetscInt row, i, j, k, l, mbs = a->mbs, color, bs = A->rmap->bs, bs2 = a->bs2; 46449b5e25fSSatish Balay PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 46549b5e25fSSatish Balay MatScalar *aa; 466b0a32e0cSBarry Smith PetscViewer viewer; 46749b5e25fSSatish Balay 46849b5e25fSSatish Balay PetscFunctionBegin; 4699566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 4709566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 47149b5e25fSSatish Balay 47249b5e25fSSatish Balay /* loop over matrix elements drawing boxes */ 473383922c3SLisandro Dalcin 474d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 4759566063dSJacob Faibussowitsch PetscCall(PetscDrawString(draw, .3 * (xl + xr), .3 * (yl + yr), PETSC_DRAW_BLACK, "symmetric")); 476383922c3SLisandro Dalcin /* Blue for negative, Cyan for zero and Red for positive */ 477b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 47849b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 47949b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4809371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4819371c9d4SSatish Balay y_r = y_l + 1.0; 4829371c9d4SSatish Balay x_l = a->j[j] * bs; 4839371c9d4SSatish Balay x_r = x_l + 1.0; 48449b5e25fSSatish Balay aa = a->a + j * bs2; 48549b5e25fSSatish Balay for (k = 0; k < bs; k++) { 48649b5e25fSSatish Balay for (l = 0; l < bs; l++) { 48749b5e25fSSatish Balay if (PetscRealPart(*aa++) >= 0.) continue; 4889566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 48949b5e25fSSatish Balay } 49049b5e25fSSatish Balay } 49149b5e25fSSatish Balay } 49249b5e25fSSatish Balay } 493b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 49449b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 49549b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4969371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4979371c9d4SSatish Balay y_r = y_l + 1.0; 4989371c9d4SSatish Balay x_l = a->j[j] * bs; 4999371c9d4SSatish Balay x_r = x_l + 1.0; 50049b5e25fSSatish Balay aa = a->a + j * bs2; 50149b5e25fSSatish Balay for (k = 0; k < bs; k++) { 50249b5e25fSSatish Balay for (l = 0; l < bs; l++) { 50349b5e25fSSatish Balay if (PetscRealPart(*aa++) != 0.) continue; 5049566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 50549b5e25fSSatish Balay } 50649b5e25fSSatish Balay } 50749b5e25fSSatish Balay } 50849b5e25fSSatish Balay } 509b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 51049b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 51149b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 5129371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 5139371c9d4SSatish Balay y_r = y_l + 1.0; 5149371c9d4SSatish Balay x_l = a->j[j] * bs; 5159371c9d4SSatish Balay x_r = x_l + 1.0; 51649b5e25fSSatish Balay aa = a->a + j * bs2; 51749b5e25fSSatish Balay for (k = 0; k < bs; k++) { 51849b5e25fSSatish Balay for (l = 0; l < bs; l++) { 51949b5e25fSSatish Balay if (PetscRealPart(*aa++) <= 0.) continue; 5209566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 52149b5e25fSSatish Balay } 52249b5e25fSSatish Balay } 52349b5e25fSSatish Balay } 52449b5e25fSSatish Balay } 525d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 5263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52749b5e25fSSatish Balay } 52849b5e25fSSatish Balay 529d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A, PetscViewer viewer) 530d71ae5a4SJacob Faibussowitsch { 53149b5e25fSSatish Balay PetscReal xl, yl, xr, yr, w, h; 532b0a32e0cSBarry Smith PetscDraw draw; 533ace3abfcSBarry Smith PetscBool isnull; 53449b5e25fSSatish Balay 53549b5e25fSSatish Balay PetscFunctionBegin; 5369566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 5379566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 5383ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 53949b5e25fSSatish Balay 5409371c9d4SSatish Balay xr = A->rmap->N; 5419371c9d4SSatish Balay yr = A->rmap->N; 5429371c9d4SSatish Balay h = yr / 10.0; 5439371c9d4SSatish Balay w = xr / 10.0; 5449371c9d4SSatish Balay xr += w; 5459371c9d4SSatish Balay yr += h; 5469371c9d4SSatish Balay xl = -w; 5479371c9d4SSatish Balay yl = -h; 5489566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 5499566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 5509566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqSBAIJ_Draw_Zoom, A)); 5519566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 5529566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 5533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55449b5e25fSSatish Balay } 55549b5e25fSSatish Balay 556618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */ 557618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary 558618cc2edSLisandro Dalcin 559d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ(Mat A, PetscViewer viewer) 560d71ae5a4SJacob Faibussowitsch { 561618cc2edSLisandro Dalcin PetscBool iascii, isbinary, isdraw; 56249b5e25fSSatish Balay 56349b5e25fSSatish Balay PetscFunctionBegin; 5649566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 5659566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 5669566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 56732077d6dSBarry Smith if (iascii) { 5689566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_ASCII(A, viewer)); 569618cc2edSLisandro Dalcin } else if (isbinary) { 5709566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Binary(A, viewer)); 57149b5e25fSSatish Balay } else if (isdraw) { 5729566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Draw(A, viewer)); 57349b5e25fSSatish Balay } else { 574a5e6ed63SBarry Smith Mat B; 575ade3a672SBarry Smith const char *matname; 5769566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 57723a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 57823a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 5799566063dSJacob Faibussowitsch PetscCall(MatView(B, viewer)); 5809566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 58149b5e25fSSatish Balay } 5823ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 58349b5e25fSSatish Balay } 58449b5e25fSSatish Balay 585d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 586d71ae5a4SJacob Faibussowitsch { 587045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 58813f74950SBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 58913f74950SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 590d0f46423SBarry Smith PetscInt brow, bcol, ridx, cidx, bs = A->rmap->bs, bs2 = a->bs2; 59197e567efSBarry Smith MatScalar *ap, *aa = a->a; 59249b5e25fSSatish Balay 59349b5e25fSSatish Balay PetscFunctionBegin; 59449b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over rows */ 5959371c9d4SSatish Balay row = im[k]; 5969371c9d4SSatish Balay brow = row / bs; 5979371c9d4SSatish Balay if (row < 0) { 5989371c9d4SSatish Balay v += n; 5999371c9d4SSatish Balay continue; 6009371c9d4SSatish Balay } /* negative row */ 60154c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 6029371c9d4SSatish Balay rp = aj + ai[brow]; 6039371c9d4SSatish Balay ap = aa + bs2 * ai[brow]; 60449b5e25fSSatish Balay nrow = ailen[brow]; 60549b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over columns */ 6069371c9d4SSatish Balay if (in[l] < 0) { 6079371c9d4SSatish Balay v++; 6089371c9d4SSatish Balay continue; 6099371c9d4SSatish Balay } /* negative column */ 61054c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 61149b5e25fSSatish Balay col = in[l]; 61249b5e25fSSatish Balay bcol = col / bs; 61349b5e25fSSatish Balay cidx = col % bs; 61449b5e25fSSatish Balay ridx = row % bs; 61549b5e25fSSatish Balay high = nrow; 61649b5e25fSSatish Balay low = 0; /* assume unsorted */ 61749b5e25fSSatish Balay while (high - low > 5) { 61849b5e25fSSatish Balay t = (low + high) / 2; 61949b5e25fSSatish Balay if (rp[t] > bcol) high = t; 62049b5e25fSSatish Balay else low = t; 62149b5e25fSSatish Balay } 62249b5e25fSSatish Balay for (i = low; i < high; i++) { 62349b5e25fSSatish Balay if (rp[i] > bcol) break; 62449b5e25fSSatish Balay if (rp[i] == bcol) { 62549b5e25fSSatish Balay *v++ = ap[bs2 * i + bs * cidx + ridx]; 62649b5e25fSSatish Balay goto finished; 62749b5e25fSSatish Balay } 62849b5e25fSSatish Balay } 62997e567efSBarry Smith *v++ = 0.0; 63049b5e25fSSatish Balay finished:; 63149b5e25fSSatish Balay } 63249b5e25fSSatish Balay } 6333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 63449b5e25fSSatish Balay } 63549b5e25fSSatish Balay 636ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqSBAIJ(Mat A, IS rowp, IS colp, Mat *B) 637d71ae5a4SJacob Faibussowitsch { 638dc29a518SPierre Jolivet Mat C; 639dc29a518SPierre Jolivet 640dc29a518SPierre Jolivet PetscFunctionBegin; 6419566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQBAIJ, MAT_INITIAL_MATRIX, &C)); 6429566063dSJacob Faibussowitsch PetscCall(MatPermute(C, rowp, colp, B)); 6439566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 64448a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatConvert(*B, MATSEQSBAIJ, MAT_INPLACE_MATRIX, B)); 6453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 646dc29a518SPierre Jolivet } 64749b5e25fSSatish Balay 648d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 649d71ae5a4SJacob Faibussowitsch { 6500880e062SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 651e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, jj, row, nrow, i, col, l, rmax, N, lastcol = -1; 65213f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 653d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs2 = a->bs2, bs = A->rmap->bs, stepval; 654ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 655dd6ea824SBarry Smith const PetscScalar *value = v; 656f15d580aSBarry Smith MatScalar *ap, *aa = a->a, *bap; 6570880e062SHong Zhang 65849b5e25fSSatish Balay PetscFunctionBegin; 65926fbe8dcSKarl Rupp if (roworiented) stepval = (n - 1) * bs; 66026fbe8dcSKarl Rupp else stepval = (m - 1) * bs; 66126fbe8dcSKarl Rupp 6620880e062SHong Zhang for (k = 0; k < m; k++) { /* loop over added rows */ 6630880e062SHong Zhang row = im[k]; 6640880e062SHong Zhang if (row < 0) continue; 6656bdcaf15SBarry Smith PetscCheck(row < a->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index row too large %" PetscInt_FMT " max %" PetscInt_FMT, row, a->mbs - 1); 6660880e062SHong Zhang rp = aj + ai[row]; 6670880e062SHong Zhang ap = aa + bs2 * ai[row]; 6680880e062SHong Zhang rmax = imax[row]; 6690880e062SHong Zhang nrow = ailen[row]; 6700880e062SHong Zhang low = 0; 671818f2c47SBarry Smith high = nrow; 6720880e062SHong Zhang for (l = 0; l < n; l++) { /* loop over added columns */ 6730880e062SHong Zhang if (in[l] < 0) continue; 6740880e062SHong Zhang col = in[l]; 6756bdcaf15SBarry Smith PetscCheck(col < a->nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index column too large %" PetscInt_FMT " max %" PetscInt_FMT, col, a->nbs - 1); 676b98bf0e1SJed Brown if (col < row) { 67726fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular block */ 67826fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 679b98bf0e1SJed Brown } 68026fbe8dcSKarl Rupp if (roworiented) value = v + k * (stepval + bs) * bs + l * bs; 68126fbe8dcSKarl Rupp else value = v + l * (stepval + bs) * bs + k * bs; 68226fbe8dcSKarl Rupp 68326fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 68426fbe8dcSKarl Rupp else high = nrow; 68526fbe8dcSKarl Rupp 686e2ee6c50SBarry Smith lastcol = col; 6870880e062SHong Zhang while (high - low > 7) { 6880880e062SHong Zhang t = (low + high) / 2; 6890880e062SHong Zhang if (rp[t] > col) high = t; 6900880e062SHong Zhang else low = t; 6910880e062SHong Zhang } 6920880e062SHong Zhang for (i = low; i < high; i++) { 6930880e062SHong Zhang if (rp[i] > col) break; 6940880e062SHong Zhang if (rp[i] == col) { 6950880e062SHong Zhang bap = ap + bs2 * i; 6960880e062SHong Zhang if (roworiented) { 6970880e062SHong Zhang if (is == ADD_VALUES) { 6980880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 699ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] += *value++; 7000880e062SHong Zhang } 7010880e062SHong Zhang } else { 7020880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 703ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7040880e062SHong Zhang } 7050880e062SHong Zhang } 7060880e062SHong Zhang } else { 7070880e062SHong Zhang if (is == ADD_VALUES) { 7080880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 709ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ += *value++; 7100880e062SHong Zhang } 7110880e062SHong Zhang } else { 7120880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 713ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7140880e062SHong Zhang } 7150880e062SHong Zhang } 7160880e062SHong Zhang } 7170880e062SHong Zhang goto noinsert2; 7180880e062SHong Zhang } 7190880e062SHong Zhang } 7200880e062SHong Zhang if (nonew == 1) goto noinsert2; 72108401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new block index nonzero block (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 722fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 7239371c9d4SSatish Balay N = nrow++ - 1; 7249371c9d4SSatish Balay high++; 7250880e062SHong Zhang /* shift up all the later entries in this row */ 7269566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 7279566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 7289566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 7290880e062SHong Zhang rp[i] = col; 7300880e062SHong Zhang bap = ap + bs2 * i; 7310880e062SHong Zhang if (roworiented) { 7320880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 733ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7340880e062SHong Zhang } 7350880e062SHong Zhang } else { 7360880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 737ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7380880e062SHong Zhang } 7390880e062SHong Zhang } 7400880e062SHong Zhang noinsert2:; 7410880e062SHong Zhang low = i; 7420880e062SHong Zhang } 7430880e062SHong Zhang ailen[row] = nrow; 7440880e062SHong Zhang } 7453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 74649b5e25fSSatish Balay } 74749b5e25fSSatish Balay 748ba38deedSJacob Faibussowitsch static PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A, MatAssemblyType mode) 749d71ae5a4SJacob Faibussowitsch { 75049b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 7518f8f2f0dSBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 752d0f46423SBarry Smith PetscInt m = A->rmap->N, *ip, N, *ailen = a->ilen; 75313f74950SBarry Smith PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 75449b5e25fSSatish Balay MatScalar *aa = a->a, *ap; 75549b5e25fSSatish Balay 75649b5e25fSSatish Balay PetscFunctionBegin; 757d32568d8SPierre Jolivet if (mode == MAT_FLUSH_ASSEMBLY || (A->was_assembled && A->ass_nonzerostate == A->nonzerostate)) PetscFunctionReturn(PETSC_SUCCESS); 75849b5e25fSSatish Balay 75949b5e25fSSatish Balay if (m) rmax = ailen[0]; 76049b5e25fSSatish Balay for (i = 1; i < mbs; i++) { 76149b5e25fSSatish Balay /* move each row back by the amount of empty slots (fshift) before it*/ 76249b5e25fSSatish Balay fshift += imax[i - 1] - ailen[i - 1]; 76349b5e25fSSatish Balay rmax = PetscMax(rmax, ailen[i]); 76449b5e25fSSatish Balay if (fshift) { 765580bdb30SBarry Smith ip = aj + ai[i]; 766580bdb30SBarry Smith ap = aa + bs2 * ai[i]; 76749b5e25fSSatish Balay N = ailen[i]; 7689566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 7699566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2 * N)); 77049b5e25fSSatish Balay } 77149b5e25fSSatish Balay ai[i] = ai[i - 1] + ailen[i - 1]; 77249b5e25fSSatish Balay } 77349b5e25fSSatish Balay if (mbs) { 77449b5e25fSSatish Balay fshift += imax[mbs - 1] - ailen[mbs - 1]; 77549b5e25fSSatish Balay ai[mbs] = ai[mbs - 1] + ailen[mbs - 1]; 77649b5e25fSSatish Balay } 77749b5e25fSSatish Balay /* reset ilen and imax for each row */ 778ad540459SPierre Jolivet for (i = 0; i < mbs; i++) ailen[i] = imax[i] = ai[i + 1] - ai[i]; 7796c6c5352SBarry Smith a->nz = ai[mbs]; 78049b5e25fSSatish Balay 781b424e231SHong Zhang /* diagonals may have moved, reset it */ 7821baa6e33SBarry Smith if (a->diag) PetscCall(PetscArraycpy(a->diag, ai, mbs)); 783aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT " block size %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, A->rmap->bs, fshift * bs2); 78426fbe8dcSKarl Rupp 7859566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT ", block size %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->rmap->N, A->rmap->bs, fshift * bs2, a->nz * bs2)); 7869566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues is %" PetscInt_FMT "\n", a->reallocs)); 7879566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Most nonzeros blocks in any row is %" PetscInt_FMT "\n", rmax)); 78826fbe8dcSKarl Rupp 7898e58a170SBarry Smith A->info.mallocs += a->reallocs; 79049b5e25fSSatish Balay a->reallocs = 0; 79149b5e25fSSatish Balay A->info.nz_unneeded = (PetscReal)fshift * bs2; 792061b2667SBarry Smith a->idiagvalid = PETSC_FALSE; 7934dcd73b1SHong Zhang a->rmax = rmax; 79438702af4SBarry Smith 79538702af4SBarry Smith if (A->cmap->n < 65536 && A->cmap->bs == 1) { 79644e1c64aSLisandro Dalcin if (a->jshort && a->free_jshort) { 79717803ae8SHong Zhang /* when matrix data structure is changed, previous jshort must be replaced */ 7989566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jshort)); 79917803ae8SHong Zhang } 8009566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->i[A->rmap->n], &a->jshort)); 80138702af4SBarry Smith for (i = 0; i < a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i]; 80238702af4SBarry Smith A->ops->mult = MatMult_SeqSBAIJ_1_ushort; 80341f059aeSBarry Smith A->ops->sor = MatSOR_SeqSBAIJ_ushort; 8044da8f245SBarry Smith a->free_jshort = PETSC_TRUE; 80538702af4SBarry Smith } 8063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 80749b5e25fSSatish Balay } 80849b5e25fSSatish Balay 80949b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks). 810da81f932SPierre Jolivet Any a(i,j) with i>j input by user is ignored. 81149b5e25fSSatish Balay */ 81249b5e25fSSatish Balay 813d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 814d71ae5a4SJacob Faibussowitsch { 81549b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 816e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N, lastcol = -1; 81713f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen, roworiented = a->roworiented; 818d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs = A->rmap->bs, brow, bcol; 81913f74950SBarry Smith PetscInt ridx, cidx, bs2 = a->bs2; 82049b5e25fSSatish Balay MatScalar *ap, value, *aa = a->a, *bap; 82149b5e25fSSatish Balay 82249b5e25fSSatish Balay PetscFunctionBegin; 82349b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over added rows */ 82449b5e25fSSatish Balay row = im[k]; /* row number */ 82549b5e25fSSatish Balay brow = row / bs; /* block row number */ 82649b5e25fSSatish Balay if (row < 0) continue; 8276bdcaf15SBarry Smith PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 82849b5e25fSSatish Balay rp = aj + ai[brow]; /*ptr to beginning of column value of the row block*/ 82949b5e25fSSatish Balay ap = aa + bs2 * ai[brow]; /*ptr to beginning of element value of the row block*/ 83049b5e25fSSatish Balay rmax = imax[brow]; /* maximum space allocated for this row */ 83149b5e25fSSatish Balay nrow = ailen[brow]; /* actual length of this row */ 83249b5e25fSSatish Balay low = 0; 8338509e838SStefano Zampini high = nrow; 83449b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over added columns */ 83549b5e25fSSatish Balay if (in[l] < 0) continue; 8366bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->N - 1); 83749b5e25fSSatish Balay col = in[l]; 83849b5e25fSSatish Balay bcol = col / bs; /* block col number */ 83949b5e25fSSatish Balay 840941593c8SHong Zhang if (brow > bcol) { 84126fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular values */ 84226fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 843941593c8SHong Zhang } 844f4989cb3SHong Zhang 8459371c9d4SSatish Balay ridx = row % bs; 8469371c9d4SSatish Balay cidx = col % bs; /*row and col index inside the block */ 8478549e402SHong Zhang if ((brow == bcol && ridx <= cidx) || (brow < bcol)) { 84849b5e25fSSatish Balay /* element value a(k,l) */ 84926fbe8dcSKarl Rupp if (roworiented) value = v[l + k * n]; 85026fbe8dcSKarl Rupp else value = v[k + l * m]; 85149b5e25fSSatish Balay 85249b5e25fSSatish Balay /* move pointer bap to a(k,l) quickly and add/insert value */ 85326fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 8548509e838SStefano Zampini else high = nrow; 8558509e838SStefano Zampini 856e2ee6c50SBarry Smith lastcol = col; 85749b5e25fSSatish Balay while (high - low > 7) { 85849b5e25fSSatish Balay t = (low + high) / 2; 85949b5e25fSSatish Balay if (rp[t] > bcol) high = t; 86049b5e25fSSatish Balay else low = t; 86149b5e25fSSatish Balay } 86249b5e25fSSatish Balay for (i = low; i < high; i++) { 86349b5e25fSSatish Balay if (rp[i] > bcol) break; 86449b5e25fSSatish Balay if (rp[i] == bcol) { 86549b5e25fSSatish Balay bap = ap + bs2 * i + bs * cidx + ridx; 86649b5e25fSSatish Balay if (is == ADD_VALUES) *bap += value; 86749b5e25fSSatish Balay else *bap = value; 8688549e402SHong Zhang /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 8698549e402SHong Zhang if (brow == bcol && ridx < cidx) { 8708549e402SHong Zhang bap = ap + bs2 * i + bs * ridx + cidx; 8718549e402SHong Zhang if (is == ADD_VALUES) *bap += value; 8728549e402SHong Zhang else *bap = value; 8738549e402SHong Zhang } 87449b5e25fSSatish Balay goto noinsert1; 87549b5e25fSSatish Balay } 87649b5e25fSSatish Balay } 87749b5e25fSSatish Balay 87849b5e25fSSatish Balay if (nonew == 1) goto noinsert1; 87908401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 880fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, brow, bcol, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 88149b5e25fSSatish Balay 8829371c9d4SSatish Balay N = nrow++ - 1; 8839371c9d4SSatish Balay high++; 88449b5e25fSSatish Balay /* shift up all the later entries in this row */ 8859566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 8869566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 8879566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 88849b5e25fSSatish Balay rp[i] = bcol; 88949b5e25fSSatish Balay ap[bs2 * i + bs * cidx + ridx] = value; 8908509e838SStefano Zampini /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 891ad540459SPierre Jolivet if (brow == bcol && ridx < cidx) ap[bs2 * i + bs * ridx + cidx] = value; 892e56f5c9eSBarry Smith A->nonzerostate++; 89349b5e25fSSatish Balay noinsert1:; 89449b5e25fSSatish Balay low = i; 8958549e402SHong Zhang } 89649b5e25fSSatish Balay } /* end of loop over added columns */ 89749b5e25fSSatish Balay ailen[brow] = nrow; 89849b5e25fSSatish Balay } /* end of loop over added rows */ 8993ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 90049b5e25fSSatish Balay } 90149b5e25fSSatish Balay 902ba38deedSJacob Faibussowitsch static PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA, IS row, const MatFactorInfo *info) 903d71ae5a4SJacob Faibussowitsch { 9044ccecd49SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)inA->data; 90549b5e25fSSatish Balay Mat outA; 906ace3abfcSBarry Smith PetscBool row_identity; 90749b5e25fSSatish Balay 90849b5e25fSSatish Balay PetscFunctionBegin; 90908401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 is supported for in-place icc"); 9109566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 91128b400f6SJacob Faibussowitsch PetscCheck(row_identity, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix reordering is not supported"); 91208401ef6SPierre Jolivet PetscCheck(inA->rmap->bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix block size %" PetscInt_FMT " is not supported", inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! */ 913c84f5b01SHong Zhang 91449b5e25fSSatish Balay outA = inA; 915d5f3da31SBarry Smith inA->factortype = MAT_FACTOR_ICC; 9169566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 9179566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 91849b5e25fSSatish Balay 9199566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(inA)); 9209566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetNumericFactorization_inplace(inA, row_identity)); 92149b5e25fSSatish Balay 9229566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 9239566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 924c84f5b01SHong Zhang a->row = row; 9259566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 9269566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 927c84f5b01SHong Zhang a->col = row; 928c84f5b01SHong Zhang 929c84f5b01SHong Zhang /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */ 9309566063dSJacob Faibussowitsch if (a->icol) PetscCall(ISInvertPermutation(row, PETSC_DECIDE, &a->icol)); 93149b5e25fSSatish Balay 932aa624791SPierre Jolivet if (!a->solve_work) PetscCall(PetscMalloc1(inA->rmap->N + inA->rmap->bs, &a->solve_work)); 93349b5e25fSSatish Balay 9349566063dSJacob Faibussowitsch PetscCall(MatCholeskyFactorNumeric(outA, inA, info)); 9353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 93649b5e25fSSatish Balay } 937950f1e5bSHong Zhang 938ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat, PetscInt *indices) 939d71ae5a4SJacob Faibussowitsch { 940045c9aa0SHong Zhang Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)mat->data; 94113f74950SBarry Smith PetscInt i, nz, n; 94249b5e25fSSatish Balay 94349b5e25fSSatish Balay PetscFunctionBegin; 9446c6c5352SBarry Smith nz = baij->maxnz; 945d0f46423SBarry Smith n = mat->cmap->n; 94626fbe8dcSKarl Rupp for (i = 0; i < nz; i++) baij->j[i] = indices[i]; 94726fbe8dcSKarl Rupp 9486c6c5352SBarry Smith baij->nz = nz; 94926fbe8dcSKarl Rupp for (i = 0; i < n; i++) baij->ilen[i] = baij->imax[i]; 95026fbe8dcSKarl Rupp 9519566063dSJacob Faibussowitsch PetscCall(MatSetOption(mat, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 9523ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 95349b5e25fSSatish Balay } 95449b5e25fSSatish Balay 95549b5e25fSSatish Balay /*@ 95619585528SSatish Balay MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows 95711a5261eSBarry Smith in a `MATSEQSBAIJ` matrix. 95849b5e25fSSatish Balay 95949b5e25fSSatish Balay Input Parameters: 96011a5261eSBarry Smith + mat - the `MATSEQSBAIJ` matrix 96149b5e25fSSatish Balay - indices - the column indices 96249b5e25fSSatish Balay 96349b5e25fSSatish Balay Level: advanced 96449b5e25fSSatish Balay 96549b5e25fSSatish Balay Notes: 96649b5e25fSSatish Balay This can be called if you have precomputed the nonzero structure of the 96749b5e25fSSatish Balay matrix and want to provide it to the matrix object to improve the performance 96811a5261eSBarry Smith of the `MatSetValues()` operation. 96949b5e25fSSatish Balay 97049b5e25fSSatish Balay You MUST have set the correct numbers of nonzeros per row in the call to 97111a5261eSBarry Smith `MatCreateSeqSBAIJ()`, and the columns indices MUST be sorted. 97249b5e25fSSatish Balay 9732ef1f0ffSBarry Smith MUST be called before any calls to `MatSetValues()` 97449b5e25fSSatish Balay 9751cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ` 97649b5e25fSSatish Balay @*/ 977d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat, PetscInt *indices) 978d71ae5a4SJacob Faibussowitsch { 97949b5e25fSSatish Balay PetscFunctionBegin; 9800700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 9814f572ea9SToby Isaac PetscAssertPointer(indices, 2); 982cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqSBAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 9833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 98449b5e25fSSatish Balay } 98549b5e25fSSatish Balay 986ba38deedSJacob Faibussowitsch static PetscErrorCode MatCopy_SeqSBAIJ(Mat A, Mat B, MatStructure str) 987d71ae5a4SJacob Faibussowitsch { 9884c7a3774SStefano Zampini PetscBool isbaij; 9893c896bc6SHong Zhang 9903c896bc6SHong Zhang PetscFunctionBegin; 9919566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &isbaij, MATSEQSBAIJ, MATMPISBAIJ, "")); 99228b400f6SJacob Faibussowitsch PetscCheck(isbaij, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Not for matrix type %s", ((PetscObject)B)->type_name); 9934c7a3774SStefano Zampini /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. */ 9944c7a3774SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 9953c896bc6SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 9963c896bc6SHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 9973c896bc6SHong Zhang 99808401ef6SPierre Jolivet PetscCheck(a->i[a->mbs] == b->i[b->mbs], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different"); 99908401ef6SPierre Jolivet PetscCheck(a->mbs == b->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of rows in two matrices are different"); 100008401ef6SPierre Jolivet PetscCheck(a->bs2 == b->bs2, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different block size"); 10019566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, a->a, a->bs2 * a->i[a->mbs])); 10029566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 10033c896bc6SHong Zhang } else { 10049566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(A)); 10059566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 10069566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(A)); 10073c896bc6SHong Zhang } 10083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10093c896bc6SHong Zhang } 10103c896bc6SHong Zhang 1011d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1012d71ae5a4SJacob Faibussowitsch { 1013a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 10145fd66863SKarl Rupp 1015a6ece127SHong Zhang PetscFunctionBegin; 1016a6ece127SHong Zhang *array = a->a; 10173ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1018a6ece127SHong Zhang } 1019a6ece127SHong Zhang 1020d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1021d71ae5a4SJacob Faibussowitsch { 1022a6ece127SHong Zhang PetscFunctionBegin; 1023cda14afcSprj- *array = NULL; 10243ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1025a6ece127SHong Zhang } 1026a6ece127SHong Zhang 1027d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y, Mat X, PetscInt *nnz) 1028d71ae5a4SJacob Faibussowitsch { 1029b264fe52SHong Zhang PetscInt bs = Y->rmap->bs, mbs = Y->rmap->N / bs; 103052768537SHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data; 103152768537SHong Zhang Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ *)Y->data; 103252768537SHong Zhang 103352768537SHong Zhang PetscFunctionBegin; 103452768537SHong Zhang /* Set the number of nonzeros in the new matrix */ 10359566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(mbs, x->i, x->j, y->i, y->j, nnz)); 10363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 103752768537SHong Zhang } 103852768537SHong Zhang 1039ba38deedSJacob Faibussowitsch static PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 1040d71ae5a4SJacob Faibussowitsch { 104142ee4b1aSHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data, *y = (Mat_SeqSBAIJ *)Y->data; 104231ce2d13SHong Zhang PetscInt bs = Y->rmap->bs, bs2 = bs * bs; 1043e838b9e7SJed Brown PetscBLASInt one = 1; 104442ee4b1aSHong Zhang 104542ee4b1aSHong Zhang PetscFunctionBegin; 1046134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 1047134adf20SPierre Jolivet PetscBool e = x->nz == y->nz && x->mbs == y->mbs ? PETSC_TRUE : PETSC_FALSE; 1048134adf20SPierre Jolivet if (e) { 10499566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, x->mbs + 1, &e)); 1050134adf20SPierre Jolivet if (e) { 10519566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, x->i[x->mbs], &e)); 1052134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 1053134adf20SPierre Jolivet } 1054134adf20SPierre Jolivet } 105554c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 1056134adf20SPierre Jolivet } 105742ee4b1aSHong Zhang if (str == SAME_NONZERO_PATTERN) { 1058f4df32b1SMatthew Knepley PetscScalar alpha = a; 1059c5df96a5SBarry Smith PetscBLASInt bnz; 10609566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz * bs2, &bnz)); 1061792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, x->a, &one, y->a, &one)); 10629566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 1063ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 10649566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_TRUE)); 10659566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 10669566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_FALSE)); 106742ee4b1aSHong Zhang } else { 106852768537SHong Zhang Mat B; 106952768537SHong Zhang PetscInt *nnz; 107054c59aa7SJacob Faibussowitsch PetscCheck(bs == X->rmap->bs, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Matrices must have same block size"); 10719566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(X)); 10729566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(Y)); 10739566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 10749566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 10759566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 10769566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, Y->rmap->n, Y->cmap->n, Y->rmap->N, Y->cmap->N)); 10779566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, Y, Y)); 10789566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 10799566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqSBAIJ(Y, X, nnz)); 10809566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 108152768537SHong Zhang 10829566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 108352768537SHong Zhang 10849566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 10859566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 10869566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(X)); 10879566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(Y)); 108842ee4b1aSHong Zhang } 10893ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 109042ee4b1aSHong Zhang } 109142ee4b1aSHong Zhang 1092ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1093d71ae5a4SJacob Faibussowitsch { 1094efcf0fc3SBarry Smith PetscFunctionBegin; 1095efcf0fc3SBarry Smith *flg = PETSC_TRUE; 10963ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1097efcf0fc3SBarry Smith } 1098efcf0fc3SBarry Smith 1099ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A, PetscBool *flg) 1100d71ae5a4SJacob Faibussowitsch { 1101efcf0fc3SBarry Smith PetscFunctionBegin; 1102efcf0fc3SBarry Smith *flg = PETSC_TRUE; 11033ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1104efcf0fc3SBarry Smith } 1105efcf0fc3SBarry Smith 1106ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1107d71ae5a4SJacob Faibussowitsch { 1108efcf0fc3SBarry Smith PetscFunctionBegin; 1109efcf0fc3SBarry Smith *flg = PETSC_FALSE; 11103ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1111efcf0fc3SBarry Smith } 1112efcf0fc3SBarry Smith 1113ba38deedSJacob Faibussowitsch static PetscErrorCode MatConjugate_SeqSBAIJ(Mat A) 1114d71ae5a4SJacob Faibussowitsch { 11152726fb6dSPierre Jolivet #if defined(PETSC_USE_COMPLEX) 11162726fb6dSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11172726fb6dSPierre Jolivet PetscInt i, nz = a->bs2 * a->i[a->mbs]; 11182726fb6dSPierre Jolivet MatScalar *aa = a->a; 11192726fb6dSPierre Jolivet 11202726fb6dSPierre Jolivet PetscFunctionBegin; 11212726fb6dSPierre Jolivet for (i = 0; i < nz; i++) aa[i] = PetscConj(aa[i]); 11222726fb6dSPierre Jolivet #else 11232726fb6dSPierre Jolivet PetscFunctionBegin; 11242726fb6dSPierre Jolivet #endif 11253ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11262726fb6dSPierre Jolivet } 11272726fb6dSPierre Jolivet 1128ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqSBAIJ(Mat A) 1129d71ae5a4SJacob Faibussowitsch { 113099cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 113199cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1132dd6ea824SBarry Smith MatScalar *aa = a->a; 113399cafbc1SBarry Smith 113499cafbc1SBarry Smith PetscFunctionBegin; 113599cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 113799cafbc1SBarry Smith } 113899cafbc1SBarry Smith 1139ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A) 1140d71ae5a4SJacob Faibussowitsch { 114199cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 114299cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1143dd6ea824SBarry Smith MatScalar *aa = a->a; 114499cafbc1SBarry Smith 114599cafbc1SBarry Smith PetscFunctionBegin; 114699cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 114899cafbc1SBarry Smith } 114999cafbc1SBarry Smith 1150ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A, PetscInt is_n, const PetscInt is_idx[], PetscScalar diag, Vec x, Vec b) 1151d71ae5a4SJacob Faibussowitsch { 11523bededecSBarry Smith Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)A->data; 11533bededecSBarry Smith PetscInt i, j, k, count; 11543bededecSBarry Smith PetscInt bs = A->rmap->bs, bs2 = baij->bs2, row, col; 11553bededecSBarry Smith PetscScalar zero = 0.0; 11563bededecSBarry Smith MatScalar *aa; 11573bededecSBarry Smith const PetscScalar *xx; 11583bededecSBarry Smith PetscScalar *bb; 115956777dd2SBarry Smith PetscBool *zeroed, vecs = PETSC_FALSE; 11603bededecSBarry Smith 11613bededecSBarry Smith PetscFunctionBegin; 11623bededecSBarry Smith /* fix right hand side if needed */ 11633bededecSBarry Smith if (x && b) { 11649566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 11659566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 116656777dd2SBarry Smith vecs = PETSC_TRUE; 11673bededecSBarry Smith } 11683bededecSBarry Smith 11693bededecSBarry Smith /* zero the columns */ 11709566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 11713bededecSBarry Smith for (i = 0; i < is_n; i++) { 1172aed4548fSBarry Smith PetscCheck(is_idx[i] >= 0 && is_idx[i] < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", is_idx[i]); 11733bededecSBarry Smith zeroed[is_idx[i]] = PETSC_TRUE; 11743bededecSBarry Smith } 117556777dd2SBarry Smith if (vecs) { 117656777dd2SBarry Smith for (i = 0; i < A->rmap->N; i++) { 117756777dd2SBarry Smith row = i / bs; 117856777dd2SBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 117956777dd2SBarry Smith for (k = 0; k < bs; k++) { 118056777dd2SBarry Smith col = bs * baij->j[j] + k; 118156777dd2SBarry Smith if (col <= i) continue; 118256777dd2SBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 118326fbe8dcSKarl Rupp if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0] * xx[col]; 118426fbe8dcSKarl Rupp if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0] * xx[i]; 118556777dd2SBarry Smith } 118656777dd2SBarry Smith } 118756777dd2SBarry Smith } 118826fbe8dcSKarl Rupp for (i = 0; i < is_n; i++) bb[is_idx[i]] = diag * xx[is_idx[i]]; 118956777dd2SBarry Smith } 119056777dd2SBarry Smith 11913bededecSBarry Smith for (i = 0; i < A->rmap->N; i++) { 11923bededecSBarry Smith if (!zeroed[i]) { 11933bededecSBarry Smith row = i / bs; 11943bededecSBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 11953bededecSBarry Smith for (k = 0; k < bs; k++) { 11963bededecSBarry Smith col = bs * baij->j[j] + k; 11973bededecSBarry Smith if (zeroed[col]) { 11983bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 11993bededecSBarry Smith aa[0] = 0.0; 12003bededecSBarry Smith } 12013bededecSBarry Smith } 12023bededecSBarry Smith } 12033bededecSBarry Smith } 12043bededecSBarry Smith } 12059566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 120656777dd2SBarry Smith if (vecs) { 12079566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 12089566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 120956777dd2SBarry Smith } 12103bededecSBarry Smith 12113bededecSBarry Smith /* zero the rows */ 12123bededecSBarry Smith for (i = 0; i < is_n; i++) { 12133bededecSBarry Smith row = is_idx[i]; 12143bededecSBarry Smith count = (baij->i[row / bs + 1] - baij->i[row / bs]) * bs; 12153bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + baij->i[row / bs] * bs2 + (row % bs); 12163bededecSBarry Smith for (k = 0; k < count; k++) { 12173bededecSBarry Smith aa[0] = zero; 12183bededecSBarry Smith aa += bs; 12193bededecSBarry Smith } 1220dbbe0bcdSBarry Smith if (diag != 0.0) PetscUseTypeMethod(A, setvalues, 1, &row, 1, &row, &diag, INSERT_VALUES); 12213bededecSBarry Smith } 12229566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqSBAIJ(A, MAT_FINAL_ASSEMBLY)); 12233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12243bededecSBarry Smith } 12253bededecSBarry Smith 1226ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqSBAIJ(Mat Y, PetscScalar a) 1227d71ae5a4SJacob Faibussowitsch { 12287d68702bSBarry Smith Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)Y->data; 12297d68702bSBarry Smith 12307d68702bSBarry Smith PetscFunctionBegin; 123148a46eb9SPierre Jolivet if (!Y->preallocated || !aij->nz) PetscCall(MatSeqSBAIJSetPreallocation(Y, Y->rmap->bs, 1, NULL)); 12329566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(Y, a)); 12333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12347d68702bSBarry Smith } 12357d68702bSBarry Smith 123617ea310bSPierre Jolivet PetscErrorCode MatEliminateZeros_SeqSBAIJ(Mat A, PetscBool keep) 123717ea310bSPierre Jolivet { 123817ea310bSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 123917ea310bSPierre Jolivet PetscInt fshift = 0, fshift_prev = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax, j, k; 124017ea310bSPierre Jolivet PetscInt m = A->rmap->N, *ailen = a->ilen; 124117ea310bSPierre Jolivet PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 124217ea310bSPierre Jolivet MatScalar *aa = a->a, *ap; 124317ea310bSPierre Jolivet PetscBool zero; 124417ea310bSPierre Jolivet 124517ea310bSPierre Jolivet PetscFunctionBegin; 124617ea310bSPierre Jolivet PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix"); 124717ea310bSPierre Jolivet if (m) rmax = ailen[0]; 124817ea310bSPierre Jolivet for (i = 1; i <= mbs; i++) { 124917ea310bSPierre Jolivet for (k = ai[i - 1]; k < ai[i]; k++) { 125017ea310bSPierre Jolivet zero = PETSC_TRUE; 125117ea310bSPierre Jolivet ap = aa + bs2 * k; 125217ea310bSPierre Jolivet for (j = 0; j < bs2 && zero; j++) { 125317ea310bSPierre Jolivet if (ap[j] != 0.0) zero = PETSC_FALSE; 125417ea310bSPierre Jolivet } 125517ea310bSPierre Jolivet if (zero && (aj[k] != i - 1 || !keep)) fshift++; 125617ea310bSPierre Jolivet else { 125717ea310bSPierre Jolivet if (zero && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal block at row %" PetscInt_FMT "\n", i - 1)); 125817ea310bSPierre Jolivet aj[k - fshift] = aj[k]; 125917ea310bSPierre Jolivet PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2)); 126017ea310bSPierre Jolivet } 126117ea310bSPierre Jolivet } 126217ea310bSPierre Jolivet ai[i - 1] -= fshift_prev; 126317ea310bSPierre Jolivet fshift_prev = fshift; 126417ea310bSPierre Jolivet ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1]; 126517ea310bSPierre Jolivet a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0); 126617ea310bSPierre Jolivet rmax = PetscMax(rmax, ailen[i - 1]); 126717ea310bSPierre Jolivet } 126817ea310bSPierre Jolivet if (fshift) { 126917ea310bSPierre Jolivet if (mbs) { 127017ea310bSPierre Jolivet ai[mbs] -= fshift; 127117ea310bSPierre Jolivet a->nz = ai[mbs]; 127217ea310bSPierre Jolivet } 127317ea310bSPierre Jolivet PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz)); 127417ea310bSPierre Jolivet A->nonzerostate++; 127517ea310bSPierre Jolivet A->info.nz_unneeded += (PetscReal)fshift; 127617ea310bSPierre Jolivet a->rmax = rmax; 127717ea310bSPierre Jolivet PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); 127817ea310bSPierre Jolivet PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); 127917ea310bSPierre Jolivet } 128017ea310bSPierre Jolivet PetscFunctionReturn(PETSC_SUCCESS); 128117ea310bSPierre Jolivet } 128217ea310bSPierre Jolivet 12833964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ, 128449b5e25fSSatish Balay MatGetRow_SeqSBAIJ, 128549b5e25fSSatish Balay MatRestoreRow_SeqSBAIJ, 128649b5e25fSSatish Balay MatMult_SeqSBAIJ_N, 128797304618SKris Buschelman /* 4*/ MatMultAdd_SeqSBAIJ_N, 1288431c96f7SBarry Smith MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */ 1289e005ede5SBarry Smith MatMultAdd_SeqSBAIJ_N, 1290f4259b30SLisandro Dalcin NULL, 1291f4259b30SLisandro Dalcin NULL, 1292f4259b30SLisandro Dalcin NULL, 1293f4259b30SLisandro Dalcin /* 10*/ NULL, 1294f4259b30SLisandro Dalcin NULL, 1295c078aec8SLisandro Dalcin MatCholeskyFactor_SeqSBAIJ, 129641f059aeSBarry Smith MatSOR_SeqSBAIJ, 129749b5e25fSSatish Balay MatTranspose_SeqSBAIJ, 129897304618SKris Buschelman /* 15*/ MatGetInfo_SeqSBAIJ, 129949b5e25fSSatish Balay MatEqual_SeqSBAIJ, 130049b5e25fSSatish Balay MatGetDiagonal_SeqSBAIJ, 130149b5e25fSSatish Balay MatDiagonalScale_SeqSBAIJ, 130249b5e25fSSatish Balay MatNorm_SeqSBAIJ, 1303f4259b30SLisandro Dalcin /* 20*/ NULL, 130449b5e25fSSatish Balay MatAssemblyEnd_SeqSBAIJ, 130549b5e25fSSatish Balay MatSetOption_SeqSBAIJ, 130649b5e25fSSatish Balay MatZeroEntries_SeqSBAIJ, 1307f4259b30SLisandro Dalcin /* 24*/ NULL, 1308f4259b30SLisandro Dalcin NULL, 1309f4259b30SLisandro Dalcin NULL, 1310f4259b30SLisandro Dalcin NULL, 1311f4259b30SLisandro Dalcin NULL, 131226cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 1313f4259b30SLisandro Dalcin NULL, 1314f4259b30SLisandro Dalcin NULL, 1315f4259b30SLisandro Dalcin NULL, 1316f4259b30SLisandro Dalcin NULL, 1317d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqSBAIJ, 1318f4259b30SLisandro Dalcin NULL, 1319f4259b30SLisandro Dalcin NULL, 1320f4259b30SLisandro Dalcin NULL, 1321c84f5b01SHong Zhang MatICCFactor_SeqSBAIJ, 1322d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqSBAIJ, 13237dae84e0SHong Zhang MatCreateSubMatrices_SeqSBAIJ, 132449b5e25fSSatish Balay MatIncreaseOverlap_SeqSBAIJ, 132549b5e25fSSatish Balay MatGetValues_SeqSBAIJ, 13263c896bc6SHong Zhang MatCopy_SeqSBAIJ, 1327f4259b30SLisandro Dalcin /* 44*/ NULL, 132849b5e25fSSatish Balay MatScale_SeqSBAIJ, 13297d68702bSBarry Smith MatShift_SeqSBAIJ, 1330f4259b30SLisandro Dalcin NULL, 13313bededecSBarry Smith MatZeroRowsColumns_SeqSBAIJ, 1332f4259b30SLisandro Dalcin /* 49*/ NULL, 133349b5e25fSSatish Balay MatGetRowIJ_SeqSBAIJ, 133449b5e25fSSatish Balay MatRestoreRowIJ_SeqSBAIJ, 1335f4259b30SLisandro Dalcin NULL, 1336f4259b30SLisandro Dalcin NULL, 1337f4259b30SLisandro Dalcin /* 54*/ NULL, 1338f4259b30SLisandro Dalcin NULL, 1339f4259b30SLisandro Dalcin NULL, 1340dc29a518SPierre Jolivet MatPermute_SeqSBAIJ, 134149b5e25fSSatish Balay MatSetValuesBlocked_SeqSBAIJ, 13427dae84e0SHong Zhang /* 59*/ MatCreateSubMatrix_SeqSBAIJ, 1343f4259b30SLisandro Dalcin NULL, 1344f4259b30SLisandro Dalcin NULL, 1345f4259b30SLisandro Dalcin NULL, 1346f4259b30SLisandro Dalcin NULL, 1347f4259b30SLisandro Dalcin /* 64*/ NULL, 1348f4259b30SLisandro Dalcin NULL, 1349f4259b30SLisandro Dalcin NULL, 1350f4259b30SLisandro Dalcin NULL, 1351f4259b30SLisandro Dalcin NULL, 1352d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqSBAIJ, 1353f4259b30SLisandro Dalcin NULL, 135428d58a37SPierre Jolivet MatConvert_MPISBAIJ_Basic, 1355f4259b30SLisandro Dalcin NULL, 1356f4259b30SLisandro Dalcin NULL, 1357f4259b30SLisandro Dalcin /* 74*/ NULL, 1358f4259b30SLisandro Dalcin NULL, 1359f4259b30SLisandro Dalcin NULL, 1360f4259b30SLisandro Dalcin NULL, 1361f4259b30SLisandro Dalcin NULL, 1362f4259b30SLisandro Dalcin /* 79*/ NULL, 1363f4259b30SLisandro Dalcin NULL, 1364f4259b30SLisandro Dalcin NULL, 136597304618SKris Buschelman MatGetInertia_SeqSBAIJ, 13665bba2384SShri Abhyankar MatLoad_SeqSBAIJ, 1367d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqSBAIJ, 1368865e5f61SKris Buschelman MatIsHermitian_SeqSBAIJ, 1369efcf0fc3SBarry Smith MatIsStructurallySymmetric_SeqSBAIJ, 1370f4259b30SLisandro Dalcin NULL, 1371f4259b30SLisandro Dalcin NULL, 1372f4259b30SLisandro Dalcin /* 89*/ NULL, 1373f4259b30SLisandro Dalcin NULL, 1374f4259b30SLisandro Dalcin NULL, 1375f4259b30SLisandro Dalcin NULL, 1376f4259b30SLisandro Dalcin NULL, 1377f4259b30SLisandro Dalcin /* 94*/ NULL, 1378f4259b30SLisandro Dalcin NULL, 1379f4259b30SLisandro Dalcin NULL, 1380f4259b30SLisandro Dalcin NULL, 1381f4259b30SLisandro Dalcin NULL, 1382f4259b30SLisandro Dalcin /* 99*/ NULL, 1383f4259b30SLisandro Dalcin NULL, 1384f4259b30SLisandro Dalcin NULL, 13852726fb6dSPierre Jolivet MatConjugate_SeqSBAIJ, 1386f4259b30SLisandro Dalcin NULL, 1387f4259b30SLisandro Dalcin /*104*/ NULL, 138899cafbc1SBarry Smith MatRealPart_SeqSBAIJ, 1389f5edf698SHong Zhang MatImaginaryPart_SeqSBAIJ, 1390f5edf698SHong Zhang MatGetRowUpperTriangular_SeqSBAIJ, 13912af78befSBarry Smith MatRestoreRowUpperTriangular_SeqSBAIJ, 1392f4259b30SLisandro Dalcin /*109*/ NULL, 1393f4259b30SLisandro Dalcin NULL, 1394f4259b30SLisandro Dalcin NULL, 1395f4259b30SLisandro Dalcin NULL, 1396547795f9SHong Zhang MatMissingDiagonal_SeqSBAIJ, 1397f4259b30SLisandro Dalcin /*114*/ NULL, 1398f4259b30SLisandro Dalcin NULL, 1399f4259b30SLisandro Dalcin NULL, 1400f4259b30SLisandro Dalcin NULL, 1401f4259b30SLisandro Dalcin NULL, 1402f4259b30SLisandro Dalcin /*119*/ NULL, 1403f4259b30SLisandro Dalcin NULL, 1404f4259b30SLisandro Dalcin NULL, 1405f4259b30SLisandro Dalcin NULL, 1406f4259b30SLisandro Dalcin NULL, 1407f4259b30SLisandro Dalcin /*124*/ NULL, 1408f4259b30SLisandro Dalcin NULL, 1409f4259b30SLisandro Dalcin NULL, 1410f4259b30SLisandro Dalcin NULL, 1411f4259b30SLisandro Dalcin NULL, 1412f4259b30SLisandro Dalcin /*129*/ NULL, 1413f4259b30SLisandro Dalcin NULL, 1414f4259b30SLisandro Dalcin NULL, 1415f4259b30SLisandro Dalcin NULL, 1416f4259b30SLisandro Dalcin NULL, 1417f4259b30SLisandro Dalcin /*134*/ NULL, 1418f4259b30SLisandro Dalcin NULL, 1419f4259b30SLisandro Dalcin NULL, 1420f4259b30SLisandro Dalcin NULL, 1421f4259b30SLisandro Dalcin NULL, 142246533700Sstefano_zampini /*139*/ MatSetBlockSizes_Default, 1423f4259b30SLisandro Dalcin NULL, 1424f4259b30SLisandro Dalcin NULL, 1425f4259b30SLisandro Dalcin NULL, 1426f4259b30SLisandro Dalcin NULL, 1427d70f29a3SPierre Jolivet /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ, 1428d70f29a3SPierre Jolivet NULL, 1429d70f29a3SPierre Jolivet NULL, 143099a7f59eSMark Adams NULL, 143199a7f59eSMark Adams NULL, 14327fb60732SBarry Smith NULL, 1433dec0b466SHong Zhang /*150*/ NULL, 143417ea310bSPierre Jolivet MatEliminateZeros_SeqSBAIJ}; 1435be1d678aSKris Buschelman 1436ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat) 1437d71ae5a4SJacob Faibussowitsch { 14384afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1439d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 144049b5e25fSSatish Balay 144149b5e25fSSatish Balay PetscFunctionBegin; 144208401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 144349b5e25fSSatish Balay 144449b5e25fSSatish Balay /* allocate space for values if not already there */ 144548a46eb9SPierre Jolivet if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); 144649b5e25fSSatish Balay 144749b5e25fSSatish Balay /* copy values over */ 14489566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 14493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 145049b5e25fSSatish Balay } 145149b5e25fSSatish Balay 1452ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat) 1453d71ae5a4SJacob Faibussowitsch { 14544afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1455d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 145649b5e25fSSatish Balay 145749b5e25fSSatish Balay PetscFunctionBegin; 145808401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 145928b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 146049b5e25fSSatish Balay 146149b5e25fSSatish Balay /* copy values over */ 14629566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 14633ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 146449b5e25fSSatish Balay } 146549b5e25fSSatish Balay 1466*f9663b93SPierre Jolivet static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 1467d71ae5a4SJacob Faibussowitsch { 1468c464158bSHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 14694dcd73b1SHong Zhang PetscInt i, mbs, nbs, bs2; 14702576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, flg = PETSC_FALSE, realalloc = PETSC_FALSE; 147149b5e25fSSatish Balay 1472b4e2f619SBarry Smith PetscFunctionBegin; 1473ad79cf63SBarry Smith if (B->hash_active) { 1474ad79cf63SBarry Smith PetscInt bs; 1475aea10558SJacob Faibussowitsch B->ops[0] = b->cops; 1476ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 1477ad79cf63SBarry Smith PetscCall(MatGetBlockSize(B, &bs)); 1478ad79cf63SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&b->bht)); 1479ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 1480ad79cf63SBarry Smith PetscCall(PetscFree(b->bdnz)); 1481ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 1482ad79cf63SBarry Smith } 14832576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 1484db4efbfdSBarry Smith 14859566063dSJacob Faibussowitsch PetscCall(MatSetBlockSize(B, PetscAbs(bs))); 14869566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 14879566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 148808401ef6SPierre Jolivet PetscCheck(B->rmap->N <= B->cmap->N, PETSC_COMM_SELF, PETSC_ERR_SUP, "SEQSBAIJ matrix cannot have more rows %" PetscInt_FMT " than columns %" PetscInt_FMT, B->rmap->N, B->cmap->N); 14899566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 1490899cda47SBarry Smith 149121940c7eSstefano_zampini B->preallocated = PETSC_TRUE; 149221940c7eSstefano_zampini 1493d0f46423SBarry Smith mbs = B->rmap->N / bs; 14944dcd73b1SHong Zhang nbs = B->cmap->n / bs; 149549b5e25fSSatish Balay bs2 = bs * bs; 149649b5e25fSSatish Balay 1497aed4548fSBarry Smith PetscCheck(mbs * bs == B->rmap->N && nbs * bs == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Number rows, cols must be divisible by blocksize"); 149849b5e25fSSatish Balay 1499ab93d7beSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 1500ab93d7beSBarry Smith skipallocation = PETSC_TRUE; 1501ab93d7beSBarry Smith nz = 0; 1502ab93d7beSBarry Smith } 1503ab93d7beSBarry Smith 1504435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3; 150508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 150649b5e25fSSatish Balay if (nnz) { 150749b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 150808401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 150908401ef6SPierre Jolivet PetscCheck(nnz[i] <= nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than block row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " block rowlength %" PetscInt_FMT, i, nnz[i], nbs); 151049b5e25fSSatish Balay } 151149b5e25fSSatish Balay } 151249b5e25fSSatish Balay 1513db4efbfdSBarry Smith B->ops->mult = MatMult_SeqSBAIJ_N; 1514db4efbfdSBarry Smith B->ops->multadd = MatMultAdd_SeqSBAIJ_N; 1515db4efbfdSBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_N; 1516db4efbfdSBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N; 151726fbe8dcSKarl Rupp 15189566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 151949b5e25fSSatish Balay if (!flg) { 152049b5e25fSSatish Balay switch (bs) { 152149b5e25fSSatish Balay case 1: 152249b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_1; 152349b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_1; 1524431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_1; 1525431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1; 152649b5e25fSSatish Balay break; 152749b5e25fSSatish Balay case 2: 152849b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_2; 152949b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_2; 1530431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_2; 1531431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2; 153249b5e25fSSatish Balay break; 153349b5e25fSSatish Balay case 3: 153449b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_3; 153549b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_3; 1536431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_3; 1537431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3; 153849b5e25fSSatish Balay break; 153949b5e25fSSatish Balay case 4: 154049b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_4; 154149b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_4; 1542431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_4; 1543431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4; 154449b5e25fSSatish Balay break; 154549b5e25fSSatish Balay case 5: 154649b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_5; 154749b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_5; 1548431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_5; 1549431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5; 155049b5e25fSSatish Balay break; 155149b5e25fSSatish Balay case 6: 155249b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_6; 155349b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_6; 1554431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_6; 1555431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6; 155649b5e25fSSatish Balay break; 155749b5e25fSSatish Balay case 7: 1558de53e5efSHong Zhang B->ops->mult = MatMult_SeqSBAIJ_7; 155949b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_7; 1560431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_7; 1561431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7; 156249b5e25fSSatish Balay break; 156349b5e25fSSatish Balay } 156449b5e25fSSatish Balay } 156549b5e25fSSatish Balay 156649b5e25fSSatish Balay b->mbs = mbs; 15674dcd73b1SHong Zhang b->nbs = nbs; 1568ab93d7beSBarry Smith if (!skipallocation) { 15692ee49352SLisandro Dalcin if (!b->imax) { 15709566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mbs, &b->imax, mbs, &b->ilen)); 157126fbe8dcSKarl Rupp 1572c760cd28SBarry Smith b->free_imax_ilen = PETSC_TRUE; 15732ee49352SLisandro Dalcin } 157449b5e25fSSatish Balay if (!nnz) { 1575435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 157649b5e25fSSatish Balay else if (nz <= 0) nz = 1; 15775d2a9ed1SStefano Zampini nz = PetscMin(nbs, nz); 157826fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->imax[i] = nz; 15799566063dSJacob Faibussowitsch PetscCall(PetscIntMultError(nz, mbs, &nz)); 158049b5e25fSSatish Balay } else { 1581c73702f5SBarry Smith PetscInt64 nz64 = 0; 15829371c9d4SSatish Balay for (i = 0; i < mbs; i++) { 15839371c9d4SSatish Balay b->imax[i] = nnz[i]; 15849371c9d4SSatish Balay nz64 += nnz[i]; 15859371c9d4SSatish Balay } 15869566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 158749b5e25fSSatish Balay } 15882ee49352SLisandro Dalcin /* b->ilen will count nonzeros in each block row so far. */ 158926fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->ilen[i] = 0; 15906c6c5352SBarry Smith /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */ 159149b5e25fSSatish Balay 159249b5e25fSSatish Balay /* allocate the matrix space */ 15939566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 15949566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &b->a, nz, &b->j, B->rmap->N + 1, &b->i)); 15959566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->a, nz * bs2)); 15969566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->j, nz)); 159726fbe8dcSKarl Rupp 159849b5e25fSSatish Balay b->singlemalloc = PETSC_TRUE; 159949b5e25fSSatish Balay 160049b5e25fSSatish Balay /* pointer to beginning of each row */ 1601e60cf9a0SBarry Smith b->i[0] = 0; 160226fbe8dcSKarl Rupp for (i = 1; i < mbs + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 160326fbe8dcSKarl Rupp 1604e6b907acSBarry Smith b->free_a = PETSC_TRUE; 1605e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 1606e811da20SHong Zhang } else { 1607e6b907acSBarry Smith b->free_a = PETSC_FALSE; 1608e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 1609ab93d7beSBarry Smith } 161049b5e25fSSatish Balay 161149b5e25fSSatish Balay b->bs2 = bs2; 16126c6c5352SBarry Smith b->nz = 0; 1613b32cb4a7SJed Brown b->maxnz = nz; 1614f4259b30SLisandro Dalcin b->inew = NULL; 1615f4259b30SLisandro Dalcin b->jnew = NULL; 1616f4259b30SLisandro Dalcin b->anew = NULL; 1617f4259b30SLisandro Dalcin b->a2anew = NULL; 16181a3463dfSHong Zhang b->permute = PETSC_FALSE; 1619cb7b82ddSBarry Smith 1620cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 1621cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 16229566063dSJacob Faibussowitsch if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 16233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1624c464158bSHong Zhang } 1625153ea458SHong Zhang 1626ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B, PetscInt bs, const PetscInt ii[], const PetscInt jj[], const PetscScalar V[]) 1627d71ae5a4SJacob Faibussowitsch { 16280cd7f59aSBarry Smith PetscInt i, j, m, nz, anz, nz_max = 0, *nnz; 1629f4259b30SLisandro Dalcin PetscScalar *values = NULL; 163038f409ebSLisandro Dalcin PetscBool roworiented = ((Mat_SeqSBAIJ *)B->data)->roworiented; 16310cd7f59aSBarry Smith 163238f409ebSLisandro Dalcin PetscFunctionBegin; 163308401ef6SPierre Jolivet PetscCheck(bs >= 1, PetscObjectComm((PetscObject)B), PETSC_ERR_ARG_OUTOFRANGE, "Invalid block size specified, must be positive but it is %" PetscInt_FMT, bs); 16349566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->rmap, bs)); 16359566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->cmap, bs)); 16369566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 16379566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 16389566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 163938f409ebSLisandro Dalcin m = B->rmap->n / bs; 164038f409ebSLisandro Dalcin 1641aed4548fSBarry Smith PetscCheck(!ii[0], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "ii[0] must be 0 but it is %" PetscInt_FMT, ii[0]); 16429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 164338f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 164438f409ebSLisandro Dalcin nz = ii[i + 1] - ii[i]; 164508401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 16460cd7f59aSBarry Smith anz = 0; 16470cd7f59aSBarry Smith for (j = 0; j < nz; j++) { 16480cd7f59aSBarry Smith /* count only values on the diagonal or above */ 16490cd7f59aSBarry Smith if (jj[ii[i] + j] >= i) { 16500cd7f59aSBarry Smith anz = nz - j; 16510cd7f59aSBarry Smith break; 16520cd7f59aSBarry Smith } 16530cd7f59aSBarry Smith } 16540cd7f59aSBarry Smith nz_max = PetscMax(nz_max, anz); 16550cd7f59aSBarry Smith nnz[i] = anz; 165638f409ebSLisandro Dalcin } 16579566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 16589566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 165938f409ebSLisandro Dalcin 166038f409ebSLisandro Dalcin values = (PetscScalar *)V; 166148a46eb9SPierre Jolivet if (!values) PetscCall(PetscCalloc1(bs * bs * nz_max, &values)); 166238f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 166338f409ebSLisandro Dalcin PetscInt ncols = ii[i + 1] - ii[i]; 166438f409ebSLisandro Dalcin const PetscInt *icols = jj + ii[i]; 166538f409ebSLisandro Dalcin if (!roworiented || bs == 1) { 166638f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * ii[i]) : 0); 16679566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, ncols, icols, svals, INSERT_VALUES)); 166838f409ebSLisandro Dalcin } else { 166938f409ebSLisandro Dalcin for (j = 0; j < ncols; j++) { 167038f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * (ii[i] + j)) : 0); 16719566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, 1, &icols[j], svals, INSERT_VALUES)); 167238f409ebSLisandro Dalcin } 167338f409ebSLisandro Dalcin } 167438f409ebSLisandro Dalcin } 16759566063dSJacob Faibussowitsch if (!V) PetscCall(PetscFree(values)); 16769566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 16779566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 16789566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 16793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 168038f409ebSLisandro Dalcin } 168138f409ebSLisandro Dalcin 1682db4efbfdSBarry Smith /* 1683db4efbfdSBarry Smith This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization 1684db4efbfdSBarry Smith */ 1685d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B, PetscBool natural) 1686d71ae5a4SJacob Faibussowitsch { 1687ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 1688db4efbfdSBarry Smith PetscInt bs = B->rmap->bs; 1689db4efbfdSBarry Smith 1690db4efbfdSBarry Smith PetscFunctionBegin; 16919566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 1692db4efbfdSBarry Smith if (flg) bs = 8; 1693db4efbfdSBarry Smith 1694db4efbfdSBarry Smith if (!natural) { 1695db4efbfdSBarry Smith switch (bs) { 1696d71ae5a4SJacob Faibussowitsch case 1: 1697d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace; 1698d71ae5a4SJacob Faibussowitsch break; 1699d71ae5a4SJacob Faibussowitsch case 2: 1700d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2; 1701d71ae5a4SJacob Faibussowitsch break; 1702d71ae5a4SJacob Faibussowitsch case 3: 1703d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3; 1704d71ae5a4SJacob Faibussowitsch break; 1705d71ae5a4SJacob Faibussowitsch case 4: 1706d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4; 1707d71ae5a4SJacob Faibussowitsch break; 1708d71ae5a4SJacob Faibussowitsch case 5: 1709d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5; 1710d71ae5a4SJacob Faibussowitsch break; 1711d71ae5a4SJacob Faibussowitsch case 6: 1712d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6; 1713d71ae5a4SJacob Faibussowitsch break; 1714d71ae5a4SJacob Faibussowitsch case 7: 1715d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7; 1716d71ae5a4SJacob Faibussowitsch break; 1717d71ae5a4SJacob Faibussowitsch default: 1718d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N; 1719d71ae5a4SJacob Faibussowitsch break; 1720db4efbfdSBarry Smith } 1721db4efbfdSBarry Smith } else { 1722db4efbfdSBarry Smith switch (bs) { 1723d71ae5a4SJacob Faibussowitsch case 1: 1724d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace; 1725d71ae5a4SJacob Faibussowitsch break; 1726d71ae5a4SJacob Faibussowitsch case 2: 1727d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering; 1728d71ae5a4SJacob Faibussowitsch break; 1729d71ae5a4SJacob Faibussowitsch case 3: 1730d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering; 1731d71ae5a4SJacob Faibussowitsch break; 1732d71ae5a4SJacob Faibussowitsch case 4: 1733d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering; 1734d71ae5a4SJacob Faibussowitsch break; 1735d71ae5a4SJacob Faibussowitsch case 5: 1736d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering; 1737d71ae5a4SJacob Faibussowitsch break; 1738d71ae5a4SJacob Faibussowitsch case 6: 1739d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering; 1740d71ae5a4SJacob Faibussowitsch break; 1741d71ae5a4SJacob Faibussowitsch case 7: 1742d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering; 1743d71ae5a4SJacob Faibussowitsch break; 1744d71ae5a4SJacob Faibussowitsch default: 1745d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering; 1746d71ae5a4SJacob Faibussowitsch break; 1747db4efbfdSBarry Smith } 1748db4efbfdSBarry Smith } 17493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1750db4efbfdSBarry Smith } 1751db4efbfdSBarry Smith 1752cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType, MatReuse, Mat *); 1753cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType, MatReuse, Mat *); 1754d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatFactorGetSolverType_petsc(Mat A, MatSolverType *type) 1755d71ae5a4SJacob Faibussowitsch { 17564ac6704cSBarry Smith PetscFunctionBegin; 17574ac6704cSBarry Smith *type = MATSOLVERPETSC; 17583ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17594ac6704cSBarry Smith } 1760d769727bSBarry Smith 1761d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A, MatFactorType ftype, Mat *B) 1762d71ae5a4SJacob Faibussowitsch { 1763d0f46423SBarry Smith PetscInt n = A->rmap->n; 17645c9eb25fSBarry Smith 17655c9eb25fSBarry Smith PetscFunctionBegin; 17660e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX) 176703e5aca4SStefano Zampini if ((ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) && A->hermitian == PETSC_BOOL3_TRUE && A->symmetric != PETSC_BOOL3_TRUE) { 176803e5aca4SStefano Zampini PetscCall(PetscInfo(A, "Hermitian MAT_FACTOR_CHOLESKY or MAT_FACTOR_ICC are not supported. Use MAT_FACTOR_LU instead.\n")); 176903e5aca4SStefano Zampini *B = NULL; 177003e5aca4SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS); 177103e5aca4SStefano Zampini } 17720e92d65fSHong Zhang #endif 1773eb1ec7c1SStefano Zampini 17749566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 17759566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, n, n, n, n)); 17765c9eb25fSBarry Smith if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) { 17779566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATSEQSBAIJ)); 17789566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*B, A->rmap->bs, MAT_SKIP_ALLOCATION, NULL)); 177926fbe8dcSKarl Rupp 17807b056e98SHong Zhang (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ; 1781c6d0d4f0SHong Zhang (*B)->ops->iccfactorsymbolic = MatICCFactorSymbolic_SeqSBAIJ; 17829566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_CHOLESKY])); 17839566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_ICC])); 1784e32f2f54SBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "Factor type not supported"); 178500c67f3bSHong Zhang 1786d5f3da31SBarry Smith (*B)->factortype = ftype; 1787f73b0415SBarry Smith (*B)->canuseordering = PETSC_TRUE; 17889566063dSJacob Faibussowitsch PetscCall(PetscFree((*B)->solvertype)); 17899566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &(*B)->solvertype)); 17909566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)*B, "MatFactorGetSolverType_C", MatFactorGetSolverType_petsc)); 17913ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17925c9eb25fSBarry Smith } 17935c9eb25fSBarry Smith 17948397e458SBarry Smith /*@C 17952ef1f0ffSBarry Smith MatSeqSBAIJGetArray - gives access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored 17968397e458SBarry Smith 17978397e458SBarry Smith Not Collective 17988397e458SBarry Smith 17998397e458SBarry Smith Input Parameter: 1800fe59aa6dSJacob Faibussowitsch . A - a `MATSEQSBAIJ` matrix 18018397e458SBarry Smith 18028397e458SBarry Smith Output Parameter: 18038397e458SBarry Smith . array - pointer to the data 18048397e458SBarry Smith 18058397e458SBarry Smith Level: intermediate 18068397e458SBarry Smith 18071cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJRestoreArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18088397e458SBarry Smith @*/ 1809d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJGetArray(Mat A, PetscScalar **array) 1810d71ae5a4SJacob Faibussowitsch { 18118397e458SBarry Smith PetscFunctionBegin; 1812cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJGetArray_C", (Mat, PetscScalar **), (A, array)); 18133ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18148397e458SBarry Smith } 18158397e458SBarry Smith 18168397e458SBarry Smith /*@C 18172ef1f0ffSBarry Smith MatSeqSBAIJRestoreArray - returns access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored obtained by `MatSeqSBAIJGetArray()` 18188397e458SBarry Smith 18198397e458SBarry Smith Not Collective 18208397e458SBarry Smith 18218397e458SBarry Smith Input Parameters: 1822fe59aa6dSJacob Faibussowitsch + A - a `MATSEQSBAIJ` matrix 1823a2b725a8SWilliam Gropp - array - pointer to the data 18248397e458SBarry Smith 18258397e458SBarry Smith Level: intermediate 18268397e458SBarry Smith 18271cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJGetArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18288397e458SBarry Smith @*/ 1829d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJRestoreArray(Mat A, PetscScalar **array) 1830d71ae5a4SJacob Faibussowitsch { 18318397e458SBarry Smith PetscFunctionBegin; 1832cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJRestoreArray_C", (Mat, PetscScalar **), (A, array)); 18333ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18348397e458SBarry Smith } 18358397e458SBarry Smith 18360bad9183SKris Buschelman /*MC 1837fafad747SKris Buschelman MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices, 18380bad9183SKris Buschelman based on block compressed sparse row format. Only the upper triangular portion of the matrix is stored. 18390bad9183SKris Buschelman 1840828413b8SBarry Smith For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you 184111a5261eSBarry Smith can call `MatSetOption`(`Mat`, `MAT_HERMITIAN`). 1842828413b8SBarry Smith 18432ef1f0ffSBarry Smith Options Database Key: 184411a5261eSBarry Smith . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to `MatSetFromOptions()` 18450bad9183SKris Buschelman 18462ef1f0ffSBarry Smith Level: beginner 18472ef1f0ffSBarry Smith 184895452b02SPatrick Sanan Notes: 184995452b02SPatrick Sanan By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not 185011a5261eSBarry Smith stored and it is assumed they symmetric to the upper triangular). If you call `MatSetOption`(`Mat`,`MAT_IGNORE_LOWER_TRIANGULAR`,`PETSC_FALSE`) or use 18512ef1f0ffSBarry Smith the options database `-mat_ignore_lower_triangular` false it will generate an error if you try to set a value in the lower triangular portion. 185271dad5bbSBarry Smith 1853476417e5SBarry Smith The number of rows in the matrix must be less than or equal to the number of columns 185471dad5bbSBarry Smith 18551cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ()`, `MatType`, `MATMPISBAIJ` 18560bad9183SKris Buschelman M*/ 1857d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B) 1858d71ae5a4SJacob Faibussowitsch { 1859a23d5eceSKris Buschelman Mat_SeqSBAIJ *b; 186013f74950SBarry Smith PetscMPIInt size; 1861ace3abfcSBarry Smith PetscBool no_unroll = PETSC_FALSE, no_inode = PETSC_FALSE; 1862a23d5eceSKris Buschelman 1863a23d5eceSKris Buschelman PetscFunctionBegin; 18649566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 186508401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Comm must be of size 1"); 1866a23d5eceSKris Buschelman 18674dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 1868a23d5eceSKris Buschelman B->data = (void *)b; 1869aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 187026fbe8dcSKarl Rupp 1871a23d5eceSKris Buschelman B->ops->destroy = MatDestroy_SeqSBAIJ; 1872a23d5eceSKris Buschelman B->ops->view = MatView_SeqSBAIJ; 1873f4259b30SLisandro Dalcin b->row = NULL; 1874f4259b30SLisandro Dalcin b->icol = NULL; 1875a23d5eceSKris Buschelman b->reallocs = 0; 1876f4259b30SLisandro Dalcin b->saved_values = NULL; 18770def2e27SBarry Smith b->inode.limit = 5; 18780def2e27SBarry Smith b->inode.max_limit = 5; 1879a23d5eceSKris Buschelman 1880a23d5eceSKris Buschelman b->roworiented = PETSC_TRUE; 1881a23d5eceSKris Buschelman b->nonew = 0; 1882f4259b30SLisandro Dalcin b->diag = NULL; 1883f4259b30SLisandro Dalcin b->solve_work = NULL; 1884f4259b30SLisandro Dalcin b->mult_work = NULL; 1885f4259b30SLisandro Dalcin B->spptr = NULL; 1886f2cbd3d5SJed Brown B->info.nz_unneeded = (PetscReal)b->maxnz * b->bs2; 1887a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 1888a23d5eceSKris Buschelman 1889f4259b30SLisandro Dalcin b->inew = NULL; 1890f4259b30SLisandro Dalcin b->jnew = NULL; 1891f4259b30SLisandro Dalcin b->anew = NULL; 1892f4259b30SLisandro Dalcin b->a2anew = NULL; 1893a23d5eceSKris Buschelman b->permute = PETSC_FALSE; 1894a23d5eceSKris Buschelman 189571dad5bbSBarry Smith b->ignore_ltriangular = PETSC_TRUE; 189626fbe8dcSKarl Rupp 18979566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_ignore_lower_triangular", &b->ignore_ltriangular, NULL)); 1898941593c8SHong Zhang 1899f5edf698SHong Zhang b->getrow_utriangular = PETSC_FALSE; 190026fbe8dcSKarl Rupp 19019566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_getrow_uppertriangular", &b->getrow_utriangular, NULL)); 1902f5edf698SHong Zhang 19039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJGetArray_C", MatSeqSBAIJGetArray_SeqSBAIJ)); 19049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJRestoreArray_C", MatSeqSBAIJRestoreArray_SeqSBAIJ)); 19059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqSBAIJ)); 19069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqSBAIJ)); 19079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetColumnIndices_C", MatSeqSBAIJSetColumnIndices_SeqSBAIJ)); 19089566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqaij_C", MatConvert_SeqSBAIJ_SeqAIJ)); 19099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqbaij_C", MatConvert_SeqSBAIJ_SeqBAIJ)); 19109566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocation_C", MatSeqSBAIJSetPreallocation_SeqSBAIJ)); 19119566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocationCSR_C", MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ)); 19126214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 19139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_elemental_C", MatConvert_SeqSBAIJ_Elemental)); 19146214f412SHong Zhang #endif 1915d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 19169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_scalapack_C", MatConvert_SBAIJ_ScaLAPACK)); 1917d24d4204SJose E. Roman #endif 191823ce1328SBarry Smith 1919b94d7dedSBarry Smith B->symmetry_eternal = PETSC_TRUE; 1920b94d7dedSBarry Smith B->structural_symmetry_eternal = PETSC_TRUE; 1921b94d7dedSBarry Smith B->symmetric = PETSC_BOOL3_TRUE; 1922b94d7dedSBarry Smith B->structurally_symmetric = PETSC_BOOL3_TRUE; 1923eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 1924b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_FALSE; 1925eb1ec7c1SStefano Zampini #else 1926b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_TRUE; 1927eb1ec7c1SStefano Zampini #endif 192813647f61SHong Zhang 19299566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQSBAIJ)); 19300def2e27SBarry Smith 1931d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)B), ((PetscObject)B)->prefix, "Options for SEQSBAIJ matrix", "Mat"); 19329566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_unroll", "Do not optimize for inodes (slower)", NULL, no_unroll, &no_unroll, NULL)); 193348a46eb9SPierre Jolivet if (no_unroll) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_unroll\n")); 19349566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_inode", "Do not optimize for inodes (slower)", NULL, no_inode, &no_inode, NULL)); 19359566063dSJacob Faibussowitsch if (no_inode) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_inode\n")); 19369566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-mat_inode_limit", "Do not use inodes larger then this value", NULL, b->inode.limit, &b->inode.limit, NULL)); 1937d0609cedSBarry Smith PetscOptionsEnd(); 1938ace3abfcSBarry Smith b->inode.use = (PetscBool)(!(no_unroll || no_inode)); 19390def2e27SBarry Smith if (b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit; 19403ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1941a23d5eceSKris Buschelman } 1942a23d5eceSKris Buschelman 1943a23d5eceSKris Buschelman /*@C 1944a23d5eceSKris Buschelman MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block 194511a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 194620f4b53cSBarry Smith user should preallocate the matrix storage by setting the parameter `nz` 194720f4b53cSBarry Smith (or the array `nnz`). 1948a23d5eceSKris Buschelman 1949c3339decSBarry Smith Collective 1950a23d5eceSKris Buschelman 1951a23d5eceSKris Buschelman Input Parameters: 19521c4f3114SJed Brown + B - the symmetric matrix 195311a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 195411a5261eSBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()` 1955a23d5eceSKris Buschelman . nz - number of block nonzeros per block row (same for all rows) 1956a23d5eceSKris Buschelman - nnz - array containing the number of block nonzeros in the upper triangular plus 19572ef1f0ffSBarry Smith diagonal portion of each block (possibly different for each block row) or `NULL` 1958a23d5eceSKris Buschelman 1959a23d5eceSKris Buschelman Options Database Keys: 1960a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 1961a23d5eceSKris Buschelman block calculations (much slower) 1962a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use (only works if a negative bs is passed in 1963a23d5eceSKris Buschelman 1964a23d5eceSKris Buschelman Level: intermediate 1965a23d5eceSKris Buschelman 1966a23d5eceSKris Buschelman Notes: 196720f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 19682ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 1969651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 1970a23d5eceSKris Buschelman 197111a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 1972aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 19732ef1f0ffSBarry Smith You can also run with the option `-info` and look for messages with the string 1974aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 1975aa95bbe8SBarry Smith 19762ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 197749a6f317SBarry Smith 19781cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 1979a23d5eceSKris Buschelman @*/ 1980d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 1981d71ae5a4SJacob Faibussowitsch { 1982a23d5eceSKris Buschelman PetscFunctionBegin; 19836ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 19846ba663aaSJed Brown PetscValidType(B, 1); 19856ba663aaSJed Brown PetscValidLogicalCollectiveInt(B, bs, 2); 1986cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocation_C", (Mat, PetscInt, PetscInt, const PetscInt[]), (B, bs, nz, nnz)); 19873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1988a23d5eceSKris Buschelman } 198949b5e25fSSatish Balay 199038f409ebSLisandro Dalcin /*@C 199111a5261eSBarry Smith MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in `MATSEQSBAIJ` format using the given nonzero structure and (optional) numerical values 199238f409ebSLisandro Dalcin 199338f409ebSLisandro Dalcin Input Parameters: 19941c4f3114SJed Brown + B - the matrix 1995eab78319SHong Zhang . bs - size of block, the blocks are ALWAYS square. 199638f409ebSLisandro Dalcin . i - the indices into j for the start of each local row (starts with zero) 199738f409ebSLisandro Dalcin . j - the column indices for each local row (starts with zero) these must be sorted for each row 199838f409ebSLisandro Dalcin - v - optional values in the matrix 199938f409ebSLisandro Dalcin 2000664954b6SBarry Smith Level: advanced 200138f409ebSLisandro Dalcin 200238f409ebSLisandro Dalcin Notes: 200311a5261eSBarry Smith The order of the entries in values is specified by the `MatOption` `MAT_ROW_ORIENTED`. For example, C programs 200411a5261eSBarry Smith may want to use the default `MAT_ROW_ORIENTED` = `PETSC_TRUE` and use an array v[nnz][bs][bs] where the second index is 200538f409ebSLisandro Dalcin over rows within a block and the last index is over columns within a block row. Fortran programs will likely set 200611a5261eSBarry Smith `MAT_ROW_ORIENTED` = `PETSC_FALSE` and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a 200738f409ebSLisandro Dalcin block column and the second index is over columns within a block. 200838f409ebSLisandro Dalcin 200950c5228eSBarry Smith Any entries below the diagonal are ignored 20100cd7f59aSBarry Smith 20110cd7f59aSBarry Smith Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries 20120cd7f59aSBarry Smith and usually the numerical values as well 2013664954b6SBarry Smith 2014fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqSBAIJ()`, `MatSetValuesBlocked()`, `MatSeqSBAIJSetPreallocation()` 201538f409ebSLisandro Dalcin @*/ 2016d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B, PetscInt bs, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 2017d71ae5a4SJacob Faibussowitsch { 201838f409ebSLisandro Dalcin PetscFunctionBegin; 201938f409ebSLisandro Dalcin PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 202038f409ebSLisandro Dalcin PetscValidType(B, 1); 202138f409ebSLisandro Dalcin PetscValidLogicalCollectiveInt(B, bs, 2); 2022cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocationCSR_C", (Mat, PetscInt, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, bs, i, j, v)); 20233ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202438f409ebSLisandro Dalcin } 202538f409ebSLisandro Dalcin 2026c464158bSHong Zhang /*@C 20272ef1f0ffSBarry Smith MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in (block 202811a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 20292ef1f0ffSBarry Smith user should preallocate the matrix storage by setting the parameter `nz` 20302ef1f0ffSBarry Smith (or the array `nnz`). 203149b5e25fSSatish Balay 2032d083f849SBarry Smith Collective 2033c464158bSHong Zhang 2034c464158bSHong Zhang Input Parameters: 203511a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 203611a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 2037bb7ae925SBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs() 203820f4b53cSBarry Smith . m - number of rows 203920f4b53cSBarry Smith . n - number of columns 2040c464158bSHong Zhang . nz - number of block nonzeros per block row (same for all rows) 2041744e8345SSatish Balay - nnz - array containing the number of block nonzeros in the upper triangular plus 20422ef1f0ffSBarry Smith diagonal portion of each block (possibly different for each block row) or `NULL` 2043c464158bSHong Zhang 2044c464158bSHong Zhang Output Parameter: 2045c464158bSHong Zhang . A - the symmetric matrix 2046c464158bSHong Zhang 2047c464158bSHong Zhang Options Database Keys: 2048a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2049c464158bSHong Zhang block calculations (much slower) 2050a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use 2051c464158bSHong Zhang 2052c464158bSHong Zhang Level: intermediate 2053c464158bSHong Zhang 20542ef1f0ffSBarry Smith Notes: 205577433607SBarry Smith It is recommended that one use `MatCreateFromOptions()` or the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 2056f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 205711a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 2058175b88e8SBarry Smith 20596d6d819aSHong Zhang The number of rows and columns must be divisible by blocksize. 20606d6d819aSHong Zhang This matrix type does not support complex Hermitian operation. 2061c464158bSHong Zhang 20622ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 20632ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 2064651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2065c464158bSHong Zhang 20662ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 206749a6f317SBarry Smith 20681cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2069c464158bSHong Zhang @*/ 2070d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 2071d71ae5a4SJacob Faibussowitsch { 2072c464158bSHong Zhang PetscFunctionBegin; 20739566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 20749566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 20759566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQSBAIJ)); 20769566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*A, bs, nz, (PetscInt *)nnz)); 20773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 207849b5e25fSSatish Balay } 207949b5e25fSSatish Balay 2080d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 2081d71ae5a4SJacob Faibussowitsch { 208249b5e25fSSatish Balay Mat C; 208349b5e25fSSatish Balay Mat_SeqSBAIJ *c, *a = (Mat_SeqSBAIJ *)A->data; 2084b40805acSSatish Balay PetscInt i, mbs = a->mbs, nz = a->nz, bs2 = a->bs2; 208549b5e25fSSatish Balay 208649b5e25fSSatish Balay PetscFunctionBegin; 208731fe6a7dSBarry Smith PetscCheck(A->assembled, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 208808401ef6SPierre Jolivet PetscCheck(a->i[mbs] == nz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Corrupt matrix"); 208949b5e25fSSatish Balay 2090f4259b30SLisandro Dalcin *B = NULL; 20919566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 20929566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->rmap->N, A->cmap->n, A->rmap->N, A->cmap->n)); 20939566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, A)); 20949566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATSEQSBAIJ)); 2095692f9cbeSHong Zhang c = (Mat_SeqSBAIJ *)C->data; 2096692f9cbeSHong Zhang 2097273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2098d5f3da31SBarry Smith C->factortype = A->factortype; 2099f4259b30SLisandro Dalcin c->row = NULL; 2100f4259b30SLisandro Dalcin c->icol = NULL; 2101f4259b30SLisandro Dalcin c->saved_values = NULL; 2102a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 210349b5e25fSSatish Balay C->assembled = PETSC_TRUE; 210449b5e25fSSatish Balay 21059566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 21069566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 210749b5e25fSSatish Balay c->bs2 = a->bs2; 210849b5e25fSSatish Balay c->mbs = a->mbs; 210949b5e25fSSatish Balay c->nbs = a->nbs; 211049b5e25fSSatish Balay 2111c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2112c760cd28SBarry Smith c->imax = a->imax; 2113c760cd28SBarry Smith c->ilen = a->ilen; 2114c760cd28SBarry Smith c->free_imax_ilen = PETSC_FALSE; 2115c760cd28SBarry Smith } else { 21169566063dSJacob Faibussowitsch PetscCall(PetscMalloc2((mbs + 1), &c->imax, (mbs + 1), &c->ilen)); 211749b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 211849b5e25fSSatish Balay c->imax[i] = a->imax[i]; 211949b5e25fSSatish Balay c->ilen[i] = a->ilen[i]; 212049b5e25fSSatish Balay } 2121c760cd28SBarry Smith c->free_imax_ilen = PETSC_TRUE; 2122c760cd28SBarry Smith } 212349b5e25fSSatish Balay 212449b5e25fSSatish Balay /* allocate the matrix space */ 21254da8f245SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 21269566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2 * nz, &c->a)); 212744e1c64aSLisandro Dalcin c->i = a->i; 212844e1c64aSLisandro Dalcin c->j = a->j; 21294da8f245SBarry Smith c->singlemalloc = PETSC_FALSE; 213044e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21314da8f245SBarry Smith c->free_ij = PETSC_FALSE; 21324da8f245SBarry Smith c->parent = A; 21339566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)A)); 21349566063dSJacob Faibussowitsch PetscCall(MatSetOption(A, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21359566063dSJacob Faibussowitsch PetscCall(MatSetOption(C, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21364da8f245SBarry Smith } else { 21379566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &c->a, nz, &c->j, mbs + 1, &c->i)); 21389566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, mbs + 1)); 21394da8f245SBarry Smith c->singlemalloc = PETSC_TRUE; 214044e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21414da8f245SBarry Smith c->free_ij = PETSC_TRUE; 21424da8f245SBarry Smith } 214349b5e25fSSatish Balay if (mbs > 0) { 214448a46eb9SPierre Jolivet if (cpvalues != MAT_SHARE_NONZERO_PATTERN) PetscCall(PetscArraycpy(c->j, a->j, nz)); 214549b5e25fSSatish Balay if (cpvalues == MAT_COPY_VALUES) { 21469566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, a->a, bs2 * nz)); 214749b5e25fSSatish Balay } else { 21489566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, bs2 * nz)); 214949b5e25fSSatish Balay } 2150a1c3900fSBarry Smith if (a->jshort) { 215144e1c64aSLisandro Dalcin /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */ 215244e1c64aSLisandro Dalcin /* if the parent matrix is reassembled, this child matrix will never notice */ 21539566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &c->jshort)); 21549566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->jshort, a->jshort, nz)); 215526fbe8dcSKarl Rupp 21564da8f245SBarry Smith c->free_jshort = PETSC_TRUE; 21574da8f245SBarry Smith } 2158a1c3900fSBarry Smith } 215949b5e25fSSatish Balay 216049b5e25fSSatish Balay c->roworiented = a->roworiented; 216149b5e25fSSatish Balay c->nonew = a->nonew; 216249b5e25fSSatish Balay 216349b5e25fSSatish Balay if (a->diag) { 2164c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2165c760cd28SBarry Smith c->diag = a->diag; 2166c760cd28SBarry Smith c->free_diag = PETSC_FALSE; 2167c760cd28SBarry Smith } else { 21689566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mbs, &c->diag)); 216926fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) c->diag[i] = a->diag[i]; 2170c760cd28SBarry Smith c->free_diag = PETSC_TRUE; 2171c760cd28SBarry Smith } 217244e1c64aSLisandro Dalcin } 21736c6c5352SBarry Smith c->nz = a->nz; 2174f2cbd3d5SJed Brown c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 2175f4259b30SLisandro Dalcin c->solve_work = NULL; 2176f4259b30SLisandro Dalcin c->mult_work = NULL; 217726fbe8dcSKarl Rupp 217849b5e25fSSatish Balay *B = C; 21799566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 21803ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 218149b5e25fSSatish Balay } 218249b5e25fSSatish Balay 2183618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */ 2184618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary 2185618cc2edSLisandro Dalcin 2186d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqSBAIJ(Mat mat, PetscViewer viewer) 2187d71ae5a4SJacob Faibussowitsch { 21887f489da9SVaclav Hapla PetscBool isbinary; 21892f480046SShri Abhyankar 21902f480046SShri Abhyankar PetscFunctionBegin; 21919566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 219228b400f6SJacob Faibussowitsch PetscCheck(isbinary, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)mat)->type_name); 21939566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqSBAIJ_Binary(mat, viewer)); 21943ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 21952f480046SShri Abhyankar } 21962f480046SShri Abhyankar 2197c75a6043SHong Zhang /*@ 219811a5261eSBarry Smith MatCreateSeqSBAIJWithArrays - Creates an sequential `MATSEQSBAIJ` matrix using matrix elements 2199c75a6043SHong Zhang (upper triangular entries in CSR format) provided by the user. 2200c75a6043SHong Zhang 2201d083f849SBarry Smith Collective 2202c75a6043SHong Zhang 2203c75a6043SHong Zhang Input Parameters: 2204c75a6043SHong Zhang + comm - must be an MPI communicator of size 1 2205c75a6043SHong Zhang . bs - size of block 2206c75a6043SHong Zhang . m - number of rows 2207c75a6043SHong Zhang . n - number of columns 2208483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that row block row of the matrix 2209c75a6043SHong Zhang . j - column indices 2210c75a6043SHong Zhang - a - matrix values 2211c75a6043SHong Zhang 2212c75a6043SHong Zhang Output Parameter: 2213c75a6043SHong Zhang . mat - the matrix 2214c75a6043SHong Zhang 2215dfb205c3SBarry Smith Level: advanced 2216c75a6043SHong Zhang 2217c75a6043SHong Zhang Notes: 22182ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 2219c75a6043SHong Zhang once the matrix is destroyed 2220c75a6043SHong Zhang 2221c75a6043SHong Zhang You cannot set new nonzero locations into this matrix, that will generate an error. 2222c75a6043SHong Zhang 22232ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 2224c75a6043SHong Zhang 22252ef1f0ffSBarry Smith When block size is greater than 1 the matrix values must be stored using the `MATSBAIJ` storage format. For block size of 1 2226dfb205c3SBarry Smith it is the regular CSR format excluding the lower triangular elements. 2227dfb205c3SBarry Smith 22281cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSBAIJ()`, `MatCreateSeqSBAIJ()` 2229c75a6043SHong Zhang @*/ 2230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 2231d71ae5a4SJacob Faibussowitsch { 2232c75a6043SHong Zhang PetscInt ii; 2233c75a6043SHong Zhang Mat_SeqSBAIJ *sbaij; 2234c75a6043SHong Zhang 2235c75a6043SHong Zhang PetscFunctionBegin; 223608401ef6SPierre Jolivet PetscCheck(bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "block size %" PetscInt_FMT " > 1 is not supported yet", bs); 2237aed4548fSBarry Smith PetscCheck(m == 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 2238c75a6043SHong Zhang 22399566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 22409566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 22419566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQSBAIJ)); 22429566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*mat, bs, MAT_SKIP_ALLOCATION, NULL)); 2243c75a6043SHong Zhang sbaij = (Mat_SeqSBAIJ *)(*mat)->data; 22449566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(m, &sbaij->imax, m, &sbaij->ilen)); 2245c75a6043SHong Zhang 2246c75a6043SHong Zhang sbaij->i = i; 2247c75a6043SHong Zhang sbaij->j = j; 2248c75a6043SHong Zhang sbaij->a = a; 224926fbe8dcSKarl Rupp 2250c75a6043SHong Zhang sbaij->singlemalloc = PETSC_FALSE; 2251c75a6043SHong Zhang sbaij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 2252e6b907acSBarry Smith sbaij->free_a = PETSC_FALSE; 2253e6b907acSBarry Smith sbaij->free_ij = PETSC_FALSE; 2254ddf7884eSMatthew Knepley sbaij->free_imax_ilen = PETSC_TRUE; 2255c75a6043SHong Zhang 2256c75a6043SHong Zhang for (ii = 0; ii < m; ii++) { 2257c75a6043SHong Zhang sbaij->ilen[ii] = sbaij->imax[ii] = i[ii + 1] - i[ii]; 22586bdcaf15SBarry Smith PetscCheck(i[ii + 1] >= i[ii], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 2259c75a6043SHong Zhang } 226076bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 2261c75a6043SHong Zhang for (ii = 0; ii < sbaij->i[m]; ii++) { 22626bdcaf15SBarry Smith PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 22636bdcaf15SBarry Smith PetscCheck(j[ii] < n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index too large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 2264c75a6043SHong Zhang } 226576bd3646SJed Brown } 2266c75a6043SHong Zhang 22679566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 22689566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 22693ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2270c75a6043SHong Zhang } 2271d06b337dSHong Zhang 2272d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 2273d71ae5a4SJacob Faibussowitsch { 227459f5e6ceSHong Zhang PetscFunctionBegin; 22759566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm, inmat, n, scall, outmat)); 22763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227759f5e6ceSHong Zhang } 2278