149b5e25fSSatish Balay 249b5e25fSSatish Balay /* 3a1373b80SHong Zhang Defines the basic matrix operations for the SBAIJ (compressed row) 449b5e25fSSatish Balay matrix storage format. 549b5e25fSSatish Balay */ 6c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h> 8c6db04a5SJed Brown #include <petscblaslapack.h> 949b5e25fSSatish Balay 10c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1170dcbbb9SBarry Smith #define USESHORT 12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h> 1370dcbbb9SBarry Smith 1426cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */ 1526cec326SBarry Smith #define TYPE SBAIJ 1626cec326SBarry Smith #define TYPE_SBAIJ 1726cec326SBarry Smith #define TYPE_BS 1826cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 1926cec326SBarry Smith #undef TYPE_BS 2026cec326SBarry Smith #define TYPE_BS _BS 2126cec326SBarry Smith #define TYPE_BS_ON 2226cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h" 2326cec326SBarry Smith #undef TYPE_BS 2426cec326SBarry Smith #undef TYPE_SBAIJ 2526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h" 2626cec326SBarry Smith #undef TYPE 2726cec326SBarry Smith #undef TYPE_BS_ON 2826cec326SBarry Smith 296214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 30cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat, MatType, MatReuse, Mat *); 316214f412SHong Zhang #endif 32d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 33d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *); 34d24d4204SJose E. Roman #endif 3528d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat, MatType, MatReuse, Mat *); 36b5b17502SBarry Smith 3749b5e25fSSatish Balay /* 3849b5e25fSSatish Balay Checks for missing diagonals 3949b5e25fSSatish Balay */ 40d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A, PetscBool *missing, PetscInt *dd) 41d71ae5a4SJacob Faibussowitsch { 42045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 437734d3b5SMatthew G. Knepley PetscInt *diag, *ii = a->i, i; 4449b5e25fSSatish Balay 4549b5e25fSSatish Balay PetscFunctionBegin; 469566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(A)); 472af78befSBarry Smith *missing = PETSC_FALSE; 487734d3b5SMatthew G. Knepley if (A->rmap->n > 0 && !ii) { 49358d2f5dSShri Abhyankar *missing = PETSC_TRUE; 50358d2f5dSShri Abhyankar if (dd) *dd = 0; 519566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n")); 52358d2f5dSShri Abhyankar } else { 53358d2f5dSShri Abhyankar diag = a->diag; 5449b5e25fSSatish Balay for (i = 0; i < a->mbs; i++) { 557734d3b5SMatthew G. Knepley if (diag[i] >= ii[i + 1]) { 562af78befSBarry Smith *missing = PETSC_TRUE; 572af78befSBarry Smith if (dd) *dd = i; 582af78befSBarry Smith break; 592af78befSBarry Smith } 6049b5e25fSSatish Balay } 61358d2f5dSShri Abhyankar } 623ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 6349b5e25fSSatish Balay } 6449b5e25fSSatish Balay 65d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A) 66d71ae5a4SJacob Faibussowitsch { 67045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 6848dd3d27SHong Zhang PetscInt i, j; 6949b5e25fSSatish Balay 7049b5e25fSSatish Balay PetscFunctionBegin; 7109f38230SBarry Smith if (!a->diag) { 729566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->mbs, &a->diag)); 73c760cd28SBarry Smith a->free_diag = PETSC_TRUE; 7409f38230SBarry Smith } 7548dd3d27SHong Zhang for (i = 0; i < a->mbs; i++) { 7648dd3d27SHong Zhang a->diag[i] = a->i[i + 1]; 7748dd3d27SHong Zhang for (j = a->i[i]; j < a->i[i + 1]; j++) { 7848dd3d27SHong Zhang if (a->j[j] == i) { 7948dd3d27SHong Zhang a->diag[i] = j; 8048dd3d27SHong Zhang break; 8148dd3d27SHong Zhang } 8248dd3d27SHong Zhang } 8348dd3d27SHong Zhang } 843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 8549b5e25fSSatish Balay } 8649b5e25fSSatish Balay 87d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *inia[], const PetscInt *inja[], PetscBool *done) 88d71ae5a4SJacob Faibussowitsch { 89a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 902462f5fdSStefano Zampini PetscInt i, j, n = a->mbs, nz = a->i[n], *tia, *tja, bs = A->rmap->bs, k, l, cnt; 912462f5fdSStefano Zampini PetscInt **ia = (PetscInt **)inia, **ja = (PetscInt **)inja; 9249b5e25fSSatish Balay 9349b5e25fSSatish Balay PetscFunctionBegin; 94d3e5a4abSHong Zhang *nn = n; 953ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 962462f5fdSStefano Zampini if (symmetric) { 979566063dSJacob Faibussowitsch PetscCall(MatToSymmetricIJ_SeqAIJ(n, a->i, a->j, PETSC_FALSE, 0, 0, &tia, &tja)); 982462f5fdSStefano Zampini nz = tia[n]; 992462f5fdSStefano Zampini } else { 1009371c9d4SSatish Balay tia = a->i; 1019371c9d4SSatish Balay tja = a->j; 1022462f5fdSStefano Zampini } 1032462f5fdSStefano Zampini 1042462f5fdSStefano Zampini if (!blockcompressed && bs > 1) { 1052462f5fdSStefano Zampini (*nn) *= bs; 1068f7157efSSatish Balay /* malloc & create the natural set of indices */ 1079566063dSJacob Faibussowitsch PetscCall(PetscMalloc1((n + 1) * bs, ia)); 1082462f5fdSStefano Zampini if (n) { 1092462f5fdSStefano Zampini (*ia)[0] = oshift; 110ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[j] = (tia[1] - tia[0]) * bs + (*ia)[j - 1]; 1112462f5fdSStefano Zampini } 1122462f5fdSStefano Zampini 1132462f5fdSStefano Zampini for (i = 1; i < n; i++) { 1142462f5fdSStefano Zampini (*ia)[i * bs] = (tia[i] - tia[i - 1]) * bs + (*ia)[i * bs - 1]; 115ad540459SPierre Jolivet for (j = 1; j < bs; j++) (*ia)[i * bs + j] = (tia[i + 1] - tia[i]) * bs + (*ia)[i * bs + j - 1]; 1162462f5fdSStefano Zampini } 117ad540459SPierre Jolivet if (n) (*ia)[n * bs] = (tia[n] - tia[n - 1]) * bs + (*ia)[n * bs - 1]; 1182462f5fdSStefano Zampini 1192462f5fdSStefano Zampini if (inja) { 1209566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz * bs * bs, ja)); 1212462f5fdSStefano Zampini cnt = 0; 1222462f5fdSStefano Zampini for (i = 0; i < n; i++) { 1238f7157efSSatish Balay for (j = 0; j < bs; j++) { 1242462f5fdSStefano Zampini for (k = tia[i]; k < tia[i + 1]; k++) { 125ad540459SPierre Jolivet for (l = 0; l < bs; l++) (*ja)[cnt++] = bs * tja[k] + l; 1268f7157efSSatish Balay } 1278f7157efSSatish Balay } 1288f7157efSSatish Balay } 1298f7157efSSatish Balay } 1302462f5fdSStefano Zampini 1312462f5fdSStefano Zampini if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */ 1329566063dSJacob Faibussowitsch PetscCall(PetscFree(tia)); 1339566063dSJacob Faibussowitsch PetscCall(PetscFree(tja)); 1342462f5fdSStefano Zampini } 1352462f5fdSStefano Zampini } else if (oshift == 1) { 1362462f5fdSStefano Zampini if (symmetric) { 1372462f5fdSStefano Zampini nz = tia[A->rmap->n / bs]; 1382462f5fdSStefano Zampini /* add 1 to i and j indices */ 1392462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) tia[i] = tia[i] + 1; 1402462f5fdSStefano Zampini *ia = tia; 1412462f5fdSStefano Zampini if (ja) { 1422462f5fdSStefano Zampini for (i = 0; i < nz; i++) tja[i] = tja[i] + 1; 1432462f5fdSStefano Zampini *ja = tja; 1442462f5fdSStefano Zampini } 1452462f5fdSStefano Zampini } else { 1462462f5fdSStefano Zampini nz = a->i[A->rmap->n / bs]; 1472462f5fdSStefano Zampini /* malloc space and add 1 to i and j indices */ 1489566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(A->rmap->n / bs + 1, ia)); 1492462f5fdSStefano Zampini for (i = 0; i < A->rmap->n / bs + 1; i++) (*ia)[i] = a->i[i] + 1; 1502462f5fdSStefano Zampini if (ja) { 1519566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, ja)); 1522462f5fdSStefano Zampini for (i = 0; i < nz; i++) (*ja)[i] = a->j[i] + 1; 1532462f5fdSStefano Zampini } 1542462f5fdSStefano Zampini } 1552462f5fdSStefano Zampini } else { 1562462f5fdSStefano Zampini *ia = tia; 1572462f5fdSStefano Zampini if (ja) *ja = tja; 158a6ece127SHong Zhang } 1593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 16049b5e25fSSatish Balay } 16149b5e25fSSatish Balay 162d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done) 163d71ae5a4SJacob Faibussowitsch { 16449b5e25fSSatish Balay PetscFunctionBegin; 1653ba16761SJacob Faibussowitsch if (!ia) PetscFunctionReturn(PETSC_SUCCESS); 1662462f5fdSStefano Zampini if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) { 1679566063dSJacob Faibussowitsch PetscCall(PetscFree(*ia)); 1689566063dSJacob Faibussowitsch if (ja) PetscCall(PetscFree(*ja)); 169a6ece127SHong Zhang } 1703ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17149b5e25fSSatish Balay } 17249b5e25fSSatish Balay 173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqSBAIJ(Mat A) 174d71ae5a4SJacob Faibussowitsch { 17549b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 17649b5e25fSSatish Balay 17749b5e25fSSatish Balay PetscFunctionBegin; 178b4e2f619SBarry Smith if (A->hash_active) { 179b4e2f619SBarry Smith PetscInt bs; 180e3c72094SPierre Jolivet A->ops[0] = a->cops; 181b4e2f619SBarry Smith PetscCall(PetscHMapIJVDestroy(&a->ht)); 182b4e2f619SBarry Smith PetscCall(MatGetBlockSize(A, &bs)); 183b4e2f619SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&a->bht)); 184b4e2f619SBarry Smith PetscCall(PetscFree(a->dnz)); 185b4e2f619SBarry Smith PetscCall(PetscFree(a->bdnz)); 186b4e2f619SBarry Smith A->hash_active = PETSC_FALSE; 187b4e2f619SBarry Smith } 188a9f03627SSatish Balay #if defined(PETSC_USE_LOG) 1893ba16761SJacob Faibussowitsch PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->N, a->nz)); 190a9f03627SSatish Balay #endif 1919566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i)); 1929566063dSJacob Faibussowitsch if (a->free_diag) PetscCall(PetscFree(a->diag)); 1939566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 1949566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 1959566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->icol)); 1969566063dSJacob Faibussowitsch PetscCall(PetscFree(a->idiag)); 1979566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inode.size)); 1989566063dSJacob Faibussowitsch if (a->free_imax_ilen) PetscCall(PetscFree2(a->imax, a->ilen)); 1999566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solve_work)); 2009566063dSJacob Faibussowitsch PetscCall(PetscFree(a->sor_work)); 2019566063dSJacob Faibussowitsch PetscCall(PetscFree(a->solves_work)); 2029566063dSJacob Faibussowitsch PetscCall(PetscFree(a->mult_work)); 2039566063dSJacob Faibussowitsch PetscCall(PetscFree(a->saved_values)); 2049566063dSJacob Faibussowitsch if (a->free_jshort) PetscCall(PetscFree(a->jshort)); 2059566063dSJacob Faibussowitsch PetscCall(PetscFree(a->inew)); 2069566063dSJacob Faibussowitsch PetscCall(MatDestroy(&a->parent)); 2079566063dSJacob Faibussowitsch PetscCall(PetscFree(A->data)); 208901853e0SKris Buschelman 2099566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL)); 2102e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJGetArray_C", NULL)); 2112e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJRestoreArray_C", NULL)); 2129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL)); 2139566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL)); 2149566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetColumnIndices_C", NULL)); 2159566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqaij_C", NULL)); 2169566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqbaij_C", NULL)); 2179566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocation_C", NULL)); 2189566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocationCSR_C", NULL)); 2196214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 2209566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_elemental_C", NULL)); 2216214f412SHong Zhang #endif 222d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 2239566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_scalapack_C", NULL)); 224d24d4204SJose E. Roman #endif 2252e956fe4SStefano Zampini PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL)); 2263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 22749b5e25fSSatish Balay } 22849b5e25fSSatish Balay 229d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqSBAIJ(Mat A, MatOption op, PetscBool flg) 230d71ae5a4SJacob Faibussowitsch { 231045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 232eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 233eb1ec7c1SStefano Zampini PetscInt bs; 234eb1ec7c1SStefano Zampini #endif 23549b5e25fSSatish Balay 23649b5e25fSSatish Balay PetscFunctionBegin; 237eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 2389566063dSJacob Faibussowitsch PetscCall(MatGetBlockSize(A, &bs)); 239eb1ec7c1SStefano Zampini #endif 2404d9d31abSKris Buschelman switch (op) { 241d71ae5a4SJacob Faibussowitsch case MAT_ROW_ORIENTED: 242d71ae5a4SJacob Faibussowitsch a->roworiented = flg; 243d71ae5a4SJacob Faibussowitsch break; 244d71ae5a4SJacob Faibussowitsch case MAT_KEEP_NONZERO_PATTERN: 245d71ae5a4SJacob Faibussowitsch a->keepnonzeropattern = flg; 246d71ae5a4SJacob Faibussowitsch break; 247d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATIONS: 248d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? 0 : 1); 249d71ae5a4SJacob Faibussowitsch break; 250d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_LOCATION_ERR: 251d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -1 : 0); 252d71ae5a4SJacob Faibussowitsch break; 253d71ae5a4SJacob Faibussowitsch case MAT_NEW_NONZERO_ALLOCATION_ERR: 254d71ae5a4SJacob Faibussowitsch a->nonew = (flg ? -2 : 0); 255d71ae5a4SJacob Faibussowitsch break; 256d71ae5a4SJacob Faibussowitsch case MAT_UNUSED_NONZERO_LOCATION_ERR: 257d71ae5a4SJacob Faibussowitsch a->nounused = (flg ? -1 : 0); 258d71ae5a4SJacob Faibussowitsch break; 2598c78258cSHong Zhang case MAT_FORCE_DIAGONAL_ENTRIES: 2604d9d31abSKris Buschelman case MAT_IGNORE_OFF_PROC_ENTRIES: 2614d9d31abSKris Buschelman case MAT_USE_HASH_TABLE: 262d71ae5a4SJacob Faibussowitsch case MAT_SORTED_FULL: 263d71ae5a4SJacob Faibussowitsch PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op])); 264d71ae5a4SJacob Faibussowitsch break; 2659a4540c5SBarry Smith case MAT_HERMITIAN: 266eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 267eb1ec7c1SStefano Zampini if (flg) { /* disable transpose ops */ 26808401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for Hermitian with block size greater than 1"); 269eb1ec7c1SStefano Zampini A->ops->multtranspose = NULL; 270eb1ec7c1SStefano Zampini A->ops->multtransposeadd = NULL; 271b94d7dedSBarry Smith A->symmetric = PETSC_BOOL3_FALSE; 272eb1ec7c1SStefano Zampini } 2730f2140c7SStefano Zampini #endif 274eeffb40dSHong Zhang break; 27577e54ba9SKris Buschelman case MAT_SYMMETRIC: 276eb1ec7c1SStefano Zampini case MAT_SPD: 277eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 278eb1ec7c1SStefano Zampini if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */ 279eb1ec7c1SStefano Zampini A->ops->multtranspose = A->ops->mult; 280eb1ec7c1SStefano Zampini A->ops->multtransposeadd = A->ops->multadd; 281eb1ec7c1SStefano Zampini } 282eb1ec7c1SStefano Zampini #endif 283eb1ec7c1SStefano Zampini break; 284eb1ec7c1SStefano Zampini /* These options are handled directly by MatSetOption() */ 28577e54ba9SKris Buschelman case MAT_STRUCTURALLY_SYMMETRIC: 2869a4540c5SBarry Smith case MAT_SYMMETRY_ETERNAL: 287b94d7dedSBarry Smith case MAT_STRUCTURAL_SYMMETRY_ETERNAL: 288672ba085SHong Zhang case MAT_STRUCTURE_ONLY: 289b94d7dedSBarry Smith case MAT_SPD_ETERNAL: 2904dcd73b1SHong Zhang /* These options are handled directly by MatSetOption() */ 291290bbb0aSBarry Smith break; 292d71ae5a4SJacob Faibussowitsch case MAT_IGNORE_LOWER_TRIANGULAR: 293d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 294d71ae5a4SJacob Faibussowitsch break; 295d71ae5a4SJacob Faibussowitsch case MAT_ERROR_LOWER_TRIANGULAR: 296d71ae5a4SJacob Faibussowitsch a->ignore_ltriangular = flg; 297d71ae5a4SJacob Faibussowitsch break; 298d71ae5a4SJacob Faibussowitsch case MAT_GETROW_UPPERTRIANGULAR: 299d71ae5a4SJacob Faibussowitsch a->getrow_utriangular = flg; 300d71ae5a4SJacob Faibussowitsch break; 301d71ae5a4SJacob Faibussowitsch case MAT_SUBMAT_SINGLEIS: 302d71ae5a4SJacob Faibussowitsch break; 303d71ae5a4SJacob Faibussowitsch default: 304d71ae5a4SJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op); 30549b5e25fSSatish Balay } 3063ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 30749b5e25fSSatish Balay } 30849b5e25fSSatish Balay 309d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 310d71ae5a4SJacob Faibussowitsch { 31149b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 31249b5e25fSSatish Balay 31349b5e25fSSatish Balay PetscFunctionBegin; 31408401ef6SPierre Jolivet PetscCheck(!A || a->getrow_utriangular, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatGetRow is not supported for SBAIJ matrix format. Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()"); 31552768537SHong Zhang 316f5edf698SHong Zhang /* Get the upper triangular part of the row */ 3179566063dSJacob Faibussowitsch PetscCall(MatGetRow_SeqBAIJ_private(A, row, nz, idx, v, a->i, a->j, a->a)); 3183ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 31949b5e25fSSatish Balay } 32049b5e25fSSatish Balay 321d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v) 322d71ae5a4SJacob Faibussowitsch { 32349b5e25fSSatish Balay PetscFunctionBegin; 324cb4a9cd9SHong Zhang if (nz) *nz = 0; 3259566063dSJacob Faibussowitsch if (idx) PetscCall(PetscFree(*idx)); 3269566063dSJacob Faibussowitsch if (v) PetscCall(PetscFree(*v)); 3273ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 32849b5e25fSSatish Balay } 32949b5e25fSSatish Balay 330d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A) 331d71ae5a4SJacob Faibussowitsch { 332f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 333f5edf698SHong Zhang 334f5edf698SHong Zhang PetscFunctionBegin; 335f5edf698SHong Zhang a->getrow_utriangular = PETSC_TRUE; 3363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 337f5edf698SHong Zhang } 338a323099bSStefano Zampini 339d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A) 340d71ae5a4SJacob Faibussowitsch { 341f5edf698SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 342f5edf698SHong Zhang 343f5edf698SHong Zhang PetscFunctionBegin; 344f5edf698SHong Zhang a->getrow_utriangular = PETSC_FALSE; 3453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 346f5edf698SHong Zhang } 347f5edf698SHong Zhang 348d71ae5a4SJacob Faibussowitsch PetscErrorCode MatTranspose_SeqSBAIJ(Mat A, MatReuse reuse, Mat *B) 349d71ae5a4SJacob Faibussowitsch { 35049b5e25fSSatish Balay PetscFunctionBegin; 3517fb60732SBarry Smith if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B)); 352cf37664fSBarry Smith if (reuse == MAT_INITIAL_MATRIX) { 3539566063dSJacob Faibussowitsch PetscCall(MatDuplicate(A, MAT_COPY_VALUES, B)); 354cf37664fSBarry Smith } else if (reuse == MAT_REUSE_MATRIX) { 3559566063dSJacob Faibussowitsch PetscCall(MatCopy(A, *B, SAME_NONZERO_PATTERN)); 356fc4dec0aSBarry Smith } 3573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 35849b5e25fSSatish Balay } 35949b5e25fSSatish Balay 360d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A, PetscViewer viewer) 361d71ae5a4SJacob Faibussowitsch { 36249b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 363d0f46423SBarry Smith PetscInt i, j, bs = A->rmap->bs, k, l, bs2 = a->bs2; 364f3ef73ceSBarry Smith PetscViewerFormat format; 365121deb67SSatish Balay PetscInt *diag; 366b3a0534dSBarry Smith const char *matname; 36749b5e25fSSatish Balay 36849b5e25fSSatish Balay PetscFunctionBegin; 3699566063dSJacob Faibussowitsch PetscCall(PetscViewerGetFormat(viewer, &format)); 370456192e2SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) { 3719566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " block size is %" PetscInt_FMT "\n", bs)); 372fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_MATLAB) { 373d2507d54SMatthew Knepley Mat aij; 374ade3a672SBarry Smith 375d5f3da31SBarry Smith if (A->factortype && bs > 1) { 3769566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "Warning: matrix is factored with bs>1. MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n")); 3773ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 37870d5e725SHong Zhang } 3799566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &aij)); 38023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 38123a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)aij, matname)); 38223a3927dSBarry Smith PetscCall(MatView_SeqAIJ(aij, viewer)); 3839566063dSJacob Faibussowitsch PetscCall(MatDestroy(&aij)); 384fb9695e5SSatish Balay } else if (format == PETSC_VIEWER_ASCII_COMMON) { 385b3a0534dSBarry Smith Mat B; 386b3a0534dSBarry Smith 387b3a0534dSBarry Smith PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 388b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 389b3a0534dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 390b3a0534dSBarry Smith PetscCall(MatView_SeqAIJ(B, viewer)); 391b3a0534dSBarry Smith PetscCall(MatDestroy(&B)); 392c1490034SHong Zhang } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) { 3933ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 39449b5e25fSSatish Balay } else { 3959566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE)); 3962c990fa1SHong Zhang if (A->factortype) { /* for factored matrix */ 39708401ef6SPierre Jolivet PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "matrix is factored with bs>1. Not implemented yet"); 3982c990fa1SHong Zhang 399121deb67SSatish Balay diag = a->diag; 400121deb67SSatish Balay for (i = 0; i < a->mbs; i++) { /* for row block i */ 4019566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i)); 4022c990fa1SHong Zhang /* diagonal entry */ 4032c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 4042c990fa1SHong Zhang if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) { 4059566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), (double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 4062c990fa1SHong Zhang } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) { 4079566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), -(double)PetscImaginaryPart(1.0 / a->a[diag[i]]))); 4082c990fa1SHong Zhang } else { 4099566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]))); 4102c990fa1SHong Zhang } 4112c990fa1SHong Zhang #else 4129566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)(1.0 / a->a[diag[i]]))); 4132c990fa1SHong Zhang #endif 4142c990fa1SHong Zhang /* off-diagonal entries */ 4152c990fa1SHong Zhang for (k = a->i[i]; k < a->i[i + 1] - 1; k++) { 4162c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX) 417ca0704adSBarry Smith if (PetscImaginaryPart(a->a[k]) > 0.0) { 4189566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), (double)PetscImaginaryPart(a->a[k]))); 419ca0704adSBarry Smith } else if (PetscImaginaryPart(a->a[k]) < 0.0) { 4209566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), -(double)PetscImaginaryPart(a->a[k]))); 4212c990fa1SHong Zhang } else { 4229566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k], (double)PetscRealPart(a->a[k]))); 4232c990fa1SHong Zhang } 4242c990fa1SHong Zhang #else 4259566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[k], (double)a->a[k])); 4262c990fa1SHong Zhang #endif 4272c990fa1SHong Zhang } 4289566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 4292c990fa1SHong Zhang } 4302c990fa1SHong Zhang 4312c990fa1SHong Zhang } else { /* for non-factored matrix */ 4320c74a584SJed Brown for (i = 0; i < a->mbs; i++) { /* for row block i */ 4330c74a584SJed Brown for (j = 0; j < bs; j++) { /* for row bs*i + j */ 4349566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i * bs + j)); 4350c74a584SJed Brown for (k = a->i[i]; k < a->i[i + 1]; k++) { /* for column block */ 4360c74a584SJed Brown for (l = 0; l < bs; l++) { /* for column */ 43749b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX) 43849b5e25fSSatish Balay if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) > 0.0) { 4399371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), (double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 44049b5e25fSSatish Balay } else if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) < 0.0) { 4419371c9d4SSatish Balay PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), -(double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j]))); 44249b5e25fSSatish Balay } else { 4439566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]))); 44449b5e25fSSatish Balay } 44549b5e25fSSatish Balay #else 4469566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)a->a[bs2 * k + l * bs + j])); 44749b5e25fSSatish Balay #endif 44849b5e25fSSatish Balay } 44949b5e25fSSatish Balay } 4509566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIPrintf(viewer, "\n")); 45149b5e25fSSatish Balay } 45249b5e25fSSatish Balay } 4532c990fa1SHong Zhang } 4549566063dSJacob Faibussowitsch PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE)); 45549b5e25fSSatish Balay } 4569566063dSJacob Faibussowitsch PetscCall(PetscViewerFlush(viewer)); 4573ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 45849b5e25fSSatish Balay } 45949b5e25fSSatish Balay 4609804daf3SBarry Smith #include <petscdraw.h> 461d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw, void *Aa) 462d71ae5a4SJacob Faibussowitsch { 46349b5e25fSSatish Balay Mat A = (Mat)Aa; 46449b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 465d0f46423SBarry Smith PetscInt row, i, j, k, l, mbs = a->mbs, color, bs = A->rmap->bs, bs2 = a->bs2; 46649b5e25fSSatish Balay PetscReal xl, yl, xr, yr, x_l, x_r, y_l, y_r; 46749b5e25fSSatish Balay MatScalar *aa; 468b0a32e0cSBarry Smith PetscViewer viewer; 46949b5e25fSSatish Balay 47049b5e25fSSatish Balay PetscFunctionBegin; 4719566063dSJacob Faibussowitsch PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer)); 4729566063dSJacob Faibussowitsch PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr)); 47349b5e25fSSatish Balay 47449b5e25fSSatish Balay /* loop over matrix elements drawing boxes */ 475383922c3SLisandro Dalcin 476d0609cedSBarry Smith PetscDrawCollectiveBegin(draw); 4779566063dSJacob Faibussowitsch PetscCall(PetscDrawString(draw, .3 * (xl + xr), .3 * (yl + yr), PETSC_DRAW_BLACK, "symmetric")); 478383922c3SLisandro Dalcin /* Blue for negative, Cyan for zero and Red for positive */ 479b0a32e0cSBarry Smith color = PETSC_DRAW_BLUE; 48049b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 48149b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4829371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4839371c9d4SSatish Balay y_r = y_l + 1.0; 4849371c9d4SSatish Balay x_l = a->j[j] * bs; 4859371c9d4SSatish Balay x_r = x_l + 1.0; 48649b5e25fSSatish Balay aa = a->a + j * bs2; 48749b5e25fSSatish Balay for (k = 0; k < bs; k++) { 48849b5e25fSSatish Balay for (l = 0; l < bs; l++) { 48949b5e25fSSatish Balay if (PetscRealPart(*aa++) >= 0.) continue; 4909566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 49149b5e25fSSatish Balay } 49249b5e25fSSatish Balay } 49349b5e25fSSatish Balay } 49449b5e25fSSatish Balay } 495b0a32e0cSBarry Smith color = PETSC_DRAW_CYAN; 49649b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 49749b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 4989371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 4999371c9d4SSatish Balay y_r = y_l + 1.0; 5009371c9d4SSatish Balay x_l = a->j[j] * bs; 5019371c9d4SSatish Balay x_r = x_l + 1.0; 50249b5e25fSSatish Balay aa = a->a + j * bs2; 50349b5e25fSSatish Balay for (k = 0; k < bs; k++) { 50449b5e25fSSatish Balay for (l = 0; l < bs; l++) { 50549b5e25fSSatish Balay if (PetscRealPart(*aa++) != 0.) continue; 5069566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 50749b5e25fSSatish Balay } 50849b5e25fSSatish Balay } 50949b5e25fSSatish Balay } 51049b5e25fSSatish Balay } 511b0a32e0cSBarry Smith color = PETSC_DRAW_RED; 51249b5e25fSSatish Balay for (i = 0, row = 0; i < mbs; i++, row += bs) { 51349b5e25fSSatish Balay for (j = a->i[i]; j < a->i[i + 1]; j++) { 5149371c9d4SSatish Balay y_l = A->rmap->N - row - 1.0; 5159371c9d4SSatish Balay y_r = y_l + 1.0; 5169371c9d4SSatish Balay x_l = a->j[j] * bs; 5179371c9d4SSatish Balay x_r = x_l + 1.0; 51849b5e25fSSatish Balay aa = a->a + j * bs2; 51949b5e25fSSatish Balay for (k = 0; k < bs; k++) { 52049b5e25fSSatish Balay for (l = 0; l < bs; l++) { 52149b5e25fSSatish Balay if (PetscRealPart(*aa++) <= 0.) continue; 5229566063dSJacob Faibussowitsch PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color)); 52349b5e25fSSatish Balay } 52449b5e25fSSatish Balay } 52549b5e25fSSatish Balay } 52649b5e25fSSatish Balay } 527d0609cedSBarry Smith PetscDrawCollectiveEnd(draw); 5283ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 52949b5e25fSSatish Balay } 53049b5e25fSSatish Balay 531d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A, PetscViewer viewer) 532d71ae5a4SJacob Faibussowitsch { 53349b5e25fSSatish Balay PetscReal xl, yl, xr, yr, w, h; 534b0a32e0cSBarry Smith PetscDraw draw; 535ace3abfcSBarry Smith PetscBool isnull; 53649b5e25fSSatish Balay 53749b5e25fSSatish Balay PetscFunctionBegin; 5389566063dSJacob Faibussowitsch PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw)); 5399566063dSJacob Faibussowitsch PetscCall(PetscDrawIsNull(draw, &isnull)); 5403ba16761SJacob Faibussowitsch if (isnull) PetscFunctionReturn(PETSC_SUCCESS); 54149b5e25fSSatish Balay 5429371c9d4SSatish Balay xr = A->rmap->N; 5439371c9d4SSatish Balay yr = A->rmap->N; 5449371c9d4SSatish Balay h = yr / 10.0; 5459371c9d4SSatish Balay w = xr / 10.0; 5469371c9d4SSatish Balay xr += w; 5479371c9d4SSatish Balay yr += h; 5489371c9d4SSatish Balay xl = -w; 5499371c9d4SSatish Balay yl = -h; 5509566063dSJacob Faibussowitsch PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr)); 5519566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer)); 5529566063dSJacob Faibussowitsch PetscCall(PetscDrawZoom(draw, MatView_SeqSBAIJ_Draw_Zoom, A)); 5539566063dSJacob Faibussowitsch PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL)); 5549566063dSJacob Faibussowitsch PetscCall(PetscDrawSave(draw)); 5553ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 55649b5e25fSSatish Balay } 55749b5e25fSSatish Balay 558618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */ 559618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary 560618cc2edSLisandro Dalcin 561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ(Mat A, PetscViewer viewer) 562d71ae5a4SJacob Faibussowitsch { 563618cc2edSLisandro Dalcin PetscBool iascii, isbinary, isdraw; 56449b5e25fSSatish Balay 56549b5e25fSSatish Balay PetscFunctionBegin; 5669566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii)); 5679566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 5689566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw)); 56932077d6dSBarry Smith if (iascii) { 5709566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_ASCII(A, viewer)); 571618cc2edSLisandro Dalcin } else if (isbinary) { 5729566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Binary(A, viewer)); 57349b5e25fSSatish Balay } else if (isdraw) { 5749566063dSJacob Faibussowitsch PetscCall(MatView_SeqSBAIJ_Draw(A, viewer)); 57549b5e25fSSatish Balay } else { 576a5e6ed63SBarry Smith Mat B; 577ade3a672SBarry Smith const char *matname; 5789566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B)); 57923a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname)); 58023a3927dSBarry Smith if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname)); 5819566063dSJacob Faibussowitsch PetscCall(MatView(B, viewer)); 5829566063dSJacob Faibussowitsch PetscCall(MatDestroy(&B)); 58349b5e25fSSatish Balay } 5843ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 58549b5e25fSSatish Balay } 58649b5e25fSSatish Balay 587d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[]) 588d71ae5a4SJacob Faibussowitsch { 589045c9aa0SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 59013f74950SBarry Smith PetscInt *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j; 59113f74950SBarry Smith PetscInt *ai = a->i, *ailen = a->ilen; 592d0f46423SBarry Smith PetscInt brow, bcol, ridx, cidx, bs = A->rmap->bs, bs2 = a->bs2; 59397e567efSBarry Smith MatScalar *ap, *aa = a->a; 59449b5e25fSSatish Balay 59549b5e25fSSatish Balay PetscFunctionBegin; 59649b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over rows */ 5979371c9d4SSatish Balay row = im[k]; 5989371c9d4SSatish Balay brow = row / bs; 5999371c9d4SSatish Balay if (row < 0) { 6009371c9d4SSatish Balay v += n; 6019371c9d4SSatish Balay continue; 6029371c9d4SSatish Balay } /* negative row */ 60354c59aa7SJacob Faibussowitsch PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 6049371c9d4SSatish Balay rp = aj + ai[brow]; 6059371c9d4SSatish Balay ap = aa + bs2 * ai[brow]; 60649b5e25fSSatish Balay nrow = ailen[brow]; 60749b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over columns */ 6089371c9d4SSatish Balay if (in[l] < 0) { 6099371c9d4SSatish Balay v++; 6109371c9d4SSatish Balay continue; 6119371c9d4SSatish Balay } /* negative column */ 61254c59aa7SJacob Faibussowitsch PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1); 61349b5e25fSSatish Balay col = in[l]; 61449b5e25fSSatish Balay bcol = col / bs; 61549b5e25fSSatish Balay cidx = col % bs; 61649b5e25fSSatish Balay ridx = row % bs; 61749b5e25fSSatish Balay high = nrow; 61849b5e25fSSatish Balay low = 0; /* assume unsorted */ 61949b5e25fSSatish Balay while (high - low > 5) { 62049b5e25fSSatish Balay t = (low + high) / 2; 62149b5e25fSSatish Balay if (rp[t] > bcol) high = t; 62249b5e25fSSatish Balay else low = t; 62349b5e25fSSatish Balay } 62449b5e25fSSatish Balay for (i = low; i < high; i++) { 62549b5e25fSSatish Balay if (rp[i] > bcol) break; 62649b5e25fSSatish Balay if (rp[i] == bcol) { 62749b5e25fSSatish Balay *v++ = ap[bs2 * i + bs * cidx + ridx]; 62849b5e25fSSatish Balay goto finished; 62949b5e25fSSatish Balay } 63049b5e25fSSatish Balay } 63197e567efSBarry Smith *v++ = 0.0; 63249b5e25fSSatish Balay finished:; 63349b5e25fSSatish Balay } 63449b5e25fSSatish Balay } 6353ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 63649b5e25fSSatish Balay } 63749b5e25fSSatish Balay 638d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqSBAIJ(Mat A, IS rowp, IS colp, Mat *B) 639d71ae5a4SJacob Faibussowitsch { 640dc29a518SPierre Jolivet Mat C; 641dc29a518SPierre Jolivet 642dc29a518SPierre Jolivet PetscFunctionBegin; 6439566063dSJacob Faibussowitsch PetscCall(MatConvert(A, MATSEQBAIJ, MAT_INITIAL_MATRIX, &C)); 6449566063dSJacob Faibussowitsch PetscCall(MatPermute(C, rowp, colp, B)); 6459566063dSJacob Faibussowitsch PetscCall(MatDestroy(&C)); 64648a46eb9SPierre Jolivet if (rowp == colp) PetscCall(MatConvert(*B, MATSEQSBAIJ, MAT_INPLACE_MATRIX, B)); 6473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 648dc29a518SPierre Jolivet } 64949b5e25fSSatish Balay 650d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 651d71ae5a4SJacob Faibussowitsch { 6520880e062SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 653e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, jj, row, nrow, i, col, l, rmax, N, lastcol = -1; 65413f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen; 655d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs2 = a->bs2, bs = A->rmap->bs, stepval; 656ace3abfcSBarry Smith PetscBool roworiented = a->roworiented; 657dd6ea824SBarry Smith const PetscScalar *value = v; 658f15d580aSBarry Smith MatScalar *ap, *aa = a->a, *bap; 6590880e062SHong Zhang 66049b5e25fSSatish Balay PetscFunctionBegin; 66126fbe8dcSKarl Rupp if (roworiented) stepval = (n - 1) * bs; 66226fbe8dcSKarl Rupp else stepval = (m - 1) * bs; 66326fbe8dcSKarl Rupp 6640880e062SHong Zhang for (k = 0; k < m; k++) { /* loop over added rows */ 6650880e062SHong Zhang row = im[k]; 6660880e062SHong Zhang if (row < 0) continue; 6676bdcaf15SBarry Smith PetscCheck(row < a->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index row too large %" PetscInt_FMT " max %" PetscInt_FMT, row, a->mbs - 1); 6680880e062SHong Zhang rp = aj + ai[row]; 6690880e062SHong Zhang ap = aa + bs2 * ai[row]; 6700880e062SHong Zhang rmax = imax[row]; 6710880e062SHong Zhang nrow = ailen[row]; 6720880e062SHong Zhang low = 0; 673818f2c47SBarry Smith high = nrow; 6740880e062SHong Zhang for (l = 0; l < n; l++) { /* loop over added columns */ 6750880e062SHong Zhang if (in[l] < 0) continue; 6760880e062SHong Zhang col = in[l]; 6776bdcaf15SBarry Smith PetscCheck(col < a->nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index column too large %" PetscInt_FMT " max %" PetscInt_FMT, col, a->nbs - 1); 678b98bf0e1SJed Brown if (col < row) { 67926fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular block */ 68026fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 681b98bf0e1SJed Brown } 68226fbe8dcSKarl Rupp if (roworiented) value = v + k * (stepval + bs) * bs + l * bs; 68326fbe8dcSKarl Rupp else value = v + l * (stepval + bs) * bs + k * bs; 68426fbe8dcSKarl Rupp 68526fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 68626fbe8dcSKarl Rupp else high = nrow; 68726fbe8dcSKarl Rupp 688e2ee6c50SBarry Smith lastcol = col; 6890880e062SHong Zhang while (high - low > 7) { 6900880e062SHong Zhang t = (low + high) / 2; 6910880e062SHong Zhang if (rp[t] > col) high = t; 6920880e062SHong Zhang else low = t; 6930880e062SHong Zhang } 6940880e062SHong Zhang for (i = low; i < high; i++) { 6950880e062SHong Zhang if (rp[i] > col) break; 6960880e062SHong Zhang if (rp[i] == col) { 6970880e062SHong Zhang bap = ap + bs2 * i; 6980880e062SHong Zhang if (roworiented) { 6990880e062SHong Zhang if (is == ADD_VALUES) { 7000880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 701ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] += *value++; 7020880e062SHong Zhang } 7030880e062SHong Zhang } else { 7040880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 705ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7060880e062SHong Zhang } 7070880e062SHong Zhang } 7080880e062SHong Zhang } else { 7090880e062SHong Zhang if (is == ADD_VALUES) { 7100880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 711ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ += *value++; 7120880e062SHong Zhang } 7130880e062SHong Zhang } else { 7140880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 715ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7160880e062SHong Zhang } 7170880e062SHong Zhang } 7180880e062SHong Zhang } 7190880e062SHong Zhang goto noinsert2; 7200880e062SHong Zhang } 7210880e062SHong Zhang } 7220880e062SHong Zhang if (nonew == 1) goto noinsert2; 72308401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new block index nonzero block (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 724fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 7259371c9d4SSatish Balay N = nrow++ - 1; 7269371c9d4SSatish Balay high++; 7270880e062SHong Zhang /* shift up all the later entries in this row */ 7289566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 7299566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 7309566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 7310880e062SHong Zhang rp[i] = col; 7320880e062SHong Zhang bap = ap + bs2 * i; 7330880e062SHong Zhang if (roworiented) { 7340880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 735ad540459SPierre Jolivet for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++; 7360880e062SHong Zhang } 7370880e062SHong Zhang } else { 7380880e062SHong Zhang for (ii = 0; ii < bs; ii++, value += stepval) { 739ad540459SPierre Jolivet for (jj = 0; jj < bs; jj++) *bap++ = *value++; 7400880e062SHong Zhang } 7410880e062SHong Zhang } 7420880e062SHong Zhang noinsert2:; 7430880e062SHong Zhang low = i; 7440880e062SHong Zhang } 7450880e062SHong Zhang ailen[row] = nrow; 7460880e062SHong Zhang } 7473ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 74849b5e25fSSatish Balay } 74949b5e25fSSatish Balay 750d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A, MatAssemblyType mode) 751d71ae5a4SJacob Faibussowitsch { 75249b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 7538f8f2f0dSBarry Smith PetscInt fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax; 754d0f46423SBarry Smith PetscInt m = A->rmap->N, *ip, N, *ailen = a->ilen; 75513f74950SBarry Smith PetscInt mbs = a->mbs, bs2 = a->bs2, rmax = 0; 75649b5e25fSSatish Balay MatScalar *aa = a->a, *ap; 75749b5e25fSSatish Balay 75849b5e25fSSatish Balay PetscFunctionBegin; 759*d32568d8SPierre Jolivet if (mode == MAT_FLUSH_ASSEMBLY || (A->was_assembled && A->ass_nonzerostate == A->nonzerostate)) PetscFunctionReturn(PETSC_SUCCESS); 76049b5e25fSSatish Balay 76149b5e25fSSatish Balay if (m) rmax = ailen[0]; 76249b5e25fSSatish Balay for (i = 1; i < mbs; i++) { 76349b5e25fSSatish Balay /* move each row back by the amount of empty slots (fshift) before it*/ 76449b5e25fSSatish Balay fshift += imax[i - 1] - ailen[i - 1]; 76549b5e25fSSatish Balay rmax = PetscMax(rmax, ailen[i]); 76649b5e25fSSatish Balay if (fshift) { 767580bdb30SBarry Smith ip = aj + ai[i]; 768580bdb30SBarry Smith ap = aa + bs2 * ai[i]; 76949b5e25fSSatish Balay N = ailen[i]; 7709566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ip - fshift, ip, N)); 7719566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2 * N)); 77249b5e25fSSatish Balay } 77349b5e25fSSatish Balay ai[i] = ai[i - 1] + ailen[i - 1]; 77449b5e25fSSatish Balay } 77549b5e25fSSatish Balay if (mbs) { 77649b5e25fSSatish Balay fshift += imax[mbs - 1] - ailen[mbs - 1]; 77749b5e25fSSatish Balay ai[mbs] = ai[mbs - 1] + ailen[mbs - 1]; 77849b5e25fSSatish Balay } 77949b5e25fSSatish Balay /* reset ilen and imax for each row */ 780ad540459SPierre Jolivet for (i = 0; i < mbs; i++) ailen[i] = imax[i] = ai[i + 1] - ai[i]; 7816c6c5352SBarry Smith a->nz = ai[mbs]; 78249b5e25fSSatish Balay 783b424e231SHong Zhang /* diagonals may have moved, reset it */ 7841baa6e33SBarry Smith if (a->diag) PetscCall(PetscArraycpy(a->diag, ai, mbs)); 785aed4548fSBarry Smith PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT " block size %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, A->rmap->bs, fshift * bs2); 78626fbe8dcSKarl Rupp 7879566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT ", block size %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->rmap->N, A->rmap->bs, fshift * bs2, a->nz * bs2)); 7889566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues is %" PetscInt_FMT "\n", a->reallocs)); 7899566063dSJacob Faibussowitsch PetscCall(PetscInfo(A, "Most nonzeros blocks in any row is %" PetscInt_FMT "\n", rmax)); 79026fbe8dcSKarl Rupp 7918e58a170SBarry Smith A->info.mallocs += a->reallocs; 79249b5e25fSSatish Balay a->reallocs = 0; 79349b5e25fSSatish Balay A->info.nz_unneeded = (PetscReal)fshift * bs2; 794061b2667SBarry Smith a->idiagvalid = PETSC_FALSE; 7954dcd73b1SHong Zhang a->rmax = rmax; 79638702af4SBarry Smith 79738702af4SBarry Smith if (A->cmap->n < 65536 && A->cmap->bs == 1) { 79844e1c64aSLisandro Dalcin if (a->jshort && a->free_jshort) { 79917803ae8SHong Zhang /* when matrix data structure is changed, previous jshort must be replaced */ 8009566063dSJacob Faibussowitsch PetscCall(PetscFree(a->jshort)); 80117803ae8SHong Zhang } 8029566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(a->i[A->rmap->n], &a->jshort)); 80338702af4SBarry Smith for (i = 0; i < a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i]; 80438702af4SBarry Smith A->ops->mult = MatMult_SeqSBAIJ_1_ushort; 80541f059aeSBarry Smith A->ops->sor = MatSOR_SeqSBAIJ_ushort; 8064da8f245SBarry Smith a->free_jshort = PETSC_TRUE; 80738702af4SBarry Smith } 8083ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 80949b5e25fSSatish Balay } 81049b5e25fSSatish Balay 81149b5e25fSSatish Balay /* 81249b5e25fSSatish Balay This function returns an array of flags which indicate the locations of contiguous 81349b5e25fSSatish Balay blocks that should be zeroed. for eg: if bs = 3 and is = [0,1,2,3,5,6,7,8,9] 814a5b23f4aSJose E. Roman then the resulting sizes = [3,1,1,3,1] corresponding to sets [(0,1,2),(3),(5),(6,7,8),(9)] 81549b5e25fSSatish Balay Assume: sizes should be long enough to hold all the values. 81649b5e25fSSatish Balay */ 817d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqSBAIJ_Check_Blocks(PetscInt idx[], PetscInt n, PetscInt bs, PetscInt sizes[], PetscInt *bs_max) 818d71ae5a4SJacob Faibussowitsch { 81913f74950SBarry Smith PetscInt i, j, k, row; 820ace3abfcSBarry Smith PetscBool flg; 82149b5e25fSSatish Balay 82249b5e25fSSatish Balay PetscFunctionBegin; 82349b5e25fSSatish Balay for (i = 0, j = 0; i < n; j++) { 82449b5e25fSSatish Balay row = idx[i]; 825a5b23f4aSJose E. Roman if (row % bs != 0) { /* Not the beginning of a block */ 82649b5e25fSSatish Balay sizes[j] = 1; 82749b5e25fSSatish Balay i++; 82849b5e25fSSatish Balay } else if (i + bs > n) { /* Beginning of a block, but complete block doesn't exist (at idx end) */ 82949b5e25fSSatish Balay sizes[j] = 1; /* Also makes sure at least 'bs' values exist for next else */ 83049b5e25fSSatish Balay i++; 8316aad120cSJose E. Roman } else { /* Beginning of the block, so check if the complete block exists */ 83249b5e25fSSatish Balay flg = PETSC_TRUE; 83349b5e25fSSatish Balay for (k = 1; k < bs; k++) { 83449b5e25fSSatish Balay if (row + k != idx[i + k]) { /* break in the block */ 83549b5e25fSSatish Balay flg = PETSC_FALSE; 83649b5e25fSSatish Balay break; 83749b5e25fSSatish Balay } 83849b5e25fSSatish Balay } 839abc0a331SBarry Smith if (flg) { /* No break in the bs */ 84049b5e25fSSatish Balay sizes[j] = bs; 84149b5e25fSSatish Balay i += bs; 84249b5e25fSSatish Balay } else { 84349b5e25fSSatish Balay sizes[j] = 1; 84449b5e25fSSatish Balay i++; 84549b5e25fSSatish Balay } 84649b5e25fSSatish Balay } 84749b5e25fSSatish Balay } 84849b5e25fSSatish Balay *bs_max = j; 8493ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 85049b5e25fSSatish Balay } 85149b5e25fSSatish Balay 85249b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks). 853da81f932SPierre Jolivet Any a(i,j) with i>j input by user is ignored. 85449b5e25fSSatish Balay */ 85549b5e25fSSatish Balay 856d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is) 857d71ae5a4SJacob Faibussowitsch { 85849b5e25fSSatish Balay Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 859e2ee6c50SBarry Smith PetscInt *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N, lastcol = -1; 86013f74950SBarry Smith PetscInt *imax = a->imax, *ai = a->i, *ailen = a->ilen, roworiented = a->roworiented; 861d0f46423SBarry Smith PetscInt *aj = a->j, nonew = a->nonew, bs = A->rmap->bs, brow, bcol; 86213f74950SBarry Smith PetscInt ridx, cidx, bs2 = a->bs2; 86349b5e25fSSatish Balay MatScalar *ap, value, *aa = a->a, *bap; 86449b5e25fSSatish Balay 86549b5e25fSSatish Balay PetscFunctionBegin; 86649b5e25fSSatish Balay for (k = 0; k < m; k++) { /* loop over added rows */ 86749b5e25fSSatish Balay row = im[k]; /* row number */ 86849b5e25fSSatish Balay brow = row / bs; /* block row number */ 86949b5e25fSSatish Balay if (row < 0) continue; 8706bdcaf15SBarry Smith PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1); 87149b5e25fSSatish Balay rp = aj + ai[brow]; /*ptr to beginning of column value of the row block*/ 87249b5e25fSSatish Balay ap = aa + bs2 * ai[brow]; /*ptr to beginning of element value of the row block*/ 87349b5e25fSSatish Balay rmax = imax[brow]; /* maximum space allocated for this row */ 87449b5e25fSSatish Balay nrow = ailen[brow]; /* actual length of this row */ 87549b5e25fSSatish Balay low = 0; 8768509e838SStefano Zampini high = nrow; 87749b5e25fSSatish Balay for (l = 0; l < n; l++) { /* loop over added columns */ 87849b5e25fSSatish Balay if (in[l] < 0) continue; 8796bdcaf15SBarry Smith PetscCheck(in[l] < A->cmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->N - 1); 88049b5e25fSSatish Balay col = in[l]; 88149b5e25fSSatish Balay bcol = col / bs; /* block col number */ 88249b5e25fSSatish Balay 883941593c8SHong Zhang if (brow > bcol) { 88426fbe8dcSKarl Rupp if (a->ignore_ltriangular) continue; /* ignore lower triangular values */ 88526fbe8dcSKarl Rupp else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)"); 886941593c8SHong Zhang } 887f4989cb3SHong Zhang 8889371c9d4SSatish Balay ridx = row % bs; 8899371c9d4SSatish Balay cidx = col % bs; /*row and col index inside the block */ 8908549e402SHong Zhang if ((brow == bcol && ridx <= cidx) || (brow < bcol)) { 89149b5e25fSSatish Balay /* element value a(k,l) */ 89226fbe8dcSKarl Rupp if (roworiented) value = v[l + k * n]; 89326fbe8dcSKarl Rupp else value = v[k + l * m]; 89449b5e25fSSatish Balay 89549b5e25fSSatish Balay /* move pointer bap to a(k,l) quickly and add/insert value */ 89626fbe8dcSKarl Rupp if (col <= lastcol) low = 0; 8978509e838SStefano Zampini else high = nrow; 8988509e838SStefano Zampini 899e2ee6c50SBarry Smith lastcol = col; 90049b5e25fSSatish Balay while (high - low > 7) { 90149b5e25fSSatish Balay t = (low + high) / 2; 90249b5e25fSSatish Balay if (rp[t] > bcol) high = t; 90349b5e25fSSatish Balay else low = t; 90449b5e25fSSatish Balay } 90549b5e25fSSatish Balay for (i = low; i < high; i++) { 90649b5e25fSSatish Balay if (rp[i] > bcol) break; 90749b5e25fSSatish Balay if (rp[i] == bcol) { 90849b5e25fSSatish Balay bap = ap + bs2 * i + bs * cidx + ridx; 90949b5e25fSSatish Balay if (is == ADD_VALUES) *bap += value; 91049b5e25fSSatish Balay else *bap = value; 9118549e402SHong Zhang /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 9128549e402SHong Zhang if (brow == bcol && ridx < cidx) { 9138549e402SHong Zhang bap = ap + bs2 * i + bs * ridx + cidx; 9148549e402SHong Zhang if (is == ADD_VALUES) *bap += value; 9158549e402SHong Zhang else *bap = value; 9168549e402SHong Zhang } 91749b5e25fSSatish Balay goto noinsert1; 91849b5e25fSSatish Balay } 91949b5e25fSSatish Balay } 92049b5e25fSSatish Balay 92149b5e25fSSatish Balay if (nonew == 1) goto noinsert1; 92208401ef6SPierre Jolivet PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col); 923fef13f97SBarry Smith MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, brow, bcol, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar); 92449b5e25fSSatish Balay 9259371c9d4SSatish Balay N = nrow++ - 1; 9269371c9d4SSatish Balay high++; 92749b5e25fSSatish Balay /* shift up all the later entries in this row */ 9289566063dSJacob Faibussowitsch PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1)); 9299566063dSJacob Faibussowitsch PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1))); 9309566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(ap + bs2 * i, bs2)); 93149b5e25fSSatish Balay rp[i] = bcol; 93249b5e25fSSatish Balay ap[bs2 * i + bs * cidx + ridx] = value; 9338509e838SStefano Zampini /* for diag block, add/insert its symmetric element a(cidx,ridx) */ 934ad540459SPierre Jolivet if (brow == bcol && ridx < cidx) ap[bs2 * i + bs * ridx + cidx] = value; 935e56f5c9eSBarry Smith A->nonzerostate++; 93649b5e25fSSatish Balay noinsert1:; 93749b5e25fSSatish Balay low = i; 9388549e402SHong Zhang } 93949b5e25fSSatish Balay } /* end of loop over added columns */ 94049b5e25fSSatish Balay ailen[brow] = nrow; 94149b5e25fSSatish Balay } /* end of loop over added rows */ 9423ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 94349b5e25fSSatish Balay } 94449b5e25fSSatish Balay 945d71ae5a4SJacob Faibussowitsch PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA, IS row, const MatFactorInfo *info) 946d71ae5a4SJacob Faibussowitsch { 9474ccecd49SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)inA->data; 94849b5e25fSSatish Balay Mat outA; 949ace3abfcSBarry Smith PetscBool row_identity; 95049b5e25fSSatish Balay 95149b5e25fSSatish Balay PetscFunctionBegin; 95208401ef6SPierre Jolivet PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 is supported for in-place icc"); 9539566063dSJacob Faibussowitsch PetscCall(ISIdentity(row, &row_identity)); 95428b400f6SJacob Faibussowitsch PetscCheck(row_identity, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix reordering is not supported"); 95508401ef6SPierre Jolivet PetscCheck(inA->rmap->bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix block size %" PetscInt_FMT " is not supported", inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! */ 956c84f5b01SHong Zhang 95749b5e25fSSatish Balay outA = inA; 958d5f3da31SBarry Smith inA->factortype = MAT_FACTOR_ICC; 9599566063dSJacob Faibussowitsch PetscCall(PetscFree(inA->solvertype)); 9609566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype)); 96149b5e25fSSatish Balay 9629566063dSJacob Faibussowitsch PetscCall(MatMarkDiagonal_SeqSBAIJ(inA)); 9639566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetNumericFactorization_inplace(inA, row_identity)); 96449b5e25fSSatish Balay 9659566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 9669566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->row)); 967c84f5b01SHong Zhang a->row = row; 9689566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)row)); 9699566063dSJacob Faibussowitsch PetscCall(ISDestroy(&a->col)); 970c84f5b01SHong Zhang a->col = row; 971c84f5b01SHong Zhang 972c84f5b01SHong Zhang /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */ 9739566063dSJacob Faibussowitsch if (a->icol) PetscCall(ISInvertPermutation(row, PETSC_DECIDE, &a->icol)); 97449b5e25fSSatish Balay 975aa624791SPierre Jolivet if (!a->solve_work) PetscCall(PetscMalloc1(inA->rmap->N + inA->rmap->bs, &a->solve_work)); 97649b5e25fSSatish Balay 9779566063dSJacob Faibussowitsch PetscCall(MatCholeskyFactorNumeric(outA, inA, info)); 9783ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 97949b5e25fSSatish Balay } 980950f1e5bSHong Zhang 981d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat, PetscInt *indices) 982d71ae5a4SJacob Faibussowitsch { 983045c9aa0SHong Zhang Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)mat->data; 98413f74950SBarry Smith PetscInt i, nz, n; 98549b5e25fSSatish Balay 98649b5e25fSSatish Balay PetscFunctionBegin; 9876c6c5352SBarry Smith nz = baij->maxnz; 988d0f46423SBarry Smith n = mat->cmap->n; 98926fbe8dcSKarl Rupp for (i = 0; i < nz; i++) baij->j[i] = indices[i]; 99026fbe8dcSKarl Rupp 9916c6c5352SBarry Smith baij->nz = nz; 99226fbe8dcSKarl Rupp for (i = 0; i < n; i++) baij->ilen[i] = baij->imax[i]; 99326fbe8dcSKarl Rupp 9949566063dSJacob Faibussowitsch PetscCall(MatSetOption(mat, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 9953ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 99649b5e25fSSatish Balay } 99749b5e25fSSatish Balay 99849b5e25fSSatish Balay /*@ 99919585528SSatish Balay MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows 100011a5261eSBarry Smith in a `MATSEQSBAIJ` matrix. 100149b5e25fSSatish Balay 100249b5e25fSSatish Balay Input Parameters: 100311a5261eSBarry Smith + mat - the `MATSEQSBAIJ` matrix 100449b5e25fSSatish Balay - indices - the column indices 100549b5e25fSSatish Balay 100649b5e25fSSatish Balay Level: advanced 100749b5e25fSSatish Balay 100849b5e25fSSatish Balay Notes: 100949b5e25fSSatish Balay This can be called if you have precomputed the nonzero structure of the 101049b5e25fSSatish Balay matrix and want to provide it to the matrix object to improve the performance 101111a5261eSBarry Smith of the `MatSetValues()` operation. 101249b5e25fSSatish Balay 101349b5e25fSSatish Balay You MUST have set the correct numbers of nonzeros per row in the call to 101411a5261eSBarry Smith `MatCreateSeqSBAIJ()`, and the columns indices MUST be sorted. 101549b5e25fSSatish Balay 10162ef1f0ffSBarry Smith MUST be called before any calls to `MatSetValues()` 101749b5e25fSSatish Balay 10181cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ` 101949b5e25fSSatish Balay @*/ 1020d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat, PetscInt *indices) 1021d71ae5a4SJacob Faibussowitsch { 102249b5e25fSSatish Balay PetscFunctionBegin; 10230700a824SBarry Smith PetscValidHeaderSpecific(mat, MAT_CLASSID, 1); 1024dadcf809SJacob Faibussowitsch PetscValidIntPointer(indices, 2); 1025cac4c232SBarry Smith PetscUseMethod(mat, "MatSeqSBAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices)); 10263ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 102749b5e25fSSatish Balay } 102849b5e25fSSatish Balay 1029d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqSBAIJ(Mat A, Mat B, MatStructure str) 1030d71ae5a4SJacob Faibussowitsch { 10314c7a3774SStefano Zampini PetscBool isbaij; 10323c896bc6SHong Zhang 10333c896bc6SHong Zhang PetscFunctionBegin; 10349566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &isbaij, MATSEQSBAIJ, MATMPISBAIJ, "")); 103528b400f6SJacob Faibussowitsch PetscCheck(isbaij, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Not for matrix type %s", ((PetscObject)B)->type_name); 10364c7a3774SStefano Zampini /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. */ 10374c7a3774SStefano Zampini if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) { 10383c896bc6SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 10393c896bc6SHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 10403c896bc6SHong Zhang 104108401ef6SPierre Jolivet PetscCheck(a->i[a->mbs] == b->i[b->mbs], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different"); 104208401ef6SPierre Jolivet PetscCheck(a->mbs == b->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of rows in two matrices are different"); 104308401ef6SPierre Jolivet PetscCheck(a->bs2 == b->bs2, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different block size"); 10449566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(b->a, a->a, a->bs2 * a->i[a->mbs])); 10459566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)B)); 10463c896bc6SHong Zhang } else { 10479566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(A)); 10489566063dSJacob Faibussowitsch PetscCall(MatCopy_Basic(A, B, str)); 10499566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(A)); 10503c896bc6SHong Zhang } 10513ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 10523c896bc6SHong Zhang } 10533c896bc6SHong Zhang 1054d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1055d71ae5a4SJacob Faibussowitsch { 1056a6ece127SHong Zhang Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 10575fd66863SKarl Rupp 1058a6ece127SHong Zhang PetscFunctionBegin; 1059a6ece127SHong Zhang *array = a->a; 10603ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1061a6ece127SHong Zhang } 1062a6ece127SHong Zhang 1063d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A, PetscScalar *array[]) 1064d71ae5a4SJacob Faibussowitsch { 1065a6ece127SHong Zhang PetscFunctionBegin; 1066cda14afcSprj- *array = NULL; 10673ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1068a6ece127SHong Zhang } 1069a6ece127SHong Zhang 1070d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y, Mat X, PetscInt *nnz) 1071d71ae5a4SJacob Faibussowitsch { 1072b264fe52SHong Zhang PetscInt bs = Y->rmap->bs, mbs = Y->rmap->N / bs; 107352768537SHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data; 107452768537SHong Zhang Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ *)Y->data; 107552768537SHong Zhang 107652768537SHong Zhang PetscFunctionBegin; 107752768537SHong Zhang /* Set the number of nonzeros in the new matrix */ 10789566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqX_private(mbs, x->i, x->j, y->i, y->j, nnz)); 10793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 108052768537SHong Zhang } 108152768537SHong Zhang 1082d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str) 1083d71ae5a4SJacob Faibussowitsch { 108442ee4b1aSHong Zhang Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data, *y = (Mat_SeqSBAIJ *)Y->data; 108531ce2d13SHong Zhang PetscInt bs = Y->rmap->bs, bs2 = bs * bs; 1086e838b9e7SJed Brown PetscBLASInt one = 1; 108742ee4b1aSHong Zhang 108842ee4b1aSHong Zhang PetscFunctionBegin; 1089134adf20SPierre Jolivet if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) { 1090134adf20SPierre Jolivet PetscBool e = x->nz == y->nz && x->mbs == y->mbs ? PETSC_TRUE : PETSC_FALSE; 1091134adf20SPierre Jolivet if (e) { 10929566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->i, y->i, x->mbs + 1, &e)); 1093134adf20SPierre Jolivet if (e) { 10949566063dSJacob Faibussowitsch PetscCall(PetscArraycmp(x->j, y->j, x->i[x->mbs], &e)); 1095134adf20SPierre Jolivet if (e) str = SAME_NONZERO_PATTERN; 1096134adf20SPierre Jolivet } 1097134adf20SPierre Jolivet } 109854c59aa7SJacob Faibussowitsch if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN"); 1099134adf20SPierre Jolivet } 110042ee4b1aSHong Zhang if (str == SAME_NONZERO_PATTERN) { 1101f4df32b1SMatthew Knepley PetscScalar alpha = a; 1102c5df96a5SBarry Smith PetscBLASInt bnz; 11039566063dSJacob Faibussowitsch PetscCall(PetscBLASIntCast(x->nz * bs2, &bnz)); 1104792fecdfSBarry Smith PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, x->a, &one, y->a, &one)); 11059566063dSJacob Faibussowitsch PetscCall(PetscObjectStateIncrease((PetscObject)Y)); 1106ab784542SHong Zhang } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */ 11079566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_TRUE)); 11089566063dSJacob Faibussowitsch PetscCall(MatAXPY_Basic(Y, a, X, str)); 11099566063dSJacob Faibussowitsch PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_FALSE)); 111042ee4b1aSHong Zhang } else { 111152768537SHong Zhang Mat B; 111252768537SHong Zhang PetscInt *nnz; 111354c59aa7SJacob Faibussowitsch PetscCheck(bs == X->rmap->bs, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Matrices must have same block size"); 11149566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(X)); 11159566063dSJacob Faibussowitsch PetscCall(MatGetRowUpperTriangular(Y)); 11169566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(Y->rmap->N, &nnz)); 11179566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B)); 11189566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name)); 11199566063dSJacob Faibussowitsch PetscCall(MatSetSizes(B, Y->rmap->n, Y->cmap->n, Y->rmap->N, Y->cmap->N)); 11209566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(B, Y, Y)); 11219566063dSJacob Faibussowitsch PetscCall(MatSetType(B, ((PetscObject)Y)->type_name)); 11229566063dSJacob Faibussowitsch PetscCall(MatAXPYGetPreallocation_SeqSBAIJ(Y, X, nnz)); 11239566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 112452768537SHong Zhang 11259566063dSJacob Faibussowitsch PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str)); 112652768537SHong Zhang 11279566063dSJacob Faibussowitsch PetscCall(MatHeaderMerge(Y, &B)); 11289566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 11299566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(X)); 11309566063dSJacob Faibussowitsch PetscCall(MatRestoreRowUpperTriangular(Y)); 113142ee4b1aSHong Zhang } 11323ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 113342ee4b1aSHong Zhang } 113442ee4b1aSHong Zhang 1135d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1136d71ae5a4SJacob Faibussowitsch { 1137efcf0fc3SBarry Smith PetscFunctionBegin; 1138efcf0fc3SBarry Smith *flg = PETSC_TRUE; 11393ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1140efcf0fc3SBarry Smith } 1141efcf0fc3SBarry Smith 1142d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A, PetscBool *flg) 1143d71ae5a4SJacob Faibussowitsch { 1144efcf0fc3SBarry Smith PetscFunctionBegin; 1145efcf0fc3SBarry Smith *flg = PETSC_TRUE; 11463ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1147efcf0fc3SBarry Smith } 1148efcf0fc3SBarry Smith 1149d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg) 1150d71ae5a4SJacob Faibussowitsch { 1151efcf0fc3SBarry Smith PetscFunctionBegin; 1152efcf0fc3SBarry Smith *flg = PETSC_FALSE; 11533ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1154efcf0fc3SBarry Smith } 1155efcf0fc3SBarry Smith 1156d71ae5a4SJacob Faibussowitsch PetscErrorCode MatConjugate_SeqSBAIJ(Mat A) 1157d71ae5a4SJacob Faibussowitsch { 11582726fb6dSPierre Jolivet #if defined(PETSC_USE_COMPLEX) 11592726fb6dSPierre Jolivet Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 11602726fb6dSPierre Jolivet PetscInt i, nz = a->bs2 * a->i[a->mbs]; 11612726fb6dSPierre Jolivet MatScalar *aa = a->a; 11622726fb6dSPierre Jolivet 11632726fb6dSPierre Jolivet PetscFunctionBegin; 11642726fb6dSPierre Jolivet for (i = 0; i < nz; i++) aa[i] = PetscConj(aa[i]); 11652726fb6dSPierre Jolivet #else 11662726fb6dSPierre Jolivet PetscFunctionBegin; 11672726fb6dSPierre Jolivet #endif 11683ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 11692726fb6dSPierre Jolivet } 11702726fb6dSPierre Jolivet 1171d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqSBAIJ(Mat A) 1172d71ae5a4SJacob Faibussowitsch { 117399cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 117499cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1175dd6ea824SBarry Smith MatScalar *aa = a->a; 117699cafbc1SBarry Smith 117799cafbc1SBarry Smith PetscFunctionBegin; 117899cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]); 11793ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 118099cafbc1SBarry Smith } 118199cafbc1SBarry Smith 1182d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A) 1183d71ae5a4SJacob Faibussowitsch { 118499cafbc1SBarry Smith Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data; 118599cafbc1SBarry Smith PetscInt i, nz = a->bs2 * a->i[a->mbs]; 1186dd6ea824SBarry Smith MatScalar *aa = a->a; 118799cafbc1SBarry Smith 118899cafbc1SBarry Smith PetscFunctionBegin; 118999cafbc1SBarry Smith for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]); 11903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 119199cafbc1SBarry Smith } 119299cafbc1SBarry Smith 1193d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A, PetscInt is_n, const PetscInt is_idx[], PetscScalar diag, Vec x, Vec b) 1194d71ae5a4SJacob Faibussowitsch { 11953bededecSBarry Smith Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)A->data; 11963bededecSBarry Smith PetscInt i, j, k, count; 11973bededecSBarry Smith PetscInt bs = A->rmap->bs, bs2 = baij->bs2, row, col; 11983bededecSBarry Smith PetscScalar zero = 0.0; 11993bededecSBarry Smith MatScalar *aa; 12003bededecSBarry Smith const PetscScalar *xx; 12013bededecSBarry Smith PetscScalar *bb; 120256777dd2SBarry Smith PetscBool *zeroed, vecs = PETSC_FALSE; 12033bededecSBarry Smith 12043bededecSBarry Smith PetscFunctionBegin; 12053bededecSBarry Smith /* fix right hand side if needed */ 12063bededecSBarry Smith if (x && b) { 12079566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(x, &xx)); 12089566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &bb)); 120956777dd2SBarry Smith vecs = PETSC_TRUE; 12103bededecSBarry Smith } 12113bededecSBarry Smith 12123bededecSBarry Smith /* zero the columns */ 12139566063dSJacob Faibussowitsch PetscCall(PetscCalloc1(A->rmap->n, &zeroed)); 12143bededecSBarry Smith for (i = 0; i < is_n; i++) { 1215aed4548fSBarry Smith PetscCheck(is_idx[i] >= 0 && is_idx[i] < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", is_idx[i]); 12163bededecSBarry Smith zeroed[is_idx[i]] = PETSC_TRUE; 12173bededecSBarry Smith } 121856777dd2SBarry Smith if (vecs) { 121956777dd2SBarry Smith for (i = 0; i < A->rmap->N; i++) { 122056777dd2SBarry Smith row = i / bs; 122156777dd2SBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 122256777dd2SBarry Smith for (k = 0; k < bs; k++) { 122356777dd2SBarry Smith col = bs * baij->j[j] + k; 122456777dd2SBarry Smith if (col <= i) continue; 122556777dd2SBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 122626fbe8dcSKarl Rupp if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0] * xx[col]; 122726fbe8dcSKarl Rupp if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0] * xx[i]; 122856777dd2SBarry Smith } 122956777dd2SBarry Smith } 123056777dd2SBarry Smith } 123126fbe8dcSKarl Rupp for (i = 0; i < is_n; i++) bb[is_idx[i]] = diag * xx[is_idx[i]]; 123256777dd2SBarry Smith } 123356777dd2SBarry Smith 12343bededecSBarry Smith for (i = 0; i < A->rmap->N; i++) { 12353bededecSBarry Smith if (!zeroed[i]) { 12363bededecSBarry Smith row = i / bs; 12373bededecSBarry Smith for (j = baij->i[row]; j < baij->i[row + 1]; j++) { 12383bededecSBarry Smith for (k = 0; k < bs; k++) { 12393bededecSBarry Smith col = bs * baij->j[j] + k; 12403bededecSBarry Smith if (zeroed[col]) { 12413bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k; 12423bededecSBarry Smith aa[0] = 0.0; 12433bededecSBarry Smith } 12443bededecSBarry Smith } 12453bededecSBarry Smith } 12463bededecSBarry Smith } 12473bededecSBarry Smith } 12489566063dSJacob Faibussowitsch PetscCall(PetscFree(zeroed)); 124956777dd2SBarry Smith if (vecs) { 12509566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(x, &xx)); 12519566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &bb)); 125256777dd2SBarry Smith } 12533bededecSBarry Smith 12543bededecSBarry Smith /* zero the rows */ 12553bededecSBarry Smith for (i = 0; i < is_n; i++) { 12563bededecSBarry Smith row = is_idx[i]; 12573bededecSBarry Smith count = (baij->i[row / bs + 1] - baij->i[row / bs]) * bs; 12583bededecSBarry Smith aa = ((MatScalar *)(baij->a)) + baij->i[row / bs] * bs2 + (row % bs); 12593bededecSBarry Smith for (k = 0; k < count; k++) { 12603bededecSBarry Smith aa[0] = zero; 12613bededecSBarry Smith aa += bs; 12623bededecSBarry Smith } 1263dbbe0bcdSBarry Smith if (diag != 0.0) PetscUseTypeMethod(A, setvalues, 1, &row, 1, &row, &diag, INSERT_VALUES); 12643bededecSBarry Smith } 12659566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd_SeqSBAIJ(A, MAT_FINAL_ASSEMBLY)); 12663ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12673bededecSBarry Smith } 12683bededecSBarry Smith 1269d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqSBAIJ(Mat Y, PetscScalar a) 1270d71ae5a4SJacob Faibussowitsch { 12717d68702bSBarry Smith Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)Y->data; 12727d68702bSBarry Smith 12737d68702bSBarry Smith PetscFunctionBegin; 127448a46eb9SPierre Jolivet if (!Y->preallocated || !aij->nz) PetscCall(MatSeqSBAIJSetPreallocation(Y, Y->rmap->bs, 1, NULL)); 12759566063dSJacob Faibussowitsch PetscCall(MatShift_Basic(Y, a)); 12763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 12777d68702bSBarry Smith } 12787d68702bSBarry Smith 12793964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ, 128049b5e25fSSatish Balay MatGetRow_SeqSBAIJ, 128149b5e25fSSatish Balay MatRestoreRow_SeqSBAIJ, 128249b5e25fSSatish Balay MatMult_SeqSBAIJ_N, 128397304618SKris Buschelman /* 4*/ MatMultAdd_SeqSBAIJ_N, 1284431c96f7SBarry Smith MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */ 1285e005ede5SBarry Smith MatMultAdd_SeqSBAIJ_N, 1286f4259b30SLisandro Dalcin NULL, 1287f4259b30SLisandro Dalcin NULL, 1288f4259b30SLisandro Dalcin NULL, 1289f4259b30SLisandro Dalcin /* 10*/ NULL, 1290f4259b30SLisandro Dalcin NULL, 1291c078aec8SLisandro Dalcin MatCholeskyFactor_SeqSBAIJ, 129241f059aeSBarry Smith MatSOR_SeqSBAIJ, 129349b5e25fSSatish Balay MatTranspose_SeqSBAIJ, 129497304618SKris Buschelman /* 15*/ MatGetInfo_SeqSBAIJ, 129549b5e25fSSatish Balay MatEqual_SeqSBAIJ, 129649b5e25fSSatish Balay MatGetDiagonal_SeqSBAIJ, 129749b5e25fSSatish Balay MatDiagonalScale_SeqSBAIJ, 129849b5e25fSSatish Balay MatNorm_SeqSBAIJ, 1299f4259b30SLisandro Dalcin /* 20*/ NULL, 130049b5e25fSSatish Balay MatAssemblyEnd_SeqSBAIJ, 130149b5e25fSSatish Balay MatSetOption_SeqSBAIJ, 130249b5e25fSSatish Balay MatZeroEntries_SeqSBAIJ, 1303f4259b30SLisandro Dalcin /* 24*/ NULL, 1304f4259b30SLisandro Dalcin NULL, 1305f4259b30SLisandro Dalcin NULL, 1306f4259b30SLisandro Dalcin NULL, 1307f4259b30SLisandro Dalcin NULL, 130826cec326SBarry Smith /* 29*/ MatSetUp_Seq_Hash, 1309f4259b30SLisandro Dalcin NULL, 1310f4259b30SLisandro Dalcin NULL, 1311f4259b30SLisandro Dalcin NULL, 1312f4259b30SLisandro Dalcin NULL, 1313d519adbfSMatthew Knepley /* 34*/ MatDuplicate_SeqSBAIJ, 1314f4259b30SLisandro Dalcin NULL, 1315f4259b30SLisandro Dalcin NULL, 1316f4259b30SLisandro Dalcin NULL, 1317c84f5b01SHong Zhang MatICCFactor_SeqSBAIJ, 1318d519adbfSMatthew Knepley /* 39*/ MatAXPY_SeqSBAIJ, 13197dae84e0SHong Zhang MatCreateSubMatrices_SeqSBAIJ, 132049b5e25fSSatish Balay MatIncreaseOverlap_SeqSBAIJ, 132149b5e25fSSatish Balay MatGetValues_SeqSBAIJ, 13223c896bc6SHong Zhang MatCopy_SeqSBAIJ, 1323f4259b30SLisandro Dalcin /* 44*/ NULL, 132449b5e25fSSatish Balay MatScale_SeqSBAIJ, 13257d68702bSBarry Smith MatShift_SeqSBAIJ, 1326f4259b30SLisandro Dalcin NULL, 13273bededecSBarry Smith MatZeroRowsColumns_SeqSBAIJ, 1328f4259b30SLisandro Dalcin /* 49*/ NULL, 132949b5e25fSSatish Balay MatGetRowIJ_SeqSBAIJ, 133049b5e25fSSatish Balay MatRestoreRowIJ_SeqSBAIJ, 1331f4259b30SLisandro Dalcin NULL, 1332f4259b30SLisandro Dalcin NULL, 1333f4259b30SLisandro Dalcin /* 54*/ NULL, 1334f4259b30SLisandro Dalcin NULL, 1335f4259b30SLisandro Dalcin NULL, 1336dc29a518SPierre Jolivet MatPermute_SeqSBAIJ, 133749b5e25fSSatish Balay MatSetValuesBlocked_SeqSBAIJ, 13387dae84e0SHong Zhang /* 59*/ MatCreateSubMatrix_SeqSBAIJ, 1339f4259b30SLisandro Dalcin NULL, 1340f4259b30SLisandro Dalcin NULL, 1341f4259b30SLisandro Dalcin NULL, 1342f4259b30SLisandro Dalcin NULL, 1343f4259b30SLisandro Dalcin /* 64*/ NULL, 1344f4259b30SLisandro Dalcin NULL, 1345f4259b30SLisandro Dalcin NULL, 1346f4259b30SLisandro Dalcin NULL, 1347f4259b30SLisandro Dalcin NULL, 1348d519adbfSMatthew Knepley /* 69*/ MatGetRowMaxAbs_SeqSBAIJ, 1349f4259b30SLisandro Dalcin NULL, 135028d58a37SPierre Jolivet MatConvert_MPISBAIJ_Basic, 1351f4259b30SLisandro Dalcin NULL, 1352f4259b30SLisandro Dalcin NULL, 1353f4259b30SLisandro Dalcin /* 74*/ NULL, 1354f4259b30SLisandro Dalcin NULL, 1355f4259b30SLisandro Dalcin NULL, 1356f4259b30SLisandro Dalcin NULL, 1357f4259b30SLisandro Dalcin NULL, 1358f4259b30SLisandro Dalcin /* 79*/ NULL, 1359f4259b30SLisandro Dalcin NULL, 1360f4259b30SLisandro Dalcin NULL, 136197304618SKris Buschelman MatGetInertia_SeqSBAIJ, 13625bba2384SShri Abhyankar MatLoad_SeqSBAIJ, 1363d519adbfSMatthew Knepley /* 84*/ MatIsSymmetric_SeqSBAIJ, 1364865e5f61SKris Buschelman MatIsHermitian_SeqSBAIJ, 1365efcf0fc3SBarry Smith MatIsStructurallySymmetric_SeqSBAIJ, 1366f4259b30SLisandro Dalcin NULL, 1367f4259b30SLisandro Dalcin NULL, 1368f4259b30SLisandro Dalcin /* 89*/ NULL, 1369f4259b30SLisandro Dalcin NULL, 1370f4259b30SLisandro Dalcin NULL, 1371f4259b30SLisandro Dalcin NULL, 1372f4259b30SLisandro Dalcin NULL, 1373f4259b30SLisandro Dalcin /* 94*/ NULL, 1374f4259b30SLisandro Dalcin NULL, 1375f4259b30SLisandro Dalcin NULL, 1376f4259b30SLisandro Dalcin NULL, 1377f4259b30SLisandro Dalcin NULL, 1378f4259b30SLisandro Dalcin /* 99*/ NULL, 1379f4259b30SLisandro Dalcin NULL, 1380f4259b30SLisandro Dalcin NULL, 13812726fb6dSPierre Jolivet MatConjugate_SeqSBAIJ, 1382f4259b30SLisandro Dalcin NULL, 1383f4259b30SLisandro Dalcin /*104*/ NULL, 138499cafbc1SBarry Smith MatRealPart_SeqSBAIJ, 1385f5edf698SHong Zhang MatImaginaryPart_SeqSBAIJ, 1386f5edf698SHong Zhang MatGetRowUpperTriangular_SeqSBAIJ, 13872af78befSBarry Smith MatRestoreRowUpperTriangular_SeqSBAIJ, 1388f4259b30SLisandro Dalcin /*109*/ NULL, 1389f4259b30SLisandro Dalcin NULL, 1390f4259b30SLisandro Dalcin NULL, 1391f4259b30SLisandro Dalcin NULL, 1392547795f9SHong Zhang MatMissingDiagonal_SeqSBAIJ, 1393f4259b30SLisandro Dalcin /*114*/ NULL, 1394f4259b30SLisandro Dalcin NULL, 1395f4259b30SLisandro Dalcin NULL, 1396f4259b30SLisandro Dalcin NULL, 1397f4259b30SLisandro Dalcin NULL, 1398f4259b30SLisandro Dalcin /*119*/ NULL, 1399f4259b30SLisandro Dalcin NULL, 1400f4259b30SLisandro Dalcin NULL, 1401f4259b30SLisandro Dalcin NULL, 1402f4259b30SLisandro Dalcin NULL, 1403f4259b30SLisandro Dalcin /*124*/ NULL, 1404f4259b30SLisandro Dalcin NULL, 1405f4259b30SLisandro Dalcin NULL, 1406f4259b30SLisandro Dalcin NULL, 1407f4259b30SLisandro Dalcin NULL, 1408f4259b30SLisandro Dalcin /*129*/ NULL, 1409f4259b30SLisandro Dalcin NULL, 1410f4259b30SLisandro Dalcin NULL, 1411f4259b30SLisandro Dalcin NULL, 1412f4259b30SLisandro Dalcin NULL, 1413f4259b30SLisandro Dalcin /*134*/ NULL, 1414f4259b30SLisandro Dalcin NULL, 1415f4259b30SLisandro Dalcin NULL, 1416f4259b30SLisandro Dalcin NULL, 1417f4259b30SLisandro Dalcin NULL, 141846533700Sstefano_zampini /*139*/ MatSetBlockSizes_Default, 1419f4259b30SLisandro Dalcin NULL, 1420f4259b30SLisandro Dalcin NULL, 1421f4259b30SLisandro Dalcin NULL, 1422f4259b30SLisandro Dalcin NULL, 1423d70f29a3SPierre Jolivet /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ, 1424d70f29a3SPierre Jolivet NULL, 1425d70f29a3SPierre Jolivet NULL, 142699a7f59eSMark Adams NULL, 142799a7f59eSMark Adams NULL, 14287fb60732SBarry Smith NULL, 1429dec0b466SHong Zhang /*150*/ NULL, 1430dec0b466SHong Zhang NULL}; 1431be1d678aSKris Buschelman 1432d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat) 1433d71ae5a4SJacob Faibussowitsch { 14344afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1435d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 143649b5e25fSSatish Balay 143749b5e25fSSatish Balay PetscFunctionBegin; 143808401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 143949b5e25fSSatish Balay 144049b5e25fSSatish Balay /* allocate space for values if not already there */ 144148a46eb9SPierre Jolivet if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); 144249b5e25fSSatish Balay 144349b5e25fSSatish Balay /* copy values over */ 14449566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz)); 14453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 144649b5e25fSSatish Balay } 144749b5e25fSSatish Balay 1448d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat) 1449d71ae5a4SJacob Faibussowitsch { 14504afc71dfSHong Zhang Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data; 1451d0f46423SBarry Smith PetscInt nz = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2; 145249b5e25fSSatish Balay 145349b5e25fSSatish Balay PetscFunctionBegin; 145408401ef6SPierre Jolivet PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first"); 145528b400f6SJacob Faibussowitsch PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first"); 145649b5e25fSSatish Balay 145749b5e25fSSatish Balay /* copy values over */ 14589566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz)); 14593ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 146049b5e25fSSatish Balay } 146149b5e25fSSatish Balay 1462d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B, PetscInt bs, PetscInt nz, PetscInt *nnz) 1463d71ae5a4SJacob Faibussowitsch { 1464c464158bSHong Zhang Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data; 14654dcd73b1SHong Zhang PetscInt i, mbs, nbs, bs2; 14662576faa2SJed Brown PetscBool skipallocation = PETSC_FALSE, flg = PETSC_FALSE, realalloc = PETSC_FALSE; 146749b5e25fSSatish Balay 1468b4e2f619SBarry Smith PetscFunctionBegin; 1469ad79cf63SBarry Smith if (B->hash_active) { 1470ad79cf63SBarry Smith PetscInt bs; 1471aea10558SJacob Faibussowitsch B->ops[0] = b->cops; 1472ad79cf63SBarry Smith PetscCall(PetscHMapIJVDestroy(&b->ht)); 1473ad79cf63SBarry Smith PetscCall(MatGetBlockSize(B, &bs)); 1474ad79cf63SBarry Smith if (bs > 1) PetscCall(PetscHSetIJDestroy(&b->bht)); 1475ad79cf63SBarry Smith PetscCall(PetscFree(b->dnz)); 1476ad79cf63SBarry Smith PetscCall(PetscFree(b->bdnz)); 1477ad79cf63SBarry Smith B->hash_active = PETSC_FALSE; 1478ad79cf63SBarry Smith } 14792576faa2SJed Brown if (nz >= 0 || nnz) realalloc = PETSC_TRUE; 1480db4efbfdSBarry Smith 14819566063dSJacob Faibussowitsch PetscCall(MatSetBlockSize(B, PetscAbs(bs))); 14829566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 14839566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 148408401ef6SPierre Jolivet PetscCheck(B->rmap->N <= B->cmap->N, PETSC_COMM_SELF, PETSC_ERR_SUP, "SEQSBAIJ matrix cannot have more rows %" PetscInt_FMT " than columns %" PetscInt_FMT, B->rmap->N, B->cmap->N); 14859566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 1486899cda47SBarry Smith 148721940c7eSstefano_zampini B->preallocated = PETSC_TRUE; 148821940c7eSstefano_zampini 1489d0f46423SBarry Smith mbs = B->rmap->N / bs; 14904dcd73b1SHong Zhang nbs = B->cmap->n / bs; 149149b5e25fSSatish Balay bs2 = bs * bs; 149249b5e25fSSatish Balay 1493aed4548fSBarry Smith PetscCheck(mbs * bs == B->rmap->N && nbs * bs == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Number rows, cols must be divisible by blocksize"); 149449b5e25fSSatish Balay 1495ab93d7beSBarry Smith if (nz == MAT_SKIP_ALLOCATION) { 1496ab93d7beSBarry Smith skipallocation = PETSC_TRUE; 1497ab93d7beSBarry Smith nz = 0; 1498ab93d7beSBarry Smith } 1499ab93d7beSBarry Smith 1500435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3; 150108401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz); 150249b5e25fSSatish Balay if (nnz) { 150349b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 150408401ef6SPierre Jolivet PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]); 150508401ef6SPierre Jolivet PetscCheck(nnz[i] <= nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than block row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " block rowlength %" PetscInt_FMT, i, nnz[i], nbs); 150649b5e25fSSatish Balay } 150749b5e25fSSatish Balay } 150849b5e25fSSatish Balay 1509db4efbfdSBarry Smith B->ops->mult = MatMult_SeqSBAIJ_N; 1510db4efbfdSBarry Smith B->ops->multadd = MatMultAdd_SeqSBAIJ_N; 1511db4efbfdSBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_N; 1512db4efbfdSBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N; 151326fbe8dcSKarl Rupp 15149566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 151549b5e25fSSatish Balay if (!flg) { 151649b5e25fSSatish Balay switch (bs) { 151749b5e25fSSatish Balay case 1: 151849b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_1; 151949b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_1; 1520431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_1; 1521431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1; 152249b5e25fSSatish Balay break; 152349b5e25fSSatish Balay case 2: 152449b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_2; 152549b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_2; 1526431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_2; 1527431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2; 152849b5e25fSSatish Balay break; 152949b5e25fSSatish Balay case 3: 153049b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_3; 153149b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_3; 1532431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_3; 1533431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3; 153449b5e25fSSatish Balay break; 153549b5e25fSSatish Balay case 4: 153649b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_4; 153749b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_4; 1538431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_4; 1539431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4; 154049b5e25fSSatish Balay break; 154149b5e25fSSatish Balay case 5: 154249b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_5; 154349b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_5; 1544431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_5; 1545431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5; 154649b5e25fSSatish Balay break; 154749b5e25fSSatish Balay case 6: 154849b5e25fSSatish Balay B->ops->mult = MatMult_SeqSBAIJ_6; 154949b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_6; 1550431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_6; 1551431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6; 155249b5e25fSSatish Balay break; 155349b5e25fSSatish Balay case 7: 1554de53e5efSHong Zhang B->ops->mult = MatMult_SeqSBAIJ_7; 155549b5e25fSSatish Balay B->ops->multadd = MatMultAdd_SeqSBAIJ_7; 1556431c96f7SBarry Smith B->ops->multtranspose = MatMult_SeqSBAIJ_7; 1557431c96f7SBarry Smith B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7; 155849b5e25fSSatish Balay break; 155949b5e25fSSatish Balay } 156049b5e25fSSatish Balay } 156149b5e25fSSatish Balay 156249b5e25fSSatish Balay b->mbs = mbs; 15634dcd73b1SHong Zhang b->nbs = nbs; 1564ab93d7beSBarry Smith if (!skipallocation) { 15652ee49352SLisandro Dalcin if (!b->imax) { 15669566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(mbs, &b->imax, mbs, &b->ilen)); 156726fbe8dcSKarl Rupp 1568c760cd28SBarry Smith b->free_imax_ilen = PETSC_TRUE; 15692ee49352SLisandro Dalcin } 157049b5e25fSSatish Balay if (!nnz) { 1571435da068SBarry Smith if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5; 157249b5e25fSSatish Balay else if (nz <= 0) nz = 1; 15735d2a9ed1SStefano Zampini nz = PetscMin(nbs, nz); 157426fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->imax[i] = nz; 15759566063dSJacob Faibussowitsch PetscCall(PetscIntMultError(nz, mbs, &nz)); 157649b5e25fSSatish Balay } else { 1577c73702f5SBarry Smith PetscInt64 nz64 = 0; 15789371c9d4SSatish Balay for (i = 0; i < mbs; i++) { 15799371c9d4SSatish Balay b->imax[i] = nnz[i]; 15809371c9d4SSatish Balay nz64 += nnz[i]; 15819371c9d4SSatish Balay } 15829566063dSJacob Faibussowitsch PetscCall(PetscIntCast(nz64, &nz)); 158349b5e25fSSatish Balay } 15842ee49352SLisandro Dalcin /* b->ilen will count nonzeros in each block row so far. */ 158526fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) b->ilen[i] = 0; 15866c6c5352SBarry Smith /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */ 158749b5e25fSSatish Balay 158849b5e25fSSatish Balay /* allocate the matrix space */ 15899566063dSJacob Faibussowitsch PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i)); 15909566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &b->a, nz, &b->j, B->rmap->N + 1, &b->i)); 15919566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->a, nz * bs2)); 15929566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(b->j, nz)); 159326fbe8dcSKarl Rupp 159449b5e25fSSatish Balay b->singlemalloc = PETSC_TRUE; 159549b5e25fSSatish Balay 159649b5e25fSSatish Balay /* pointer to beginning of each row */ 1597e60cf9a0SBarry Smith b->i[0] = 0; 159826fbe8dcSKarl Rupp for (i = 1; i < mbs + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1]; 159926fbe8dcSKarl Rupp 1600e6b907acSBarry Smith b->free_a = PETSC_TRUE; 1601e6b907acSBarry Smith b->free_ij = PETSC_TRUE; 1602e811da20SHong Zhang } else { 1603e6b907acSBarry Smith b->free_a = PETSC_FALSE; 1604e6b907acSBarry Smith b->free_ij = PETSC_FALSE; 1605ab93d7beSBarry Smith } 160649b5e25fSSatish Balay 160749b5e25fSSatish Balay b->bs2 = bs2; 16086c6c5352SBarry Smith b->nz = 0; 1609b32cb4a7SJed Brown b->maxnz = nz; 1610f4259b30SLisandro Dalcin b->inew = NULL; 1611f4259b30SLisandro Dalcin b->jnew = NULL; 1612f4259b30SLisandro Dalcin b->anew = NULL; 1613f4259b30SLisandro Dalcin b->a2anew = NULL; 16141a3463dfSHong Zhang b->permute = PETSC_FALSE; 1615cb7b82ddSBarry Smith 1616cb7b82ddSBarry Smith B->was_assembled = PETSC_FALSE; 1617cb7b82ddSBarry Smith B->assembled = PETSC_FALSE; 16189566063dSJacob Faibussowitsch if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE)); 16193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1620c464158bSHong Zhang } 1621153ea458SHong Zhang 1622d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B, PetscInt bs, const PetscInt ii[], const PetscInt jj[], const PetscScalar V[]) 1623d71ae5a4SJacob Faibussowitsch { 16240cd7f59aSBarry Smith PetscInt i, j, m, nz, anz, nz_max = 0, *nnz; 1625f4259b30SLisandro Dalcin PetscScalar *values = NULL; 162638f409ebSLisandro Dalcin PetscBool roworiented = ((Mat_SeqSBAIJ *)B->data)->roworiented; 16270cd7f59aSBarry Smith 162838f409ebSLisandro Dalcin PetscFunctionBegin; 162908401ef6SPierre Jolivet PetscCheck(bs >= 1, PetscObjectComm((PetscObject)B), PETSC_ERR_ARG_OUTOFRANGE, "Invalid block size specified, must be positive but it is %" PetscInt_FMT, bs); 16309566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->rmap, bs)); 16319566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetBlockSize(B->cmap, bs)); 16329566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->rmap)); 16339566063dSJacob Faibussowitsch PetscCall(PetscLayoutSetUp(B->cmap)); 16349566063dSJacob Faibussowitsch PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs)); 163538f409ebSLisandro Dalcin m = B->rmap->n / bs; 163638f409ebSLisandro Dalcin 1637aed4548fSBarry Smith PetscCheck(!ii[0], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "ii[0] must be 0 but it is %" PetscInt_FMT, ii[0]); 16389566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(m + 1, &nnz)); 163938f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 164038f409ebSLisandro Dalcin nz = ii[i + 1] - ii[i]; 164108401ef6SPierre Jolivet PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz); 16420cd7f59aSBarry Smith anz = 0; 16430cd7f59aSBarry Smith for (j = 0; j < nz; j++) { 16440cd7f59aSBarry Smith /* count only values on the diagonal or above */ 16450cd7f59aSBarry Smith if (jj[ii[i] + j] >= i) { 16460cd7f59aSBarry Smith anz = nz - j; 16470cd7f59aSBarry Smith break; 16480cd7f59aSBarry Smith } 16490cd7f59aSBarry Smith } 16500cd7f59aSBarry Smith nz_max = PetscMax(nz_max, anz); 16510cd7f59aSBarry Smith nnz[i] = anz; 165238f409ebSLisandro Dalcin } 16539566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz)); 16549566063dSJacob Faibussowitsch PetscCall(PetscFree(nnz)); 165538f409ebSLisandro Dalcin 165638f409ebSLisandro Dalcin values = (PetscScalar *)V; 165748a46eb9SPierre Jolivet if (!values) PetscCall(PetscCalloc1(bs * bs * nz_max, &values)); 165838f409ebSLisandro Dalcin for (i = 0; i < m; i++) { 165938f409ebSLisandro Dalcin PetscInt ncols = ii[i + 1] - ii[i]; 166038f409ebSLisandro Dalcin const PetscInt *icols = jj + ii[i]; 166138f409ebSLisandro Dalcin if (!roworiented || bs == 1) { 166238f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * ii[i]) : 0); 16639566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, ncols, icols, svals, INSERT_VALUES)); 166438f409ebSLisandro Dalcin } else { 166538f409ebSLisandro Dalcin for (j = 0; j < ncols; j++) { 166638f409ebSLisandro Dalcin const PetscScalar *svals = values + (V ? (bs * bs * (ii[i] + j)) : 0); 16679566063dSJacob Faibussowitsch PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, 1, &icols[j], svals, INSERT_VALUES)); 166838f409ebSLisandro Dalcin } 166938f409ebSLisandro Dalcin } 167038f409ebSLisandro Dalcin } 16719566063dSJacob Faibussowitsch if (!V) PetscCall(PetscFree(values)); 16729566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY)); 16739566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY)); 16749566063dSJacob Faibussowitsch PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 16753ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 167638f409ebSLisandro Dalcin } 167738f409ebSLisandro Dalcin 1678db4efbfdSBarry Smith /* 1679db4efbfdSBarry Smith This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization 1680db4efbfdSBarry Smith */ 1681d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B, PetscBool natural) 1682d71ae5a4SJacob Faibussowitsch { 1683ace3abfcSBarry Smith PetscBool flg = PETSC_FALSE; 1684db4efbfdSBarry Smith PetscInt bs = B->rmap->bs; 1685db4efbfdSBarry Smith 1686db4efbfdSBarry Smith PetscFunctionBegin; 16879566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL)); 1688db4efbfdSBarry Smith if (flg) bs = 8; 1689db4efbfdSBarry Smith 1690db4efbfdSBarry Smith if (!natural) { 1691db4efbfdSBarry Smith switch (bs) { 1692d71ae5a4SJacob Faibussowitsch case 1: 1693d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace; 1694d71ae5a4SJacob Faibussowitsch break; 1695d71ae5a4SJacob Faibussowitsch case 2: 1696d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2; 1697d71ae5a4SJacob Faibussowitsch break; 1698d71ae5a4SJacob Faibussowitsch case 3: 1699d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3; 1700d71ae5a4SJacob Faibussowitsch break; 1701d71ae5a4SJacob Faibussowitsch case 4: 1702d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4; 1703d71ae5a4SJacob Faibussowitsch break; 1704d71ae5a4SJacob Faibussowitsch case 5: 1705d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5; 1706d71ae5a4SJacob Faibussowitsch break; 1707d71ae5a4SJacob Faibussowitsch case 6: 1708d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6; 1709d71ae5a4SJacob Faibussowitsch break; 1710d71ae5a4SJacob Faibussowitsch case 7: 1711d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7; 1712d71ae5a4SJacob Faibussowitsch break; 1713d71ae5a4SJacob Faibussowitsch default: 1714d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N; 1715d71ae5a4SJacob Faibussowitsch break; 1716db4efbfdSBarry Smith } 1717db4efbfdSBarry Smith } else { 1718db4efbfdSBarry Smith switch (bs) { 1719d71ae5a4SJacob Faibussowitsch case 1: 1720d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace; 1721d71ae5a4SJacob Faibussowitsch break; 1722d71ae5a4SJacob Faibussowitsch case 2: 1723d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering; 1724d71ae5a4SJacob Faibussowitsch break; 1725d71ae5a4SJacob Faibussowitsch case 3: 1726d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering; 1727d71ae5a4SJacob Faibussowitsch break; 1728d71ae5a4SJacob Faibussowitsch case 4: 1729d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering; 1730d71ae5a4SJacob Faibussowitsch break; 1731d71ae5a4SJacob Faibussowitsch case 5: 1732d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering; 1733d71ae5a4SJacob Faibussowitsch break; 1734d71ae5a4SJacob Faibussowitsch case 6: 1735d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering; 1736d71ae5a4SJacob Faibussowitsch break; 1737d71ae5a4SJacob Faibussowitsch case 7: 1738d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering; 1739d71ae5a4SJacob Faibussowitsch break; 1740d71ae5a4SJacob Faibussowitsch default: 1741d71ae5a4SJacob Faibussowitsch B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering; 1742d71ae5a4SJacob Faibussowitsch break; 1743db4efbfdSBarry Smith } 1744db4efbfdSBarry Smith } 17453ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1746db4efbfdSBarry Smith } 1747db4efbfdSBarry Smith 1748cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType, MatReuse, Mat *); 1749cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType, MatReuse, Mat *); 1750d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatFactorGetSolverType_petsc(Mat A, MatSolverType *type) 1751d71ae5a4SJacob Faibussowitsch { 17524ac6704cSBarry Smith PetscFunctionBegin; 17534ac6704cSBarry Smith *type = MATSOLVERPETSC; 17543ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17554ac6704cSBarry Smith } 1756d769727bSBarry Smith 1757d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A, MatFactorType ftype, Mat *B) 1758d71ae5a4SJacob Faibussowitsch { 1759d0f46423SBarry Smith PetscInt n = A->rmap->n; 17605c9eb25fSBarry Smith 17615c9eb25fSBarry Smith PetscFunctionBegin; 17620e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX) 176303e5aca4SStefano Zampini if ((ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) && A->hermitian == PETSC_BOOL3_TRUE && A->symmetric != PETSC_BOOL3_TRUE) { 176403e5aca4SStefano Zampini PetscCall(PetscInfo(A, "Hermitian MAT_FACTOR_CHOLESKY or MAT_FACTOR_ICC are not supported. Use MAT_FACTOR_LU instead.\n")); 176503e5aca4SStefano Zampini *B = NULL; 176603e5aca4SStefano Zampini PetscFunctionReturn(PETSC_SUCCESS); 176703e5aca4SStefano Zampini } 17680e92d65fSHong Zhang #endif 1769eb1ec7c1SStefano Zampini 17709566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B)); 17719566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*B, n, n, n, n)); 17725c9eb25fSBarry Smith if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) { 17739566063dSJacob Faibussowitsch PetscCall(MatSetType(*B, MATSEQSBAIJ)); 17749566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*B, A->rmap->bs, MAT_SKIP_ALLOCATION, NULL)); 177526fbe8dcSKarl Rupp 17767b056e98SHong Zhang (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ; 1777c6d0d4f0SHong Zhang (*B)->ops->iccfactorsymbolic = MatICCFactorSymbolic_SeqSBAIJ; 17789566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_CHOLESKY])); 17799566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_ICC])); 1780e32f2f54SBarry Smith } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "Factor type not supported"); 178100c67f3bSHong Zhang 1782d5f3da31SBarry Smith (*B)->factortype = ftype; 1783f73b0415SBarry Smith (*B)->canuseordering = PETSC_TRUE; 17849566063dSJacob Faibussowitsch PetscCall(PetscFree((*B)->solvertype)); 17859566063dSJacob Faibussowitsch PetscCall(PetscStrallocpy(MATSOLVERPETSC, &(*B)->solvertype)); 17869566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)*B, "MatFactorGetSolverType_C", MatFactorGetSolverType_petsc)); 17873ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 17885c9eb25fSBarry Smith } 17895c9eb25fSBarry Smith 17908397e458SBarry Smith /*@C 17912ef1f0ffSBarry Smith MatSeqSBAIJGetArray - gives access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored 17928397e458SBarry Smith 17938397e458SBarry Smith Not Collective 17948397e458SBarry Smith 17958397e458SBarry Smith Input Parameter: 1796fe59aa6dSJacob Faibussowitsch . A - a `MATSEQSBAIJ` matrix 17978397e458SBarry Smith 17988397e458SBarry Smith Output Parameter: 17998397e458SBarry Smith . array - pointer to the data 18008397e458SBarry Smith 18018397e458SBarry Smith Level: intermediate 18028397e458SBarry Smith 18031cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJRestoreArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18048397e458SBarry Smith @*/ 1805d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJGetArray(Mat A, PetscScalar **array) 1806d71ae5a4SJacob Faibussowitsch { 18078397e458SBarry Smith PetscFunctionBegin; 1808cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJGetArray_C", (Mat, PetscScalar **), (A, array)); 18093ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18108397e458SBarry Smith } 18118397e458SBarry Smith 18128397e458SBarry Smith /*@C 18132ef1f0ffSBarry Smith MatSeqSBAIJRestoreArray - returns access to the array where the numerical data for a `MATSEQSBAIJ` matrix is stored obtained by `MatSeqSBAIJGetArray()` 18148397e458SBarry Smith 18158397e458SBarry Smith Not Collective 18168397e458SBarry Smith 18178397e458SBarry Smith Input Parameters: 1818fe59aa6dSJacob Faibussowitsch + A - a `MATSEQSBAIJ` matrix 1819a2b725a8SWilliam Gropp - array - pointer to the data 18208397e458SBarry Smith 18218397e458SBarry Smith Level: intermediate 18228397e458SBarry Smith 18231cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatSeqSBAIJGetArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()` 18248397e458SBarry Smith @*/ 1825d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJRestoreArray(Mat A, PetscScalar **array) 1826d71ae5a4SJacob Faibussowitsch { 18278397e458SBarry Smith PetscFunctionBegin; 1828cac4c232SBarry Smith PetscUseMethod(A, "MatSeqSBAIJRestoreArray_C", (Mat, PetscScalar **), (A, array)); 18293ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 18308397e458SBarry Smith } 18318397e458SBarry Smith 18320bad9183SKris Buschelman /*MC 1833fafad747SKris Buschelman MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices, 18340bad9183SKris Buschelman based on block compressed sparse row format. Only the upper triangular portion of the matrix is stored. 18350bad9183SKris Buschelman 1836828413b8SBarry Smith For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you 183711a5261eSBarry Smith can call `MatSetOption`(`Mat`, `MAT_HERMITIAN`). 1838828413b8SBarry Smith 18392ef1f0ffSBarry Smith Options Database Key: 184011a5261eSBarry Smith . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to `MatSetFromOptions()` 18410bad9183SKris Buschelman 18422ef1f0ffSBarry Smith Level: beginner 18432ef1f0ffSBarry Smith 184495452b02SPatrick Sanan Notes: 184595452b02SPatrick Sanan By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not 184611a5261eSBarry Smith stored and it is assumed they symmetric to the upper triangular). If you call `MatSetOption`(`Mat`,`MAT_IGNORE_LOWER_TRIANGULAR`,`PETSC_FALSE`) or use 18472ef1f0ffSBarry Smith the options database `-mat_ignore_lower_triangular` false it will generate an error if you try to set a value in the lower triangular portion. 184871dad5bbSBarry Smith 1849476417e5SBarry Smith The number of rows in the matrix must be less than or equal to the number of columns 185071dad5bbSBarry Smith 18511cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreateSeqSBAIJ()`, `MatType`, `MATMPISBAIJ` 18520bad9183SKris Buschelman M*/ 1853d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B) 1854d71ae5a4SJacob Faibussowitsch { 1855a23d5eceSKris Buschelman Mat_SeqSBAIJ *b; 185613f74950SBarry Smith PetscMPIInt size; 1857ace3abfcSBarry Smith PetscBool no_unroll = PETSC_FALSE, no_inode = PETSC_FALSE; 1858a23d5eceSKris Buschelman 1859a23d5eceSKris Buschelman PetscFunctionBegin; 18609566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size)); 186108401ef6SPierre Jolivet PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Comm must be of size 1"); 1862a23d5eceSKris Buschelman 18634dfa11a4SJacob Faibussowitsch PetscCall(PetscNew(&b)); 1864a23d5eceSKris Buschelman B->data = (void *)b; 1865aea10558SJacob Faibussowitsch B->ops[0] = MatOps_Values; 186626fbe8dcSKarl Rupp 1867a23d5eceSKris Buschelman B->ops->destroy = MatDestroy_SeqSBAIJ; 1868a23d5eceSKris Buschelman B->ops->view = MatView_SeqSBAIJ; 1869f4259b30SLisandro Dalcin b->row = NULL; 1870f4259b30SLisandro Dalcin b->icol = NULL; 1871a23d5eceSKris Buschelman b->reallocs = 0; 1872f4259b30SLisandro Dalcin b->saved_values = NULL; 18730def2e27SBarry Smith b->inode.limit = 5; 18740def2e27SBarry Smith b->inode.max_limit = 5; 1875a23d5eceSKris Buschelman 1876a23d5eceSKris Buschelman b->roworiented = PETSC_TRUE; 1877a23d5eceSKris Buschelman b->nonew = 0; 1878f4259b30SLisandro Dalcin b->diag = NULL; 1879f4259b30SLisandro Dalcin b->solve_work = NULL; 1880f4259b30SLisandro Dalcin b->mult_work = NULL; 1881f4259b30SLisandro Dalcin B->spptr = NULL; 1882f2cbd3d5SJed Brown B->info.nz_unneeded = (PetscReal)b->maxnz * b->bs2; 1883a9817697SBarry Smith b->keepnonzeropattern = PETSC_FALSE; 1884a23d5eceSKris Buschelman 1885f4259b30SLisandro Dalcin b->inew = NULL; 1886f4259b30SLisandro Dalcin b->jnew = NULL; 1887f4259b30SLisandro Dalcin b->anew = NULL; 1888f4259b30SLisandro Dalcin b->a2anew = NULL; 1889a23d5eceSKris Buschelman b->permute = PETSC_FALSE; 1890a23d5eceSKris Buschelman 189171dad5bbSBarry Smith b->ignore_ltriangular = PETSC_TRUE; 189226fbe8dcSKarl Rupp 18939566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_ignore_lower_triangular", &b->ignore_ltriangular, NULL)); 1894941593c8SHong Zhang 1895f5edf698SHong Zhang b->getrow_utriangular = PETSC_FALSE; 189626fbe8dcSKarl Rupp 18979566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_getrow_uppertriangular", &b->getrow_utriangular, NULL)); 1898f5edf698SHong Zhang 18999566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJGetArray_C", MatSeqSBAIJGetArray_SeqSBAIJ)); 19009566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJRestoreArray_C", MatSeqSBAIJRestoreArray_SeqSBAIJ)); 19019566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqSBAIJ)); 19029566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqSBAIJ)); 19039566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetColumnIndices_C", MatSeqSBAIJSetColumnIndices_SeqSBAIJ)); 19049566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqaij_C", MatConvert_SeqSBAIJ_SeqAIJ)); 19059566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqbaij_C", MatConvert_SeqSBAIJ_SeqBAIJ)); 19069566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocation_C", MatSeqSBAIJSetPreallocation_SeqSBAIJ)); 19079566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocationCSR_C", MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ)); 19086214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL) 19099566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_elemental_C", MatConvert_SeqSBAIJ_Elemental)); 19106214f412SHong Zhang #endif 1911d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK) 19129566063dSJacob Faibussowitsch PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_scalapack_C", MatConvert_SBAIJ_ScaLAPACK)); 1913d24d4204SJose E. Roman #endif 191423ce1328SBarry Smith 1915b94d7dedSBarry Smith B->symmetry_eternal = PETSC_TRUE; 1916b94d7dedSBarry Smith B->structural_symmetry_eternal = PETSC_TRUE; 1917b94d7dedSBarry Smith B->symmetric = PETSC_BOOL3_TRUE; 1918b94d7dedSBarry Smith B->structurally_symmetric = PETSC_BOOL3_TRUE; 1919eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX) 1920b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_FALSE; 1921eb1ec7c1SStefano Zampini #else 1922b94d7dedSBarry Smith B->hermitian = PETSC_BOOL3_TRUE; 1923eb1ec7c1SStefano Zampini #endif 192413647f61SHong Zhang 19259566063dSJacob Faibussowitsch PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQSBAIJ)); 19260def2e27SBarry Smith 1927d0609cedSBarry Smith PetscOptionsBegin(PetscObjectComm((PetscObject)B), ((PetscObject)B)->prefix, "Options for SEQSBAIJ matrix", "Mat"); 19289566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_unroll", "Do not optimize for inodes (slower)", NULL, no_unroll, &no_unroll, NULL)); 192948a46eb9SPierre Jolivet if (no_unroll) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_unroll\n")); 19309566063dSJacob Faibussowitsch PetscCall(PetscOptionsBool("-mat_no_inode", "Do not optimize for inodes (slower)", NULL, no_inode, &no_inode, NULL)); 19319566063dSJacob Faibussowitsch if (no_inode) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_inode\n")); 19329566063dSJacob Faibussowitsch PetscCall(PetscOptionsInt("-mat_inode_limit", "Do not use inodes larger then this value", NULL, b->inode.limit, &b->inode.limit, NULL)); 1933d0609cedSBarry Smith PetscOptionsEnd(); 1934ace3abfcSBarry Smith b->inode.use = (PetscBool)(!(no_unroll || no_inode)); 19350def2e27SBarry Smith if (b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit; 19363ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1937a23d5eceSKris Buschelman } 1938a23d5eceSKris Buschelman 1939a23d5eceSKris Buschelman /*@C 1940a23d5eceSKris Buschelman MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block 194111a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 194220f4b53cSBarry Smith user should preallocate the matrix storage by setting the parameter `nz` 194320f4b53cSBarry Smith (or the array `nnz`). 1944a23d5eceSKris Buschelman 1945c3339decSBarry Smith Collective 1946a23d5eceSKris Buschelman 1947a23d5eceSKris Buschelman Input Parameters: 19481c4f3114SJed Brown + B - the symmetric matrix 194911a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 195011a5261eSBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()` 1951a23d5eceSKris Buschelman . nz - number of block nonzeros per block row (same for all rows) 1952a23d5eceSKris Buschelman - nnz - array containing the number of block nonzeros in the upper triangular plus 19532ef1f0ffSBarry Smith diagonal portion of each block (possibly different for each block row) or `NULL` 1954a23d5eceSKris Buschelman 1955a23d5eceSKris Buschelman Options Database Keys: 1956a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 1957a23d5eceSKris Buschelman block calculations (much slower) 1958a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use (only works if a negative bs is passed in 1959a23d5eceSKris Buschelman 1960a23d5eceSKris Buschelman Level: intermediate 1961a23d5eceSKris Buschelman 1962a23d5eceSKris Buschelman Notes: 196320f4b53cSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 19642ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 1965651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 1966a23d5eceSKris Buschelman 196711a5261eSBarry Smith You can call `MatGetInfo()` to get information on how effective the preallocation was; 1968aa95bbe8SBarry Smith for example the fields mallocs,nz_allocated,nz_used,nz_unneeded; 19692ef1f0ffSBarry Smith You can also run with the option `-info` and look for messages with the string 1970aa95bbe8SBarry Smith malloc in them to see if additional memory allocation was needed. 1971aa95bbe8SBarry Smith 19722ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 197349a6f317SBarry Smith 19741cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 1975a23d5eceSKris Buschelman @*/ 1976d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[]) 1977d71ae5a4SJacob Faibussowitsch { 1978a23d5eceSKris Buschelman PetscFunctionBegin; 19796ba663aaSJed Brown PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 19806ba663aaSJed Brown PetscValidType(B, 1); 19816ba663aaSJed Brown PetscValidLogicalCollectiveInt(B, bs, 2); 1982cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocation_C", (Mat, PetscInt, PetscInt, const PetscInt[]), (B, bs, nz, nnz)); 19833ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 1984a23d5eceSKris Buschelman } 198549b5e25fSSatish Balay 198638f409ebSLisandro Dalcin /*@C 198711a5261eSBarry Smith MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in `MATSEQSBAIJ` format using the given nonzero structure and (optional) numerical values 198838f409ebSLisandro Dalcin 198938f409ebSLisandro Dalcin Input Parameters: 19901c4f3114SJed Brown + B - the matrix 1991eab78319SHong Zhang . bs - size of block, the blocks are ALWAYS square. 199238f409ebSLisandro Dalcin . i - the indices into j for the start of each local row (starts with zero) 199338f409ebSLisandro Dalcin . j - the column indices for each local row (starts with zero) these must be sorted for each row 199438f409ebSLisandro Dalcin - v - optional values in the matrix 199538f409ebSLisandro Dalcin 1996664954b6SBarry Smith Level: advanced 199738f409ebSLisandro Dalcin 199838f409ebSLisandro Dalcin Notes: 199911a5261eSBarry Smith The order of the entries in values is specified by the `MatOption` `MAT_ROW_ORIENTED`. For example, C programs 200011a5261eSBarry Smith may want to use the default `MAT_ROW_ORIENTED` = `PETSC_TRUE` and use an array v[nnz][bs][bs] where the second index is 200138f409ebSLisandro Dalcin over rows within a block and the last index is over columns within a block row. Fortran programs will likely set 200211a5261eSBarry Smith `MAT_ROW_ORIENTED` = `PETSC_FALSE` and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a 200338f409ebSLisandro Dalcin block column and the second index is over columns within a block. 200438f409ebSLisandro Dalcin 200550c5228eSBarry Smith Any entries below the diagonal are ignored 20060cd7f59aSBarry Smith 20070cd7f59aSBarry Smith Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries 20080cd7f59aSBarry Smith and usually the numerical values as well 2009664954b6SBarry Smith 2010fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqSBAIJ()`, `MatSetValuesBlocked()`, `MatSeqSBAIJSetPreallocation()` 201138f409ebSLisandro Dalcin @*/ 2012d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B, PetscInt bs, const PetscInt i[], const PetscInt j[], const PetscScalar v[]) 2013d71ae5a4SJacob Faibussowitsch { 201438f409ebSLisandro Dalcin PetscFunctionBegin; 201538f409ebSLisandro Dalcin PetscValidHeaderSpecific(B, MAT_CLASSID, 1); 201638f409ebSLisandro Dalcin PetscValidType(B, 1); 201738f409ebSLisandro Dalcin PetscValidLogicalCollectiveInt(B, bs, 2); 2018cac4c232SBarry Smith PetscTryMethod(B, "MatSeqSBAIJSetPreallocationCSR_C", (Mat, PetscInt, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, bs, i, j, v)); 20193ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 202038f409ebSLisandro Dalcin } 202138f409ebSLisandro Dalcin 2022c464158bSHong Zhang /*@C 20232ef1f0ffSBarry Smith MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in (block 202411a5261eSBarry Smith compressed row) `MATSEQSBAIJ` format. For good matrix assembly performance the 20252ef1f0ffSBarry Smith user should preallocate the matrix storage by setting the parameter `nz` 20262ef1f0ffSBarry Smith (or the array `nnz`). 202749b5e25fSSatish Balay 2028d083f849SBarry Smith Collective 2029c464158bSHong Zhang 2030c464158bSHong Zhang Input Parameters: 203111a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF` 203211a5261eSBarry Smith . bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row 2033bb7ae925SBarry Smith blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs() 203420f4b53cSBarry Smith . m - number of rows 203520f4b53cSBarry Smith . n - number of columns 2036c464158bSHong Zhang . nz - number of block nonzeros per block row (same for all rows) 2037744e8345SSatish Balay - nnz - array containing the number of block nonzeros in the upper triangular plus 20382ef1f0ffSBarry Smith diagonal portion of each block (possibly different for each block row) or `NULL` 2039c464158bSHong Zhang 2040c464158bSHong Zhang Output Parameter: 2041c464158bSHong Zhang . A - the symmetric matrix 2042c464158bSHong Zhang 2043c464158bSHong Zhang Options Database Keys: 2044a2b725a8SWilliam Gropp + -mat_no_unroll - uses code that does not unroll the loops in the 2045c464158bSHong Zhang block calculations (much slower) 2046a2b725a8SWilliam Gropp - -mat_block_size - size of the blocks to use 2047c464158bSHong Zhang 2048c464158bSHong Zhang Level: intermediate 2049c464158bSHong Zhang 20502ef1f0ffSBarry Smith Notes: 205111a5261eSBarry Smith It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`, 2052f6f02116SRichard Tran Mills MatXXXXSetPreallocation() paradigm instead of this routine directly. 205311a5261eSBarry Smith [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`] 2054175b88e8SBarry Smith 20556d6d819aSHong Zhang The number of rows and columns must be divisible by blocksize. 20566d6d819aSHong Zhang This matrix type does not support complex Hermitian operation. 2057c464158bSHong Zhang 20582ef1f0ffSBarry Smith Specify the preallocated storage with either `nz` or `nnz` (not both). 20592ef1f0ffSBarry Smith Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory 2060651615e1SBarry Smith allocation. See [Sparse Matrices](sec_matsparse) for details. 2061c464158bSHong Zhang 20622ef1f0ffSBarry Smith If the `nnz` parameter is given then the `nz` parameter is ignored 206349a6f317SBarry Smith 20641cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()` 2065c464158bSHong Zhang @*/ 2066d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A) 2067d71ae5a4SJacob Faibussowitsch { 2068c464158bSHong Zhang PetscFunctionBegin; 20699566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, A)); 20709566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*A, m, n, m, n)); 20719566063dSJacob Faibussowitsch PetscCall(MatSetType(*A, MATSEQSBAIJ)); 20729566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*A, bs, nz, (PetscInt *)nnz)); 20733ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 207449b5e25fSSatish Balay } 207549b5e25fSSatish Balay 2076d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B) 2077d71ae5a4SJacob Faibussowitsch { 207849b5e25fSSatish Balay Mat C; 207949b5e25fSSatish Balay Mat_SeqSBAIJ *c, *a = (Mat_SeqSBAIJ *)A->data; 2080b40805acSSatish Balay PetscInt i, mbs = a->mbs, nz = a->nz, bs2 = a->bs2; 208149b5e25fSSatish Balay 208249b5e25fSSatish Balay PetscFunctionBegin; 208331fe6a7dSBarry Smith PetscCheck(A->assembled, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix"); 208408401ef6SPierre Jolivet PetscCheck(a->i[mbs] == nz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Corrupt matrix"); 208549b5e25fSSatish Balay 2086f4259b30SLisandro Dalcin *B = NULL; 20879566063dSJacob Faibussowitsch PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C)); 20889566063dSJacob Faibussowitsch PetscCall(MatSetSizes(C, A->rmap->N, A->cmap->n, A->rmap->N, A->cmap->n)); 20899566063dSJacob Faibussowitsch PetscCall(MatSetBlockSizesFromMats(C, A, A)); 20909566063dSJacob Faibussowitsch PetscCall(MatSetType(C, MATSEQSBAIJ)); 2091692f9cbeSHong Zhang c = (Mat_SeqSBAIJ *)C->data; 2092692f9cbeSHong Zhang 2093273d9f13SBarry Smith C->preallocated = PETSC_TRUE; 2094d5f3da31SBarry Smith C->factortype = A->factortype; 2095f4259b30SLisandro Dalcin c->row = NULL; 2096f4259b30SLisandro Dalcin c->icol = NULL; 2097f4259b30SLisandro Dalcin c->saved_values = NULL; 2098a9817697SBarry Smith c->keepnonzeropattern = a->keepnonzeropattern; 209949b5e25fSSatish Balay C->assembled = PETSC_TRUE; 210049b5e25fSSatish Balay 21019566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->rmap, &C->rmap)); 21029566063dSJacob Faibussowitsch PetscCall(PetscLayoutReference(A->cmap, &C->cmap)); 210349b5e25fSSatish Balay c->bs2 = a->bs2; 210449b5e25fSSatish Balay c->mbs = a->mbs; 210549b5e25fSSatish Balay c->nbs = a->nbs; 210649b5e25fSSatish Balay 2107c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2108c760cd28SBarry Smith c->imax = a->imax; 2109c760cd28SBarry Smith c->ilen = a->ilen; 2110c760cd28SBarry Smith c->free_imax_ilen = PETSC_FALSE; 2111c760cd28SBarry Smith } else { 21129566063dSJacob Faibussowitsch PetscCall(PetscMalloc2((mbs + 1), &c->imax, (mbs + 1), &c->ilen)); 211349b5e25fSSatish Balay for (i = 0; i < mbs; i++) { 211449b5e25fSSatish Balay c->imax[i] = a->imax[i]; 211549b5e25fSSatish Balay c->ilen[i] = a->ilen[i]; 211649b5e25fSSatish Balay } 2117c760cd28SBarry Smith c->free_imax_ilen = PETSC_TRUE; 2118c760cd28SBarry Smith } 211949b5e25fSSatish Balay 212049b5e25fSSatish Balay /* allocate the matrix space */ 21214da8f245SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 21229566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(bs2 * nz, &c->a)); 212344e1c64aSLisandro Dalcin c->i = a->i; 212444e1c64aSLisandro Dalcin c->j = a->j; 21254da8f245SBarry Smith c->singlemalloc = PETSC_FALSE; 212644e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21274da8f245SBarry Smith c->free_ij = PETSC_FALSE; 21284da8f245SBarry Smith c->parent = A; 21299566063dSJacob Faibussowitsch PetscCall(PetscObjectReference((PetscObject)A)); 21309566063dSJacob Faibussowitsch PetscCall(MatSetOption(A, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21319566063dSJacob Faibussowitsch PetscCall(MatSetOption(C, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE)); 21324da8f245SBarry Smith } else { 21339566063dSJacob Faibussowitsch PetscCall(PetscMalloc3(bs2 * nz, &c->a, nz, &c->j, mbs + 1, &c->i)); 21349566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->i, a->i, mbs + 1)); 21354da8f245SBarry Smith c->singlemalloc = PETSC_TRUE; 213644e1c64aSLisandro Dalcin c->free_a = PETSC_TRUE; 21374da8f245SBarry Smith c->free_ij = PETSC_TRUE; 21384da8f245SBarry Smith } 213949b5e25fSSatish Balay if (mbs > 0) { 214048a46eb9SPierre Jolivet if (cpvalues != MAT_SHARE_NONZERO_PATTERN) PetscCall(PetscArraycpy(c->j, a->j, nz)); 214149b5e25fSSatish Balay if (cpvalues == MAT_COPY_VALUES) { 21429566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->a, a->a, bs2 * nz)); 214349b5e25fSSatish Balay } else { 21449566063dSJacob Faibussowitsch PetscCall(PetscArrayzero(c->a, bs2 * nz)); 214549b5e25fSSatish Balay } 2146a1c3900fSBarry Smith if (a->jshort) { 214744e1c64aSLisandro Dalcin /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */ 214844e1c64aSLisandro Dalcin /* if the parent matrix is reassembled, this child matrix will never notice */ 21499566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nz, &c->jshort)); 21509566063dSJacob Faibussowitsch PetscCall(PetscArraycpy(c->jshort, a->jshort, nz)); 215126fbe8dcSKarl Rupp 21524da8f245SBarry Smith c->free_jshort = PETSC_TRUE; 21534da8f245SBarry Smith } 2154a1c3900fSBarry Smith } 215549b5e25fSSatish Balay 215649b5e25fSSatish Balay c->roworiented = a->roworiented; 215749b5e25fSSatish Balay c->nonew = a->nonew; 215849b5e25fSSatish Balay 215949b5e25fSSatish Balay if (a->diag) { 2160c760cd28SBarry Smith if (cpvalues == MAT_SHARE_NONZERO_PATTERN) { 2161c760cd28SBarry Smith c->diag = a->diag; 2162c760cd28SBarry Smith c->free_diag = PETSC_FALSE; 2163c760cd28SBarry Smith } else { 21649566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(mbs, &c->diag)); 216526fbe8dcSKarl Rupp for (i = 0; i < mbs; i++) c->diag[i] = a->diag[i]; 2166c760cd28SBarry Smith c->free_diag = PETSC_TRUE; 2167c760cd28SBarry Smith } 216844e1c64aSLisandro Dalcin } 21696c6c5352SBarry Smith c->nz = a->nz; 2170f2cbd3d5SJed Brown c->maxnz = a->nz; /* Since we allocate exactly the right amount */ 2171f4259b30SLisandro Dalcin c->solve_work = NULL; 2172f4259b30SLisandro Dalcin c->mult_work = NULL; 217326fbe8dcSKarl Rupp 217449b5e25fSSatish Balay *B = C; 21759566063dSJacob Faibussowitsch PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist)); 21763ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 217749b5e25fSSatish Balay } 217849b5e25fSSatish Balay 2179618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */ 2180618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary 2181618cc2edSLisandro Dalcin 2182d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqSBAIJ(Mat mat, PetscViewer viewer) 2183d71ae5a4SJacob Faibussowitsch { 21847f489da9SVaclav Hapla PetscBool isbinary; 21852f480046SShri Abhyankar 21862f480046SShri Abhyankar PetscFunctionBegin; 21879566063dSJacob Faibussowitsch PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary)); 218828b400f6SJacob Faibussowitsch PetscCheck(isbinary, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)mat)->type_name); 21899566063dSJacob Faibussowitsch PetscCall(MatLoad_SeqSBAIJ_Binary(mat, viewer)); 21903ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 21912f480046SShri Abhyankar } 21922f480046SShri Abhyankar 2193c75a6043SHong Zhang /*@ 219411a5261eSBarry Smith MatCreateSeqSBAIJWithArrays - Creates an sequential `MATSEQSBAIJ` matrix using matrix elements 2195c75a6043SHong Zhang (upper triangular entries in CSR format) provided by the user. 2196c75a6043SHong Zhang 2197d083f849SBarry Smith Collective 2198c75a6043SHong Zhang 2199c75a6043SHong Zhang Input Parameters: 2200c75a6043SHong Zhang + comm - must be an MPI communicator of size 1 2201c75a6043SHong Zhang . bs - size of block 2202c75a6043SHong Zhang . m - number of rows 2203c75a6043SHong Zhang . n - number of columns 2204483a2f95SBarry Smith . i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that row block row of the matrix 2205c75a6043SHong Zhang . j - column indices 2206c75a6043SHong Zhang - a - matrix values 2207c75a6043SHong Zhang 2208c75a6043SHong Zhang Output Parameter: 2209c75a6043SHong Zhang . mat - the matrix 2210c75a6043SHong Zhang 2211dfb205c3SBarry Smith Level: advanced 2212c75a6043SHong Zhang 2213c75a6043SHong Zhang Notes: 22142ef1f0ffSBarry Smith The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays 2215c75a6043SHong Zhang once the matrix is destroyed 2216c75a6043SHong Zhang 2217c75a6043SHong Zhang You cannot set new nonzero locations into this matrix, that will generate an error. 2218c75a6043SHong Zhang 22192ef1f0ffSBarry Smith The `i` and `j` indices are 0 based 2220c75a6043SHong Zhang 22212ef1f0ffSBarry Smith When block size is greater than 1 the matrix values must be stored using the `MATSBAIJ` storage format. For block size of 1 2222dfb205c3SBarry Smith it is the regular CSR format excluding the lower triangular elements. 2223dfb205c3SBarry Smith 22241cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSBAIJ()`, `MatCreateSeqSBAIJ()` 2225c75a6043SHong Zhang @*/ 2226d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat) 2227d71ae5a4SJacob Faibussowitsch { 2228c75a6043SHong Zhang PetscInt ii; 2229c75a6043SHong Zhang Mat_SeqSBAIJ *sbaij; 2230c75a6043SHong Zhang 2231c75a6043SHong Zhang PetscFunctionBegin; 223208401ef6SPierre Jolivet PetscCheck(bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "block size %" PetscInt_FMT " > 1 is not supported yet", bs); 2233aed4548fSBarry Smith PetscCheck(m == 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0"); 2234c75a6043SHong Zhang 22359566063dSJacob Faibussowitsch PetscCall(MatCreate(comm, mat)); 22369566063dSJacob Faibussowitsch PetscCall(MatSetSizes(*mat, m, n, m, n)); 22379566063dSJacob Faibussowitsch PetscCall(MatSetType(*mat, MATSEQSBAIJ)); 22389566063dSJacob Faibussowitsch PetscCall(MatSeqSBAIJSetPreallocation(*mat, bs, MAT_SKIP_ALLOCATION, NULL)); 2239c75a6043SHong Zhang sbaij = (Mat_SeqSBAIJ *)(*mat)->data; 22409566063dSJacob Faibussowitsch PetscCall(PetscMalloc2(m, &sbaij->imax, m, &sbaij->ilen)); 2241c75a6043SHong Zhang 2242c75a6043SHong Zhang sbaij->i = i; 2243c75a6043SHong Zhang sbaij->j = j; 2244c75a6043SHong Zhang sbaij->a = a; 224526fbe8dcSKarl Rupp 2246c75a6043SHong Zhang sbaij->singlemalloc = PETSC_FALSE; 2247c75a6043SHong Zhang sbaij->nonew = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/ 2248e6b907acSBarry Smith sbaij->free_a = PETSC_FALSE; 2249e6b907acSBarry Smith sbaij->free_ij = PETSC_FALSE; 2250ddf7884eSMatthew Knepley sbaij->free_imax_ilen = PETSC_TRUE; 2251c75a6043SHong Zhang 2252c75a6043SHong Zhang for (ii = 0; ii < m; ii++) { 2253c75a6043SHong Zhang sbaij->ilen[ii] = sbaij->imax[ii] = i[ii + 1] - i[ii]; 22546bdcaf15SBarry Smith PetscCheck(i[ii + 1] >= i[ii], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]); 2255c75a6043SHong Zhang } 225676bd3646SJed Brown if (PetscDefined(USE_DEBUG)) { 2257c75a6043SHong Zhang for (ii = 0; ii < sbaij->i[m]; ii++) { 22586bdcaf15SBarry Smith PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 22596bdcaf15SBarry Smith PetscCheck(j[ii] < n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index too large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]); 2260c75a6043SHong Zhang } 226176bd3646SJed Brown } 2262c75a6043SHong Zhang 22639566063dSJacob Faibussowitsch PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY)); 22649566063dSJacob Faibussowitsch PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY)); 22653ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 2266c75a6043SHong Zhang } 2267d06b337dSHong Zhang 2268d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat) 2269d71ae5a4SJacob Faibussowitsch { 227059f5e6ceSHong Zhang PetscFunctionBegin; 22719566063dSJacob Faibussowitsch PetscCall(MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm, inmat, n, scall, outmat)); 22723ba16761SJacob Faibussowitsch PetscFunctionReturn(PETSC_SUCCESS); 227359f5e6ceSHong Zhang } 2274