xref: /petsc/src/mat/impls/sbaij/seq/sbaij.c (revision 26cec32642a02ddeaa9481e1a5bd50b8500ffeea)
149b5e25fSSatish Balay 
249b5e25fSSatish Balay /*
3a1373b80SHong Zhang     Defines the basic matrix operations for the SBAIJ (compressed row)
449b5e25fSSatish Balay   matrix storage format.
549b5e25fSSatish Balay */
6c6db04a5SJed Brown #include <../src/mat/impls/baij/seq/baij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/sbaij.h>
8c6db04a5SJed Brown #include <petscblaslapack.h>
949b5e25fSSatish Balay 
10c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h>
1170dcbbb9SBarry Smith #define USESHORT
12c6db04a5SJed Brown #include <../src/mat/impls/sbaij/seq/relax.h>
1370dcbbb9SBarry Smith 
14*26cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
15*26cec326SBarry Smith #define TYPE SBAIJ
16*26cec326SBarry Smith #define TYPE_SBAIJ
17*26cec326SBarry Smith #define TYPE_BS
18*26cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
19*26cec326SBarry Smith #undef TYPE_BS
20*26cec326SBarry Smith #define TYPE_BS _BS
21*26cec326SBarry Smith #define TYPE_BS_ON
22*26cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
23*26cec326SBarry Smith #undef TYPE_BS
24*26cec326SBarry Smith #undef TYPE_SBAIJ
25*26cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
26*26cec326SBarry Smith #undef TYPE
27*26cec326SBarry Smith #undef TYPE_BS_ON
28*26cec326SBarry Smith 
296214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
30cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
316214f412SHong Zhang #endif
32d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
33d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_SBAIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
34d24d4204SJose E. Roman #endif
3528d58a37SPierre Jolivet PETSC_INTERN PetscErrorCode MatConvert_MPISBAIJ_Basic(Mat, MatType, MatReuse, Mat *);
36b5b17502SBarry Smith 
3749b5e25fSSatish Balay /*
3849b5e25fSSatish Balay      Checks for missing diagonals
3949b5e25fSSatish Balay */
40d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqSBAIJ(Mat A, PetscBool *missing, PetscInt *dd)
41d71ae5a4SJacob Faibussowitsch {
42045c9aa0SHong Zhang   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
437734d3b5SMatthew G. Knepley   PetscInt     *diag, *ii = a->i, i;
4449b5e25fSSatish Balay 
4549b5e25fSSatish Balay   PetscFunctionBegin;
469566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqSBAIJ(A));
472af78befSBarry Smith   *missing = PETSC_FALSE;
487734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
49358d2f5dSShri Abhyankar     *missing = PETSC_TRUE;
50358d2f5dSShri Abhyankar     if (dd) *dd = 0;
519566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
52358d2f5dSShri Abhyankar   } else {
53358d2f5dSShri Abhyankar     diag = a->diag;
5449b5e25fSSatish Balay     for (i = 0; i < a->mbs; i++) {
557734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
562af78befSBarry Smith         *missing = PETSC_TRUE;
572af78befSBarry Smith         if (dd) *dd = i;
582af78befSBarry Smith         break;
592af78befSBarry Smith       }
6049b5e25fSSatish Balay     }
61358d2f5dSShri Abhyankar   }
623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6349b5e25fSSatish Balay }
6449b5e25fSSatish Balay 
65d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqSBAIJ(Mat A)
66d71ae5a4SJacob Faibussowitsch {
67045c9aa0SHong Zhang   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
6848dd3d27SHong Zhang   PetscInt      i, j;
6949b5e25fSSatish Balay 
7049b5e25fSSatish Balay   PetscFunctionBegin;
7109f38230SBarry Smith   if (!a->diag) {
729566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(a->mbs, &a->diag));
73c760cd28SBarry Smith     a->free_diag = PETSC_TRUE;
7409f38230SBarry Smith   }
7548dd3d27SHong Zhang   for (i = 0; i < a->mbs; i++) {
7648dd3d27SHong Zhang     a->diag[i] = a->i[i + 1];
7748dd3d27SHong Zhang     for (j = a->i[i]; j < a->i[i + 1]; j++) {
7848dd3d27SHong Zhang       if (a->j[j] == i) {
7948dd3d27SHong Zhang         a->diag[i] = j;
8048dd3d27SHong Zhang         break;
8148dd3d27SHong Zhang       }
8248dd3d27SHong Zhang     }
8348dd3d27SHong Zhang   }
843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
8549b5e25fSSatish Balay }
8649b5e25fSSatish Balay 
87d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatGetRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *inia[], const PetscInt *inja[], PetscBool *done)
88d71ae5a4SJacob Faibussowitsch {
89a6ece127SHong Zhang   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
902462f5fdSStefano Zampini   PetscInt      i, j, n = a->mbs, nz = a->i[n], *tia, *tja, bs = A->rmap->bs, k, l, cnt;
912462f5fdSStefano Zampini   PetscInt    **ia = (PetscInt **)inia, **ja = (PetscInt **)inja;
9249b5e25fSSatish Balay 
9349b5e25fSSatish Balay   PetscFunctionBegin;
94d3e5a4abSHong Zhang   *nn = n;
953ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
962462f5fdSStefano Zampini   if (symmetric) {
979566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(n, a->i, a->j, PETSC_FALSE, 0, 0, &tia, &tja));
982462f5fdSStefano Zampini     nz = tia[n];
992462f5fdSStefano Zampini   } else {
1009371c9d4SSatish Balay     tia = a->i;
1019371c9d4SSatish Balay     tja = a->j;
1022462f5fdSStefano Zampini   }
1032462f5fdSStefano Zampini 
1042462f5fdSStefano Zampini   if (!blockcompressed && bs > 1) {
1052462f5fdSStefano Zampini     (*nn) *= bs;
1068f7157efSSatish Balay     /* malloc & create the natural set of indices */
1079566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1((n + 1) * bs, ia));
1082462f5fdSStefano Zampini     if (n) {
1092462f5fdSStefano Zampini       (*ia)[0] = oshift;
110ad540459SPierre Jolivet       for (j = 1; j < bs; j++) (*ia)[j] = (tia[1] - tia[0]) * bs + (*ia)[j - 1];
1112462f5fdSStefano Zampini     }
1122462f5fdSStefano Zampini 
1132462f5fdSStefano Zampini     for (i = 1; i < n; i++) {
1142462f5fdSStefano Zampini       (*ia)[i * bs] = (tia[i] - tia[i - 1]) * bs + (*ia)[i * bs - 1];
115ad540459SPierre Jolivet       for (j = 1; j < bs; j++) (*ia)[i * bs + j] = (tia[i + 1] - tia[i]) * bs + (*ia)[i * bs + j - 1];
1162462f5fdSStefano Zampini     }
117ad540459SPierre Jolivet     if (n) (*ia)[n * bs] = (tia[n] - tia[n - 1]) * bs + (*ia)[n * bs - 1];
1182462f5fdSStefano Zampini 
1192462f5fdSStefano Zampini     if (inja) {
1209566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz * bs * bs, ja));
1212462f5fdSStefano Zampini       cnt = 0;
1222462f5fdSStefano Zampini       for (i = 0; i < n; i++) {
1238f7157efSSatish Balay         for (j = 0; j < bs; j++) {
1242462f5fdSStefano Zampini           for (k = tia[i]; k < tia[i + 1]; k++) {
125ad540459SPierre Jolivet             for (l = 0; l < bs; l++) (*ja)[cnt++] = bs * tja[k] + l;
1268f7157efSSatish Balay           }
1278f7157efSSatish Balay         }
1288f7157efSSatish Balay       }
1298f7157efSSatish Balay     }
1302462f5fdSStefano Zampini 
1312462f5fdSStefano Zampini     if (symmetric) { /* deallocate memory allocated in MatToSymmetricIJ_SeqAIJ() */
1329566063dSJacob Faibussowitsch       PetscCall(PetscFree(tia));
1339566063dSJacob Faibussowitsch       PetscCall(PetscFree(tja));
1342462f5fdSStefano Zampini     }
1352462f5fdSStefano Zampini   } else if (oshift == 1) {
1362462f5fdSStefano Zampini     if (symmetric) {
1372462f5fdSStefano Zampini       nz = tia[A->rmap->n / bs];
1382462f5fdSStefano Zampini       /*  add 1 to i and j indices */
1392462f5fdSStefano Zampini       for (i = 0; i < A->rmap->n / bs + 1; i++) tia[i] = tia[i] + 1;
1402462f5fdSStefano Zampini       *ia = tia;
1412462f5fdSStefano Zampini       if (ja) {
1422462f5fdSStefano Zampini         for (i = 0; i < nz; i++) tja[i] = tja[i] + 1;
1432462f5fdSStefano Zampini         *ja = tja;
1442462f5fdSStefano Zampini       }
1452462f5fdSStefano Zampini     } else {
1462462f5fdSStefano Zampini       nz = a->i[A->rmap->n / bs];
1472462f5fdSStefano Zampini       /* malloc space and  add 1 to i and j indices */
1489566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(A->rmap->n / bs + 1, ia));
1492462f5fdSStefano Zampini       for (i = 0; i < A->rmap->n / bs + 1; i++) (*ia)[i] = a->i[i] + 1;
1502462f5fdSStefano Zampini       if (ja) {
1519566063dSJacob Faibussowitsch         PetscCall(PetscMalloc1(nz, ja));
1522462f5fdSStefano Zampini         for (i = 0; i < nz; i++) (*ja)[i] = a->j[i] + 1;
1532462f5fdSStefano Zampini       }
1542462f5fdSStefano Zampini     }
1552462f5fdSStefano Zampini   } else {
1562462f5fdSStefano Zampini     *ia = tia;
1572462f5fdSStefano Zampini     if (ja) *ja = tja;
158a6ece127SHong Zhang   }
1593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
16049b5e25fSSatish Balay }
16149b5e25fSSatish Balay 
162d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatRestoreRowIJ_SeqSBAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool blockcompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
163d71ae5a4SJacob Faibussowitsch {
16449b5e25fSSatish Balay   PetscFunctionBegin;
1653ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
1662462f5fdSStefano Zampini   if ((!blockcompressed && A->rmap->bs > 1) || (symmetric || oshift == 1)) {
1679566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
1689566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
169a6ece127SHong Zhang   }
1703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
17149b5e25fSSatish Balay }
17249b5e25fSSatish Balay 
173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqSBAIJ(Mat A)
174d71ae5a4SJacob Faibussowitsch {
17549b5e25fSSatish Balay   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
17649b5e25fSSatish Balay 
17749b5e25fSSatish Balay   PetscFunctionBegin;
178a9f03627SSatish Balay #if defined(PETSC_USE_LOG)
1793ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->N, a->nz));
180a9f03627SSatish Balay #endif
1819566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
1829566063dSJacob Faibussowitsch   if (a->free_diag) PetscCall(PetscFree(a->diag));
1839566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
1849566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
1859566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
1869566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->idiag));
1879566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->inode.size));
1889566063dSJacob Faibussowitsch   if (a->free_imax_ilen) PetscCall(PetscFree2(a->imax, a->ilen));
1899566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
1909566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->sor_work));
1919566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solves_work));
1929566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->mult_work));
1939566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
1949566063dSJacob Faibussowitsch   if (a->free_jshort) PetscCall(PetscFree(a->jshort));
1959566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->inew));
1969566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&a->parent));
1979566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
198901853e0SKris Buschelman 
1999566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
2002e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJGetArray_C", NULL));
2012e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJRestoreArray_C", NULL));
2029566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
2039566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
2049566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetColumnIndices_C", NULL));
2059566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqaij_C", NULL));
2069566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_seqbaij_C", NULL));
2079566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocation_C", NULL));
2089566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqSBAIJSetPreallocationCSR_C", NULL));
2096214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
2109566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_elemental_C", NULL));
2116214f412SHong Zhang #endif
212d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
2139566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqsbaij_scalapack_C", NULL));
214d24d4204SJose E. Roman #endif
2152e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
2163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
21749b5e25fSSatish Balay }
21849b5e25fSSatish Balay 
219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqSBAIJ(Mat A, MatOption op, PetscBool flg)
220d71ae5a4SJacob Faibussowitsch {
221045c9aa0SHong Zhang   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
222eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX)
223eb1ec7c1SStefano Zampini   PetscInt bs;
224eb1ec7c1SStefano Zampini #endif
22549b5e25fSSatish Balay 
22649b5e25fSSatish Balay   PetscFunctionBegin;
227eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX)
2289566063dSJacob Faibussowitsch   PetscCall(MatGetBlockSize(A, &bs));
229eb1ec7c1SStefano Zampini #endif
2304d9d31abSKris Buschelman   switch (op) {
231d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
232d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
233d71ae5a4SJacob Faibussowitsch     break;
234d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
235d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
236d71ae5a4SJacob Faibussowitsch     break;
237d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
238d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
239d71ae5a4SJacob Faibussowitsch     break;
240d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
241d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
242d71ae5a4SJacob Faibussowitsch     break;
243d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
244d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
245d71ae5a4SJacob Faibussowitsch     break;
246d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
247d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
248d71ae5a4SJacob Faibussowitsch     break;
2498c78258cSHong Zhang   case MAT_FORCE_DIAGONAL_ENTRIES:
2504d9d31abSKris Buschelman   case MAT_IGNORE_OFF_PROC_ENTRIES:
2514d9d31abSKris Buschelman   case MAT_USE_HASH_TABLE:
252d71ae5a4SJacob Faibussowitsch   case MAT_SORTED_FULL:
253d71ae5a4SJacob Faibussowitsch     PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op]));
254d71ae5a4SJacob Faibussowitsch     break;
2559a4540c5SBarry Smith   case MAT_HERMITIAN:
256eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX)
257eb1ec7c1SStefano Zampini     if (flg) { /* disable transpose ops */
25808401ef6SPierre Jolivet       PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for Hermitian with block size greater than 1");
259eb1ec7c1SStefano Zampini       A->ops->multtranspose    = NULL;
260eb1ec7c1SStefano Zampini       A->ops->multtransposeadd = NULL;
261b94d7dedSBarry Smith       A->symmetric             = PETSC_BOOL3_FALSE;
262eb1ec7c1SStefano Zampini     }
2630f2140c7SStefano Zampini #endif
264eeffb40dSHong Zhang     break;
26577e54ba9SKris Buschelman   case MAT_SYMMETRIC:
266eb1ec7c1SStefano Zampini   case MAT_SPD:
267eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX)
268eb1ec7c1SStefano Zampini     if (flg) { /* An hermitian and symmetric matrix has zero imaginary part (restore back transpose ops) */
269eb1ec7c1SStefano Zampini       A->ops->multtranspose    = A->ops->mult;
270eb1ec7c1SStefano Zampini       A->ops->multtransposeadd = A->ops->multadd;
271eb1ec7c1SStefano Zampini     }
272eb1ec7c1SStefano Zampini #endif
273eb1ec7c1SStefano Zampini     break;
274eb1ec7c1SStefano Zampini     /* These options are handled directly by MatSetOption() */
27577e54ba9SKris Buschelman   case MAT_STRUCTURALLY_SYMMETRIC:
2769a4540c5SBarry Smith   case MAT_SYMMETRY_ETERNAL:
277b94d7dedSBarry Smith   case MAT_STRUCTURAL_SYMMETRY_ETERNAL:
278672ba085SHong Zhang   case MAT_STRUCTURE_ONLY:
279b94d7dedSBarry Smith   case MAT_SPD_ETERNAL:
2804dcd73b1SHong Zhang     /* These options are handled directly by MatSetOption() */
281290bbb0aSBarry Smith     break;
282d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_LOWER_TRIANGULAR:
283d71ae5a4SJacob Faibussowitsch     a->ignore_ltriangular = flg;
284d71ae5a4SJacob Faibussowitsch     break;
285d71ae5a4SJacob Faibussowitsch   case MAT_ERROR_LOWER_TRIANGULAR:
286d71ae5a4SJacob Faibussowitsch     a->ignore_ltriangular = flg;
287d71ae5a4SJacob Faibussowitsch     break;
288d71ae5a4SJacob Faibussowitsch   case MAT_GETROW_UPPERTRIANGULAR:
289d71ae5a4SJacob Faibussowitsch     a->getrow_utriangular = flg;
290d71ae5a4SJacob Faibussowitsch     break;
291d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
292d71ae5a4SJacob Faibussowitsch     break;
293d71ae5a4SJacob Faibussowitsch   default:
294d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op);
29549b5e25fSSatish Balay   }
2963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29749b5e25fSSatish Balay }
29849b5e25fSSatish Balay 
299d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
300d71ae5a4SJacob Faibussowitsch {
30149b5e25fSSatish Balay   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
30249b5e25fSSatish Balay 
30349b5e25fSSatish Balay   PetscFunctionBegin;
30408401ef6SPierre Jolivet   PetscCheck(!A || a->getrow_utriangular, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatGetRow is not supported for SBAIJ matrix format. Getting the upper triangular part of row, run with -mat_getrow_uppertriangular, call MatSetOption(mat,MAT_GETROW_UPPERTRIANGULAR,PETSC_TRUE) or MatGetRowUpperTriangular()");
30552768537SHong Zhang 
306f5edf698SHong Zhang   /* Get the upper triangular part of the row */
3079566063dSJacob Faibussowitsch   PetscCall(MatGetRow_SeqBAIJ_private(A, row, nz, idx, v, a->i, a->j, a->a));
3083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
30949b5e25fSSatish Balay }
31049b5e25fSSatish Balay 
311d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqSBAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
312d71ae5a4SJacob Faibussowitsch {
31349b5e25fSSatish Balay   PetscFunctionBegin;
314cb4a9cd9SHong Zhang   if (nz) *nz = 0;
3159566063dSJacob Faibussowitsch   if (idx) PetscCall(PetscFree(*idx));
3169566063dSJacob Faibussowitsch   if (v) PetscCall(PetscFree(*v));
3173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
31849b5e25fSSatish Balay }
31949b5e25fSSatish Balay 
320d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowUpperTriangular_SeqSBAIJ(Mat A)
321d71ae5a4SJacob Faibussowitsch {
322f5edf698SHong Zhang   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
323f5edf698SHong Zhang 
324f5edf698SHong Zhang   PetscFunctionBegin;
325f5edf698SHong Zhang   a->getrow_utriangular = PETSC_TRUE;
3263ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
327f5edf698SHong Zhang }
328a323099bSStefano Zampini 
329d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowUpperTriangular_SeqSBAIJ(Mat A)
330d71ae5a4SJacob Faibussowitsch {
331f5edf698SHong Zhang   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
332f5edf698SHong Zhang 
333f5edf698SHong Zhang   PetscFunctionBegin;
334f5edf698SHong Zhang   a->getrow_utriangular = PETSC_FALSE;
3353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
336f5edf698SHong Zhang }
337f5edf698SHong Zhang 
338d71ae5a4SJacob Faibussowitsch PetscErrorCode MatTranspose_SeqSBAIJ(Mat A, MatReuse reuse, Mat *B)
339d71ae5a4SJacob Faibussowitsch {
34049b5e25fSSatish Balay   PetscFunctionBegin;
3417fb60732SBarry Smith   if (reuse == MAT_REUSE_MATRIX) PetscCall(MatTransposeCheckNonzeroState_Private(A, *B));
342cf37664fSBarry Smith   if (reuse == MAT_INITIAL_MATRIX) {
3439566063dSJacob Faibussowitsch     PetscCall(MatDuplicate(A, MAT_COPY_VALUES, B));
344cf37664fSBarry Smith   } else if (reuse == MAT_REUSE_MATRIX) {
3459566063dSJacob Faibussowitsch     PetscCall(MatCopy(A, *B, SAME_NONZERO_PATTERN));
346fc4dec0aSBarry Smith   }
3473ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34849b5e25fSSatish Balay }
34949b5e25fSSatish Balay 
350d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ_ASCII(Mat A, PetscViewer viewer)
351d71ae5a4SJacob Faibussowitsch {
35249b5e25fSSatish Balay   Mat_SeqSBAIJ     *a = (Mat_SeqSBAIJ *)A->data;
353d0f46423SBarry Smith   PetscInt          i, j, bs = A->rmap->bs, k, l, bs2 = a->bs2;
354f3ef73ceSBarry Smith   PetscViewerFormat format;
355121deb67SSatish Balay   PetscInt         *diag;
356b3a0534dSBarry Smith   const char       *matname;
35749b5e25fSSatish Balay 
35849b5e25fSSatish Balay   PetscFunctionBegin;
3599566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
360456192e2SBarry Smith   if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) {
3619566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "  block size is %" PetscInt_FMT "\n", bs));
362fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_MATLAB) {
363d2507d54SMatthew Knepley     Mat aij;
364ade3a672SBarry Smith 
365d5f3da31SBarry Smith     if (A->factortype && bs > 1) {
3669566063dSJacob Faibussowitsch       PetscCall(PetscPrintf(PETSC_COMM_SELF, "Warning: matrix is factored with bs>1. MatView() with PETSC_VIEWER_ASCII_MATLAB is not supported and ignored!\n"));
3673ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
36870d5e725SHong Zhang     }
3699566063dSJacob Faibussowitsch     PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &aij));
37023a3927dSBarry Smith     if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname));
37123a3927dSBarry Smith     if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)aij, matname));
37223a3927dSBarry Smith     PetscCall(MatView_SeqAIJ(aij, viewer));
3739566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&aij));
374fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
375b3a0534dSBarry Smith     Mat B;
376b3a0534dSBarry Smith 
377b3a0534dSBarry Smith     PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B));
378b3a0534dSBarry Smith     if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname));
379b3a0534dSBarry Smith     if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname));
380b3a0534dSBarry Smith     PetscCall(MatView_SeqAIJ(B, viewer));
381b3a0534dSBarry Smith     PetscCall(MatDestroy(&B));
382c1490034SHong Zhang   } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO) {
3833ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
38449b5e25fSSatish Balay   } else {
3859566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
3862c990fa1SHong Zhang     if (A->factortype) { /* for factored matrix */
38708401ef6SPierre Jolivet       PetscCheck(bs <= 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "matrix is factored with bs>1. Not implemented yet");
3882c990fa1SHong Zhang 
389121deb67SSatish Balay       diag = a->diag;
390121deb67SSatish Balay       for (i = 0; i < a->mbs; i++) { /* for row block i */
3919566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
3922c990fa1SHong Zhang         /* diagonal entry */
3932c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX)
3942c990fa1SHong Zhang         if (PetscImaginaryPart(a->a[diag[i]]) > 0.0) {
3959566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), (double)PetscImaginaryPart(1.0 / a->a[diag[i]])));
3962c990fa1SHong Zhang         } else if (PetscImaginaryPart(a->a[diag[i]]) < 0.0) {
3979566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]]), -(double)PetscImaginaryPart(1.0 / a->a[diag[i]])));
3982c990fa1SHong Zhang         } else {
3999566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)PetscRealPart(1.0 / a->a[diag[i]])));
4002c990fa1SHong Zhang         }
4012c990fa1SHong Zhang #else
4029566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[diag[i]], (double)(1.0 / a->a[diag[i]])));
4032c990fa1SHong Zhang #endif
4042c990fa1SHong Zhang         /* off-diagonal entries */
4052c990fa1SHong Zhang         for (k = a->i[i]; k < a->i[i + 1] - 1; k++) {
4062c990fa1SHong Zhang #if defined(PETSC_USE_COMPLEX)
407ca0704adSBarry Smith           if (PetscImaginaryPart(a->a[k]) > 0.0) {
4089566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), (double)PetscImaginaryPart(a->a[k])));
409ca0704adSBarry Smith           } else if (PetscImaginaryPart(a->a[k]) < 0.0) {
4109566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k], (double)PetscRealPart(a->a[k]), -(double)PetscImaginaryPart(a->a[k])));
4112c990fa1SHong Zhang           } else {
4129566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k], (double)PetscRealPart(a->a[k])));
4132c990fa1SHong Zhang           }
4142c990fa1SHong Zhang #else
4159566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[k], (double)a->a[k]));
4162c990fa1SHong Zhang #endif
4172c990fa1SHong Zhang         }
4189566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
4192c990fa1SHong Zhang       }
4202c990fa1SHong Zhang 
4212c990fa1SHong Zhang     } else {                         /* for non-factored matrix */
4220c74a584SJed Brown       for (i = 0; i < a->mbs; i++) { /* for row block i */
4230c74a584SJed Brown         for (j = 0; j < bs; j++) {   /* for row bs*i + j */
4249566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i * bs + j));
4250c74a584SJed Brown           for (k = a->i[i]; k < a->i[i + 1]; k++) { /* for column block */
4260c74a584SJed Brown             for (l = 0; l < bs; l++) {              /* for column */
42749b5e25fSSatish Balay #if defined(PETSC_USE_COMPLEX)
42849b5e25fSSatish Balay               if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) > 0.0) {
4299371c9d4SSatish Balay                 PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), (double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j])));
43049b5e25fSSatish Balay               } else if (PetscImaginaryPart(a->a[bs2 * k + l * bs + j]) < 0.0) {
4319371c9d4SSatish Balay                 PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j]), -(double)PetscImaginaryPart(a->a[bs2 * k + l * bs + j])));
43249b5e25fSSatish Balay               } else {
4339566063dSJacob Faibussowitsch                 PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)PetscRealPart(a->a[bs2 * k + l * bs + j])));
43449b5e25fSSatish Balay               }
43549b5e25fSSatish Balay #else
4369566063dSJacob Faibussowitsch               PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", bs * a->j[k] + l, (double)a->a[bs2 * k + l * bs + j]));
43749b5e25fSSatish Balay #endif
43849b5e25fSSatish Balay             }
43949b5e25fSSatish Balay           }
4409566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
44149b5e25fSSatish Balay         }
44249b5e25fSSatish Balay       }
4432c990fa1SHong Zhang     }
4449566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
44549b5e25fSSatish Balay   }
4469566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
4473ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44849b5e25fSSatish Balay }
44949b5e25fSSatish Balay 
4509804daf3SBarry Smith #include <petscdraw.h>
451d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
452d71ae5a4SJacob Faibussowitsch {
45349b5e25fSSatish Balay   Mat           A = (Mat)Aa;
45449b5e25fSSatish Balay   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
455d0f46423SBarry Smith   PetscInt      row, i, j, k, l, mbs = a->mbs, color, bs = A->rmap->bs, bs2 = a->bs2;
45649b5e25fSSatish Balay   PetscReal     xl, yl, xr, yr, x_l, x_r, y_l, y_r;
45749b5e25fSSatish Balay   MatScalar    *aa;
458b0a32e0cSBarry Smith   PetscViewer   viewer;
45949b5e25fSSatish Balay 
46049b5e25fSSatish Balay   PetscFunctionBegin;
4619566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
4629566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
46349b5e25fSSatish Balay 
46449b5e25fSSatish Balay   /* loop over matrix elements drawing boxes */
465383922c3SLisandro Dalcin 
466d0609cedSBarry Smith   PetscDrawCollectiveBegin(draw);
4679566063dSJacob Faibussowitsch   PetscCall(PetscDrawString(draw, .3 * (xl + xr), .3 * (yl + yr), PETSC_DRAW_BLACK, "symmetric"));
468383922c3SLisandro Dalcin   /* Blue for negative, Cyan for zero and  Red for positive */
469b0a32e0cSBarry Smith   color = PETSC_DRAW_BLUE;
47049b5e25fSSatish Balay   for (i = 0, row = 0; i < mbs; i++, row += bs) {
47149b5e25fSSatish Balay     for (j = a->i[i]; j < a->i[i + 1]; j++) {
4729371c9d4SSatish Balay       y_l = A->rmap->N - row - 1.0;
4739371c9d4SSatish Balay       y_r = y_l + 1.0;
4749371c9d4SSatish Balay       x_l = a->j[j] * bs;
4759371c9d4SSatish Balay       x_r = x_l + 1.0;
47649b5e25fSSatish Balay       aa  = a->a + j * bs2;
47749b5e25fSSatish Balay       for (k = 0; k < bs; k++) {
47849b5e25fSSatish Balay         for (l = 0; l < bs; l++) {
47949b5e25fSSatish Balay           if (PetscRealPart(*aa++) >= 0.) continue;
4809566063dSJacob Faibussowitsch           PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color));
48149b5e25fSSatish Balay         }
48249b5e25fSSatish Balay       }
48349b5e25fSSatish Balay     }
48449b5e25fSSatish Balay   }
485b0a32e0cSBarry Smith   color = PETSC_DRAW_CYAN;
48649b5e25fSSatish Balay   for (i = 0, row = 0; i < mbs; i++, row += bs) {
48749b5e25fSSatish Balay     for (j = a->i[i]; j < a->i[i + 1]; j++) {
4889371c9d4SSatish Balay       y_l = A->rmap->N - row - 1.0;
4899371c9d4SSatish Balay       y_r = y_l + 1.0;
4909371c9d4SSatish Balay       x_l = a->j[j] * bs;
4919371c9d4SSatish Balay       x_r = x_l + 1.0;
49249b5e25fSSatish Balay       aa  = a->a + j * bs2;
49349b5e25fSSatish Balay       for (k = 0; k < bs; k++) {
49449b5e25fSSatish Balay         for (l = 0; l < bs; l++) {
49549b5e25fSSatish Balay           if (PetscRealPart(*aa++) != 0.) continue;
4969566063dSJacob Faibussowitsch           PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color));
49749b5e25fSSatish Balay         }
49849b5e25fSSatish Balay       }
49949b5e25fSSatish Balay     }
50049b5e25fSSatish Balay   }
501b0a32e0cSBarry Smith   color = PETSC_DRAW_RED;
50249b5e25fSSatish Balay   for (i = 0, row = 0; i < mbs; i++, row += bs) {
50349b5e25fSSatish Balay     for (j = a->i[i]; j < a->i[i + 1]; j++) {
5049371c9d4SSatish Balay       y_l = A->rmap->N - row - 1.0;
5059371c9d4SSatish Balay       y_r = y_l + 1.0;
5069371c9d4SSatish Balay       x_l = a->j[j] * bs;
5079371c9d4SSatish Balay       x_r = x_l + 1.0;
50849b5e25fSSatish Balay       aa  = a->a + j * bs2;
50949b5e25fSSatish Balay       for (k = 0; k < bs; k++) {
51049b5e25fSSatish Balay         for (l = 0; l < bs; l++) {
51149b5e25fSSatish Balay           if (PetscRealPart(*aa++) <= 0.) continue;
5129566063dSJacob Faibussowitsch           PetscCall(PetscDrawRectangle(draw, x_l + k, y_l - l, x_r + k, y_r - l, color, color, color, color));
51349b5e25fSSatish Balay         }
51449b5e25fSSatish Balay       }
51549b5e25fSSatish Balay     }
51649b5e25fSSatish Balay   }
517d0609cedSBarry Smith   PetscDrawCollectiveEnd(draw);
5183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51949b5e25fSSatish Balay }
52049b5e25fSSatish Balay 
521d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqSBAIJ_Draw(Mat A, PetscViewer viewer)
522d71ae5a4SJacob Faibussowitsch {
52349b5e25fSSatish Balay   PetscReal xl, yl, xr, yr, w, h;
524b0a32e0cSBarry Smith   PetscDraw draw;
525ace3abfcSBarry Smith   PetscBool isnull;
52649b5e25fSSatish Balay 
52749b5e25fSSatish Balay   PetscFunctionBegin;
5289566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
5299566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
5303ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
53149b5e25fSSatish Balay 
5329371c9d4SSatish Balay   xr = A->rmap->N;
5339371c9d4SSatish Balay   yr = A->rmap->N;
5349371c9d4SSatish Balay   h  = yr / 10.0;
5359371c9d4SSatish Balay   w  = xr / 10.0;
5369371c9d4SSatish Balay   xr += w;
5379371c9d4SSatish Balay   yr += h;
5389371c9d4SSatish Balay   xl = -w;
5399371c9d4SSatish Balay   yl = -h;
5409566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
5419566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
5429566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqSBAIJ_Draw_Zoom, A));
5439566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
5449566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
5453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
54649b5e25fSSatish Balay }
54749b5e25fSSatish Balay 
548618cc2edSLisandro Dalcin /* Used for both MPIBAIJ and MPISBAIJ matrices */
549618cc2edSLisandro Dalcin #define MatView_SeqSBAIJ_Binary MatView_SeqBAIJ_Binary
550618cc2edSLisandro Dalcin 
551d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqSBAIJ(Mat A, PetscViewer viewer)
552d71ae5a4SJacob Faibussowitsch {
553618cc2edSLisandro Dalcin   PetscBool iascii, isbinary, isdraw;
55449b5e25fSSatish Balay 
55549b5e25fSSatish Balay   PetscFunctionBegin;
5569566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii));
5579566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
5589566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
55932077d6dSBarry Smith   if (iascii) {
5609566063dSJacob Faibussowitsch     PetscCall(MatView_SeqSBAIJ_ASCII(A, viewer));
561618cc2edSLisandro Dalcin   } else if (isbinary) {
5629566063dSJacob Faibussowitsch     PetscCall(MatView_SeqSBAIJ_Binary(A, viewer));
56349b5e25fSSatish Balay   } else if (isdraw) {
5649566063dSJacob Faibussowitsch     PetscCall(MatView_SeqSBAIJ_Draw(A, viewer));
56549b5e25fSSatish Balay   } else {
566a5e6ed63SBarry Smith     Mat         B;
567ade3a672SBarry Smith     const char *matname;
5689566063dSJacob Faibussowitsch     PetscCall(MatConvert(A, MATSEQAIJ, MAT_INITIAL_MATRIX, &B));
56923a3927dSBarry Smith     if (((PetscObject)A)->name) PetscCall(PetscObjectGetName((PetscObject)A, &matname));
57023a3927dSBarry Smith     if (((PetscObject)A)->name) PetscCall(PetscObjectSetName((PetscObject)B, matname));
5719566063dSJacob Faibussowitsch     PetscCall(MatView(B, viewer));
5729566063dSJacob Faibussowitsch     PetscCall(MatDestroy(&B));
57349b5e25fSSatish Balay   }
5743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
57549b5e25fSSatish Balay }
57649b5e25fSSatish Balay 
577d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
578d71ae5a4SJacob Faibussowitsch {
579045c9aa0SHong Zhang   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
58013f74950SBarry Smith   PetscInt     *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
58113f74950SBarry Smith   PetscInt     *ai = a->i, *ailen = a->ilen;
582d0f46423SBarry Smith   PetscInt      brow, bcol, ridx, cidx, bs = A->rmap->bs, bs2 = a->bs2;
58397e567efSBarry Smith   MatScalar    *ap, *aa = a->a;
58449b5e25fSSatish Balay 
58549b5e25fSSatish Balay   PetscFunctionBegin;
58649b5e25fSSatish Balay   for (k = 0; k < m; k++) { /* loop over rows */
5879371c9d4SSatish Balay     row  = im[k];
5889371c9d4SSatish Balay     brow = row / bs;
5899371c9d4SSatish Balay     if (row < 0) {
5909371c9d4SSatish Balay       v += n;
5919371c9d4SSatish Balay       continue;
5929371c9d4SSatish Balay     } /* negative row */
59354c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1);
5949371c9d4SSatish Balay     rp   = aj + ai[brow];
5959371c9d4SSatish Balay     ap   = aa + bs2 * ai[brow];
59649b5e25fSSatish Balay     nrow = ailen[brow];
59749b5e25fSSatish Balay     for (l = 0; l < n; l++) { /* loop over columns */
5989371c9d4SSatish Balay       if (in[l] < 0) {
5999371c9d4SSatish Balay         v++;
6009371c9d4SSatish Balay         continue;
6019371c9d4SSatish Balay       } /* negative column */
60254c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
60349b5e25fSSatish Balay       col  = in[l];
60449b5e25fSSatish Balay       bcol = col / bs;
60549b5e25fSSatish Balay       cidx = col % bs;
60649b5e25fSSatish Balay       ridx = row % bs;
60749b5e25fSSatish Balay       high = nrow;
60849b5e25fSSatish Balay       low  = 0; /* assume unsorted */
60949b5e25fSSatish Balay       while (high - low > 5) {
61049b5e25fSSatish Balay         t = (low + high) / 2;
61149b5e25fSSatish Balay         if (rp[t] > bcol) high = t;
61249b5e25fSSatish Balay         else low = t;
61349b5e25fSSatish Balay       }
61449b5e25fSSatish Balay       for (i = low; i < high; i++) {
61549b5e25fSSatish Balay         if (rp[i] > bcol) break;
61649b5e25fSSatish Balay         if (rp[i] == bcol) {
61749b5e25fSSatish Balay           *v++ = ap[bs2 * i + bs * cidx + ridx];
61849b5e25fSSatish Balay           goto finished;
61949b5e25fSSatish Balay         }
62049b5e25fSSatish Balay       }
62197e567efSBarry Smith       *v++ = 0.0;
62249b5e25fSSatish Balay     finished:;
62349b5e25fSSatish Balay     }
62449b5e25fSSatish Balay   }
6253ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
62649b5e25fSSatish Balay }
62749b5e25fSSatish Balay 
628d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqSBAIJ(Mat A, IS rowp, IS colp, Mat *B)
629d71ae5a4SJacob Faibussowitsch {
630dc29a518SPierre Jolivet   Mat C;
631dc29a518SPierre Jolivet 
632dc29a518SPierre Jolivet   PetscFunctionBegin;
6339566063dSJacob Faibussowitsch   PetscCall(MatConvert(A, MATSEQBAIJ, MAT_INITIAL_MATRIX, &C));
6349566063dSJacob Faibussowitsch   PetscCall(MatPermute(C, rowp, colp, B));
6359566063dSJacob Faibussowitsch   PetscCall(MatDestroy(&C));
63648a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatConvert(*B, MATSEQSBAIJ, MAT_INPLACE_MATRIX, B));
6373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
638dc29a518SPierre Jolivet }
63949b5e25fSSatish Balay 
640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesBlocked_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
641d71ae5a4SJacob Faibussowitsch {
6420880e062SHong Zhang   Mat_SeqSBAIJ      *a = (Mat_SeqSBAIJ *)A->data;
643e2ee6c50SBarry Smith   PetscInt          *rp, k, low, high, t, ii, jj, row, nrow, i, col, l, rmax, N, lastcol = -1;
64413f74950SBarry Smith   PetscInt          *imax = a->imax, *ai = a->i, *ailen = a->ilen;
645d0f46423SBarry Smith   PetscInt          *aj = a->j, nonew = a->nonew, bs2 = a->bs2, bs = A->rmap->bs, stepval;
646ace3abfcSBarry Smith   PetscBool          roworiented = a->roworiented;
647dd6ea824SBarry Smith   const PetscScalar *value       = v;
648f15d580aSBarry Smith   MatScalar         *ap, *aa = a->a, *bap;
6490880e062SHong Zhang 
65049b5e25fSSatish Balay   PetscFunctionBegin;
65126fbe8dcSKarl Rupp   if (roworiented) stepval = (n - 1) * bs;
65226fbe8dcSKarl Rupp   else stepval = (m - 1) * bs;
65326fbe8dcSKarl Rupp 
6540880e062SHong Zhang   for (k = 0; k < m; k++) { /* loop over added rows */
6550880e062SHong Zhang     row = im[k];
6560880e062SHong Zhang     if (row < 0) continue;
6576bdcaf15SBarry Smith     PetscCheck(row < a->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index row too large %" PetscInt_FMT " max %" PetscInt_FMT, row, a->mbs - 1);
6580880e062SHong Zhang     rp   = aj + ai[row];
6590880e062SHong Zhang     ap   = aa + bs2 * ai[row];
6600880e062SHong Zhang     rmax = imax[row];
6610880e062SHong Zhang     nrow = ailen[row];
6620880e062SHong Zhang     low  = 0;
663818f2c47SBarry Smith     high = nrow;
6640880e062SHong Zhang     for (l = 0; l < n; l++) { /* loop over added columns */
6650880e062SHong Zhang       if (in[l] < 0) continue;
6660880e062SHong Zhang       col = in[l];
6676bdcaf15SBarry Smith       PetscCheck(col < a->nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Block index column too large %" PetscInt_FMT " max %" PetscInt_FMT, col, a->nbs - 1);
668b98bf0e1SJed Brown       if (col < row) {
66926fbe8dcSKarl Rupp         if (a->ignore_ltriangular) continue; /* ignore lower triangular block */
67026fbe8dcSKarl Rupp         else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)");
671b98bf0e1SJed Brown       }
67226fbe8dcSKarl Rupp       if (roworiented) value = v + k * (stepval + bs) * bs + l * bs;
67326fbe8dcSKarl Rupp       else value = v + l * (stepval + bs) * bs + k * bs;
67426fbe8dcSKarl Rupp 
67526fbe8dcSKarl Rupp       if (col <= lastcol) low = 0;
67626fbe8dcSKarl Rupp       else high = nrow;
67726fbe8dcSKarl Rupp 
678e2ee6c50SBarry Smith       lastcol = col;
6790880e062SHong Zhang       while (high - low > 7) {
6800880e062SHong Zhang         t = (low + high) / 2;
6810880e062SHong Zhang         if (rp[t] > col) high = t;
6820880e062SHong Zhang         else low = t;
6830880e062SHong Zhang       }
6840880e062SHong Zhang       for (i = low; i < high; i++) {
6850880e062SHong Zhang         if (rp[i] > col) break;
6860880e062SHong Zhang         if (rp[i] == col) {
6870880e062SHong Zhang           bap = ap + bs2 * i;
6880880e062SHong Zhang           if (roworiented) {
6890880e062SHong Zhang             if (is == ADD_VALUES) {
6900880e062SHong Zhang               for (ii = 0; ii < bs; ii++, value += stepval) {
691ad540459SPierre Jolivet                 for (jj = ii; jj < bs2; jj += bs) bap[jj] += *value++;
6920880e062SHong Zhang               }
6930880e062SHong Zhang             } else {
6940880e062SHong Zhang               for (ii = 0; ii < bs; ii++, value += stepval) {
695ad540459SPierre Jolivet                 for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++;
6960880e062SHong Zhang               }
6970880e062SHong Zhang             }
6980880e062SHong Zhang           } else {
6990880e062SHong Zhang             if (is == ADD_VALUES) {
7000880e062SHong Zhang               for (ii = 0; ii < bs; ii++, value += stepval) {
701ad540459SPierre Jolivet                 for (jj = 0; jj < bs; jj++) *bap++ += *value++;
7020880e062SHong Zhang               }
7030880e062SHong Zhang             } else {
7040880e062SHong Zhang               for (ii = 0; ii < bs; ii++, value += stepval) {
705ad540459SPierre Jolivet                 for (jj = 0; jj < bs; jj++) *bap++ = *value++;
7060880e062SHong Zhang               }
7070880e062SHong Zhang             }
7080880e062SHong Zhang           }
7090880e062SHong Zhang           goto noinsert2;
7100880e062SHong Zhang         }
7110880e062SHong Zhang       }
7120880e062SHong Zhang       if (nonew == 1) goto noinsert2;
71308401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new block index nonzero block (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col);
714fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
7159371c9d4SSatish Balay       N = nrow++ - 1;
7169371c9d4SSatish Balay       high++;
7170880e062SHong Zhang       /* shift up all the later entries in this row */
7189566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
7199566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1)));
7209566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(ap + bs2 * i, bs2));
7210880e062SHong Zhang       rp[i] = col;
7220880e062SHong Zhang       bap   = ap + bs2 * i;
7230880e062SHong Zhang       if (roworiented) {
7240880e062SHong Zhang         for (ii = 0; ii < bs; ii++, value += stepval) {
725ad540459SPierre Jolivet           for (jj = ii; jj < bs2; jj += bs) bap[jj] = *value++;
7260880e062SHong Zhang         }
7270880e062SHong Zhang       } else {
7280880e062SHong Zhang         for (ii = 0; ii < bs; ii++, value += stepval) {
729ad540459SPierre Jolivet           for (jj = 0; jj < bs; jj++) *bap++ = *value++;
7300880e062SHong Zhang         }
7310880e062SHong Zhang       }
7320880e062SHong Zhang     noinsert2:;
7330880e062SHong Zhang       low = i;
7340880e062SHong Zhang     }
7350880e062SHong Zhang     ailen[row] = nrow;
7360880e062SHong Zhang   }
7373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
73849b5e25fSSatish Balay }
73949b5e25fSSatish Balay 
74064831d72SBarry Smith /*
74164831d72SBarry Smith     This is not yet used
74264831d72SBarry Smith */
743d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ_SeqAIJ_Inode(Mat A)
744d71ae5a4SJacob Faibussowitsch {
7450def2e27SBarry Smith   Mat_SeqSBAIJ   *a  = (Mat_SeqSBAIJ *)A->data;
7460def2e27SBarry Smith   const PetscInt *ai = a->i, *aj = a->j, *cols;
7470def2e27SBarry Smith   PetscInt        i = 0, j, blk_size, m = A->rmap->n, node_count = 0, nzx, nzy, *ns, row, nz, cnt, cnt2, *counts;
748ace3abfcSBarry Smith   PetscBool       flag;
7490def2e27SBarry Smith 
7500def2e27SBarry Smith   PetscFunctionBegin;
7519566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &ns));
7520def2e27SBarry Smith   while (i < m) {
7530def2e27SBarry Smith     nzx = ai[i + 1] - ai[i]; /* Number of nonzeros */
7540def2e27SBarry Smith     /* Limits the number of elements in a node to 'a->inode.limit' */
7550def2e27SBarry Smith     for (j = i + 1, blk_size = 1; j < m && blk_size < a->inode.limit; ++j, ++blk_size) {
7560def2e27SBarry Smith       nzy = ai[j + 1] - ai[j];
7570def2e27SBarry Smith       if (nzy != (nzx - j + i)) break;
7589566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(aj + ai[i] + j - i, aj + ai[j], nzy, &flag));
7590def2e27SBarry Smith       if (!flag) break;
7600def2e27SBarry Smith     }
7610def2e27SBarry Smith     ns[node_count++] = blk_size;
76226fbe8dcSKarl Rupp 
7630def2e27SBarry Smith     i = j;
7640def2e27SBarry Smith   }
7650def2e27SBarry Smith   if (!a->inode.size && m && node_count > .9 * m) {
7669566063dSJacob Faibussowitsch     PetscCall(PetscFree(ns));
7679566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes out of %" PetscInt_FMT " rows. Not using Inode routines\n", node_count, m));
7680def2e27SBarry Smith   } else {
7690def2e27SBarry Smith     a->inode.node_count = node_count;
77026fbe8dcSKarl Rupp 
7719566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(node_count, &a->inode.size));
7729566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->inode.size, ns, node_count));
7739566063dSJacob Faibussowitsch     PetscCall(PetscFree(ns));
7749566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Found %" PetscInt_FMT " nodes of %" PetscInt_FMT ". Limit used: %" PetscInt_FMT ". Using Inode routines\n", node_count, m, a->inode.limit));
7750def2e27SBarry Smith 
7760def2e27SBarry Smith     /* count collections of adjacent columns in each inode */
7770def2e27SBarry Smith     row = 0;
7780def2e27SBarry Smith     cnt = 0;
7790def2e27SBarry Smith     for (i = 0; i < node_count; i++) {
7800def2e27SBarry Smith       cols = aj + ai[row] + a->inode.size[i];
7810def2e27SBarry Smith       nz   = ai[row + 1] - ai[row] - a->inode.size[i];
7820def2e27SBarry Smith       for (j = 1; j < nz; j++) {
78326fbe8dcSKarl Rupp         if (cols[j] != cols[j - 1] + 1) cnt++;
7840def2e27SBarry Smith       }
7850def2e27SBarry Smith       cnt++;
7860def2e27SBarry Smith       row += a->inode.size[i];
7870def2e27SBarry Smith     }
7889566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(2 * cnt, &counts));
7890def2e27SBarry Smith     cnt = 0;
7900def2e27SBarry Smith     row = 0;
7910def2e27SBarry Smith     for (i = 0; i < node_count; i++) {
7920def2e27SBarry Smith       cols            = aj + ai[row] + a->inode.size[i];
7930def2e27SBarry Smith       counts[2 * cnt] = cols[0];
7940def2e27SBarry Smith       nz              = ai[row + 1] - ai[row] - a->inode.size[i];
7950def2e27SBarry Smith       cnt2            = 1;
7960def2e27SBarry Smith       for (j = 1; j < nz; j++) {
7970def2e27SBarry Smith         if (cols[j] != cols[j - 1] + 1) {
7980def2e27SBarry Smith           counts[2 * (cnt++) + 1] = cnt2;
7990def2e27SBarry Smith           counts[2 * cnt]         = cols[j];
8000def2e27SBarry Smith           cnt2                    = 1;
8010def2e27SBarry Smith         } else cnt2++;
8020def2e27SBarry Smith       }
8030def2e27SBarry Smith       counts[2 * (cnt++) + 1] = cnt2;
8040def2e27SBarry Smith       row += a->inode.size[i];
8050def2e27SBarry Smith     }
8069566063dSJacob Faibussowitsch     PetscCall(PetscIntView(2 * cnt, counts, NULL));
8070def2e27SBarry Smith   }
8083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
80938702af4SBarry Smith }
81038702af4SBarry Smith 
811d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqSBAIJ(Mat A, MatAssemblyType mode)
812d71ae5a4SJacob Faibussowitsch {
81349b5e25fSSatish Balay   Mat_SeqSBAIJ *a      = (Mat_SeqSBAIJ *)A->data;
8148f8f2f0dSBarry Smith   PetscInt      fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
815d0f46423SBarry Smith   PetscInt      m = A->rmap->N, *ip, N, *ailen = a->ilen;
81613f74950SBarry Smith   PetscInt      mbs = a->mbs, bs2 = a->bs2, rmax = 0;
81749b5e25fSSatish Balay   MatScalar    *aa = a->a, *ap;
81849b5e25fSSatish Balay 
81949b5e25fSSatish Balay   PetscFunctionBegin;
8203ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
82149b5e25fSSatish Balay 
82249b5e25fSSatish Balay   if (m) rmax = ailen[0];
82349b5e25fSSatish Balay   for (i = 1; i < mbs; i++) {
82449b5e25fSSatish Balay     /* move each row back by the amount of empty slots (fshift) before it*/
82549b5e25fSSatish Balay     fshift += imax[i - 1] - ailen[i - 1];
82649b5e25fSSatish Balay     rmax = PetscMax(rmax, ailen[i]);
82749b5e25fSSatish Balay     if (fshift) {
828580bdb30SBarry Smith       ip = aj + ai[i];
829580bdb30SBarry Smith       ap = aa + bs2 * ai[i];
83049b5e25fSSatish Balay       N  = ailen[i];
8319566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
8329566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ap - bs2 * fshift, ap, bs2 * N));
83349b5e25fSSatish Balay     }
83449b5e25fSSatish Balay     ai[i] = ai[i - 1] + ailen[i - 1];
83549b5e25fSSatish Balay   }
83649b5e25fSSatish Balay   if (mbs) {
83749b5e25fSSatish Balay     fshift += imax[mbs - 1] - ailen[mbs - 1];
83849b5e25fSSatish Balay     ai[mbs] = ai[mbs - 1] + ailen[mbs - 1];
83949b5e25fSSatish Balay   }
84049b5e25fSSatish Balay   /* reset ilen and imax for each row */
841ad540459SPierre Jolivet   for (i = 0; i < mbs; i++) ailen[i] = imax[i] = ai[i + 1] - ai[i];
8426c6c5352SBarry Smith   a->nz = ai[mbs];
84349b5e25fSSatish Balay 
844b424e231SHong Zhang   /* diagonals may have moved, reset it */
8451baa6e33SBarry Smith   if (a->diag) PetscCall(PetscArraycpy(a->diag, ai, mbs));
846aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT " block size %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, A->rmap->bs, fshift * bs2);
84726fbe8dcSKarl Rupp 
8489566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT ", block size %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded, %" PetscInt_FMT " used\n", m, A->rmap->N, A->rmap->bs, fshift * bs2, a->nz * bs2));
8499566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues is %" PetscInt_FMT "\n", a->reallocs));
8509566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Most nonzeros blocks in any row is %" PetscInt_FMT "\n", rmax));
85126fbe8dcSKarl Rupp 
8528e58a170SBarry Smith   A->info.mallocs += a->reallocs;
85349b5e25fSSatish Balay   a->reallocs         = 0;
85449b5e25fSSatish Balay   A->info.nz_unneeded = (PetscReal)fshift * bs2;
855061b2667SBarry Smith   a->idiagvalid       = PETSC_FALSE;
8564dcd73b1SHong Zhang   a->rmax             = rmax;
85738702af4SBarry Smith 
85838702af4SBarry Smith   if (A->cmap->n < 65536 && A->cmap->bs == 1) {
85944e1c64aSLisandro Dalcin     if (a->jshort && a->free_jshort) {
86017803ae8SHong Zhang       /* when matrix data structure is changed, previous jshort must be replaced */
8619566063dSJacob Faibussowitsch       PetscCall(PetscFree(a->jshort));
86217803ae8SHong Zhang     }
8639566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(a->i[A->rmap->n], &a->jshort));
86438702af4SBarry Smith     for (i = 0; i < a->i[A->rmap->n]; i++) a->jshort[i] = a->j[i];
86538702af4SBarry Smith     A->ops->mult   = MatMult_SeqSBAIJ_1_ushort;
86641f059aeSBarry Smith     A->ops->sor    = MatSOR_SeqSBAIJ_ushort;
8674da8f245SBarry Smith     a->free_jshort = PETSC_TRUE;
86838702af4SBarry Smith   }
8693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
87049b5e25fSSatish Balay }
87149b5e25fSSatish Balay 
87249b5e25fSSatish Balay /*
87349b5e25fSSatish Balay    This function returns an array of flags which indicate the locations of contiguous
87449b5e25fSSatish Balay    blocks that should be zeroed. for eg: if bs = 3  and is = [0,1,2,3,5,6,7,8,9]
875a5b23f4aSJose E. Roman    then the resulting sizes = [3,1,1,3,1] corresponding to sets [(0,1,2),(3),(5),(6,7,8),(9)]
87649b5e25fSSatish Balay    Assume: sizes should be long enough to hold all the values.
87749b5e25fSSatish Balay */
878d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqSBAIJ_Check_Blocks(PetscInt idx[], PetscInt n, PetscInt bs, PetscInt sizes[], PetscInt *bs_max)
879d71ae5a4SJacob Faibussowitsch {
88013f74950SBarry Smith   PetscInt  i, j, k, row;
881ace3abfcSBarry Smith   PetscBool flg;
88249b5e25fSSatish Balay 
88349b5e25fSSatish Balay   PetscFunctionBegin;
88449b5e25fSSatish Balay   for (i = 0, j = 0; i < n; j++) {
88549b5e25fSSatish Balay     row = idx[i];
886a5b23f4aSJose E. Roman     if (row % bs != 0) { /* Not the beginning of a block */
88749b5e25fSSatish Balay       sizes[j] = 1;
88849b5e25fSSatish Balay       i++;
88949b5e25fSSatish Balay     } else if (i + bs > n) { /* Beginning of a block, but complete block doesn't exist (at idx end) */
89049b5e25fSSatish Balay       sizes[j] = 1;          /* Also makes sure at least 'bs' values exist for next else */
89149b5e25fSSatish Balay       i++;
8926aad120cSJose E. Roman     } else { /* Beginning of the block, so check if the complete block exists */
89349b5e25fSSatish Balay       flg = PETSC_TRUE;
89449b5e25fSSatish Balay       for (k = 1; k < bs; k++) {
89549b5e25fSSatish Balay         if (row + k != idx[i + k]) { /* break in the block */
89649b5e25fSSatish Balay           flg = PETSC_FALSE;
89749b5e25fSSatish Balay           break;
89849b5e25fSSatish Balay         }
89949b5e25fSSatish Balay       }
900abc0a331SBarry Smith       if (flg) { /* No break in the bs */
90149b5e25fSSatish Balay         sizes[j] = bs;
90249b5e25fSSatish Balay         i += bs;
90349b5e25fSSatish Balay       } else {
90449b5e25fSSatish Balay         sizes[j] = 1;
90549b5e25fSSatish Balay         i++;
90649b5e25fSSatish Balay       }
90749b5e25fSSatish Balay     }
90849b5e25fSSatish Balay   }
90949b5e25fSSatish Balay   *bs_max = j;
9103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
91149b5e25fSSatish Balay }
91249b5e25fSSatish Balay 
91349b5e25fSSatish Balay /* Only add/insert a(i,j) with i<=j (blocks).
914da81f932SPierre Jolivet    Any a(i,j) with i>j input by user is ignored.
91549b5e25fSSatish Balay */
91649b5e25fSSatish Balay 
917d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqSBAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
918d71ae5a4SJacob Faibussowitsch {
91949b5e25fSSatish Balay   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
920e2ee6c50SBarry Smith   PetscInt     *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N, lastcol = -1;
92113f74950SBarry Smith   PetscInt     *imax = a->imax, *ai = a->i, *ailen = a->ilen, roworiented = a->roworiented;
922d0f46423SBarry Smith   PetscInt     *aj = a->j, nonew = a->nonew, bs = A->rmap->bs, brow, bcol;
92313f74950SBarry Smith   PetscInt      ridx, cidx, bs2                 = a->bs2;
92449b5e25fSSatish Balay   MatScalar    *ap, value, *aa                  = a->a, *bap;
92549b5e25fSSatish Balay 
92649b5e25fSSatish Balay   PetscFunctionBegin;
92749b5e25fSSatish Balay   for (k = 0; k < m; k++) { /* loop over added rows */
92849b5e25fSSatish Balay     row  = im[k];           /* row number */
92949b5e25fSSatish Balay     brow = row / bs;        /* block row number */
93049b5e25fSSatish Balay     if (row < 0) continue;
9316bdcaf15SBarry Smith     PetscCheck(row < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->N - 1);
93249b5e25fSSatish Balay     rp   = aj + ai[brow];       /*ptr to beginning of column value of the row block*/
93349b5e25fSSatish Balay     ap   = aa + bs2 * ai[brow]; /*ptr to beginning of element value of the row block*/
93449b5e25fSSatish Balay     rmax = imax[brow];          /* maximum space allocated for this row */
93549b5e25fSSatish Balay     nrow = ailen[brow];         /* actual length of this row */
93649b5e25fSSatish Balay     low  = 0;
9378509e838SStefano Zampini     high = nrow;
93849b5e25fSSatish Balay     for (l = 0; l < n; l++) { /* loop over added columns */
93949b5e25fSSatish Balay       if (in[l] < 0) continue;
9406bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->N - 1);
94149b5e25fSSatish Balay       col  = in[l];
94249b5e25fSSatish Balay       bcol = col / bs; /* block col number */
94349b5e25fSSatish Balay 
944941593c8SHong Zhang       if (brow > bcol) {
94526fbe8dcSKarl Rupp         if (a->ignore_ltriangular) continue; /* ignore lower triangular values */
94626fbe8dcSKarl Rupp         else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_USER, "Lower triangular value cannot be set for sbaij format. Ignoring these values, run with -mat_ignore_lower_triangular or call MatSetOption(mat,MAT_IGNORE_LOWER_TRIANGULAR,PETSC_TRUE)");
947941593c8SHong Zhang       }
948f4989cb3SHong Zhang 
9499371c9d4SSatish Balay       ridx = row % bs;
9509371c9d4SSatish Balay       cidx = col % bs; /*row and col index inside the block */
9518549e402SHong Zhang       if ((brow == bcol && ridx <= cidx) || (brow < bcol)) {
95249b5e25fSSatish Balay         /* element value a(k,l) */
95326fbe8dcSKarl Rupp         if (roworiented) value = v[l + k * n];
95426fbe8dcSKarl Rupp         else value = v[k + l * m];
95549b5e25fSSatish Balay 
95649b5e25fSSatish Balay         /* move pointer bap to a(k,l) quickly and add/insert value */
95726fbe8dcSKarl Rupp         if (col <= lastcol) low = 0;
9588509e838SStefano Zampini         else high = nrow;
9598509e838SStefano Zampini 
960e2ee6c50SBarry Smith         lastcol = col;
96149b5e25fSSatish Balay         while (high - low > 7) {
96249b5e25fSSatish Balay           t = (low + high) / 2;
96349b5e25fSSatish Balay           if (rp[t] > bcol) high = t;
96449b5e25fSSatish Balay           else low = t;
96549b5e25fSSatish Balay         }
96649b5e25fSSatish Balay         for (i = low; i < high; i++) {
96749b5e25fSSatish Balay           if (rp[i] > bcol) break;
96849b5e25fSSatish Balay           if (rp[i] == bcol) {
96949b5e25fSSatish Balay             bap = ap + bs2 * i + bs * cidx + ridx;
97049b5e25fSSatish Balay             if (is == ADD_VALUES) *bap += value;
97149b5e25fSSatish Balay             else *bap = value;
9728549e402SHong Zhang             /* for diag block, add/insert its symmetric element a(cidx,ridx) */
9738549e402SHong Zhang             if (brow == bcol && ridx < cidx) {
9748549e402SHong Zhang               bap = ap + bs2 * i + bs * ridx + cidx;
9758549e402SHong Zhang               if (is == ADD_VALUES) *bap += value;
9768549e402SHong Zhang               else *bap = value;
9778549e402SHong Zhang             }
97849b5e25fSSatish Balay             goto noinsert1;
97949b5e25fSSatish Balay           }
98049b5e25fSSatish Balay         }
98149b5e25fSSatish Balay 
98249b5e25fSSatish Balay         if (nonew == 1) goto noinsert1;
98308401ef6SPierre Jolivet         PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero (%" PetscInt_FMT ", %" PetscInt_FMT ") in the matrix", row, col);
984fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, a->mbs, bs2, nrow, brow, bcol, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
98549b5e25fSSatish Balay 
9869371c9d4SSatish Balay         N = nrow++ - 1;
9879371c9d4SSatish Balay         high++;
98849b5e25fSSatish Balay         /* shift up all the later entries in this row */
9899566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
9909566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + bs2 * (i + 1), ap + bs2 * i, bs2 * (N - i + 1)));
9919566063dSJacob Faibussowitsch         PetscCall(PetscArrayzero(ap + bs2 * i, bs2));
99249b5e25fSSatish Balay         rp[i]                          = bcol;
99349b5e25fSSatish Balay         ap[bs2 * i + bs * cidx + ridx] = value;
9948509e838SStefano Zampini         /* for diag block, add/insert its symmetric element a(cidx,ridx) */
995ad540459SPierre Jolivet         if (brow == bcol && ridx < cidx) ap[bs2 * i + bs * ridx + cidx] = value;
996e56f5c9eSBarry Smith         A->nonzerostate++;
99749b5e25fSSatish Balay       noinsert1:;
99849b5e25fSSatish Balay         low = i;
9998549e402SHong Zhang       }
100049b5e25fSSatish Balay     } /* end of loop over added columns */
100149b5e25fSSatish Balay     ailen[brow] = nrow;
100249b5e25fSSatish Balay   } /* end of loop over added rows */
10033ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
100449b5e25fSSatish Balay }
100549b5e25fSSatish Balay 
1006d71ae5a4SJacob Faibussowitsch PetscErrorCode MatICCFactor_SeqSBAIJ(Mat inA, IS row, const MatFactorInfo *info)
1007d71ae5a4SJacob Faibussowitsch {
10084ccecd49SHong Zhang   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)inA->data;
100949b5e25fSSatish Balay   Mat           outA;
1010ace3abfcSBarry Smith   PetscBool     row_identity;
101149b5e25fSSatish Balay 
101249b5e25fSSatish Balay   PetscFunctionBegin;
101308401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 is supported for in-place icc");
10149566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
101528b400f6SJacob Faibussowitsch   PetscCheck(row_identity, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix reordering is not supported");
101608401ef6SPierre Jolivet   PetscCheck(inA->rmap->bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "Matrix block size %" PetscInt_FMT " is not supported", inA->rmap->bs); /* Need to replace MatCholeskyFactorSymbolic_SeqSBAIJ_MSR()! */
1017c84f5b01SHong Zhang 
101849b5e25fSSatish Balay   outA            = inA;
1019d5f3da31SBarry Smith   inA->factortype = MAT_FACTOR_ICC;
10209566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
10219566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
102249b5e25fSSatish Balay 
10239566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqSBAIJ(inA));
10249566063dSJacob Faibussowitsch   PetscCall(MatSeqSBAIJSetNumericFactorization_inplace(inA, row_identity));
102549b5e25fSSatish Balay 
10269566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
10279566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
1028c84f5b01SHong Zhang   a->row = row;
10299566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
10309566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
1031c84f5b01SHong Zhang   a->col = row;
1032c84f5b01SHong Zhang 
1033c84f5b01SHong Zhang   /* Create the invert permutation so that it can be used in MatCholeskyFactorNumeric() */
10349566063dSJacob Faibussowitsch   if (a->icol) PetscCall(ISInvertPermutation(row, PETSC_DECIDE, &a->icol));
103549b5e25fSSatish Balay 
10364dfa11a4SJacob Faibussowitsch   if (!a->solve_work) { PetscCall(PetscMalloc1(inA->rmap->N + inA->rmap->bs, &a->solve_work)); }
103749b5e25fSSatish Balay 
10389566063dSJacob Faibussowitsch   PetscCall(MatCholeskyFactorNumeric(outA, inA, info));
10393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
104049b5e25fSSatish Balay }
1041950f1e5bSHong Zhang 
1042d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices_SeqSBAIJ(Mat mat, PetscInt *indices)
1043d71ae5a4SJacob Faibussowitsch {
1044045c9aa0SHong Zhang   Mat_SeqSBAIJ *baij = (Mat_SeqSBAIJ *)mat->data;
104513f74950SBarry Smith   PetscInt      i, nz, n;
104649b5e25fSSatish Balay 
104749b5e25fSSatish Balay   PetscFunctionBegin;
10486c6c5352SBarry Smith   nz = baij->maxnz;
1049d0f46423SBarry Smith   n  = mat->cmap->n;
105026fbe8dcSKarl Rupp   for (i = 0; i < nz; i++) baij->j[i] = indices[i];
105126fbe8dcSKarl Rupp 
10526c6c5352SBarry Smith   baij->nz = nz;
105326fbe8dcSKarl Rupp   for (i = 0; i < n; i++) baij->ilen[i] = baij->imax[i];
105426fbe8dcSKarl Rupp 
10559566063dSJacob Faibussowitsch   PetscCall(MatSetOption(mat, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
10563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
105749b5e25fSSatish Balay }
105849b5e25fSSatish Balay 
105949b5e25fSSatish Balay /*@
106019585528SSatish Balay   MatSeqSBAIJSetColumnIndices - Set the column indices for all the rows
106111a5261eSBarry Smith   in a `MATSEQSBAIJ` matrix.
106249b5e25fSSatish Balay 
106349b5e25fSSatish Balay   Input Parameters:
106411a5261eSBarry Smith   +  mat     - the `MATSEQSBAIJ` matrix
106549b5e25fSSatish Balay   -  indices - the column indices
106649b5e25fSSatish Balay 
106749b5e25fSSatish Balay   Level: advanced
106849b5e25fSSatish Balay 
106949b5e25fSSatish Balay   Notes:
107049b5e25fSSatish Balay   This can be called if you have precomputed the nonzero structure of the
107149b5e25fSSatish Balay   matrix and want to provide it to the matrix object to improve the performance
107211a5261eSBarry Smith   of the `MatSetValues()` operation.
107349b5e25fSSatish Balay 
107449b5e25fSSatish Balay   You MUST have set the correct numbers of nonzeros per row in the call to
107511a5261eSBarry Smith   `MatCreateSeqSBAIJ()`, and the columns indices MUST be sorted.
107649b5e25fSSatish Balay 
1077ab9f2c04SSatish Balay   MUST be called before any calls to MatSetValues()
107849b5e25fSSatish Balay 
107911a5261eSBarry Smith  .seealso: `MATSEQSBAIJ`, `MatCreateSeqSBAIJ`
108049b5e25fSSatish Balay @*/
1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetColumnIndices(Mat mat, PetscInt *indices)
1082d71ae5a4SJacob Faibussowitsch {
108349b5e25fSSatish Balay   PetscFunctionBegin;
10840700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
1085dadcf809SJacob Faibussowitsch   PetscValidIntPointer(indices, 2);
1086cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqSBAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
10873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
108849b5e25fSSatish Balay }
108949b5e25fSSatish Balay 
1090d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqSBAIJ(Mat A, Mat B, MatStructure str)
1091d71ae5a4SJacob Faibussowitsch {
10924c7a3774SStefano Zampini   PetscBool isbaij;
10933c896bc6SHong Zhang 
10943c896bc6SHong Zhang   PetscFunctionBegin;
10959566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompareAny((PetscObject)B, &isbaij, MATSEQSBAIJ, MATMPISBAIJ, ""));
109628b400f6SJacob Faibussowitsch   PetscCheck(isbaij, PetscObjectComm((PetscObject)B), PETSC_ERR_SUP, "Not for matrix type %s", ((PetscObject)B)->type_name);
10974c7a3774SStefano Zampini   /* If the two matrices have the same copy implementation and nonzero pattern, use fast copy. */
10984c7a3774SStefano Zampini   if (str == SAME_NONZERO_PATTERN && A->ops->copy == B->ops->copy) {
10993c896bc6SHong Zhang     Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
11003c896bc6SHong Zhang     Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data;
11013c896bc6SHong Zhang 
110208401ef6SPierre Jolivet     PetscCheck(a->i[a->mbs] == b->i[b->mbs], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different");
110308401ef6SPierre Jolivet     PetscCheck(a->mbs == b->mbs, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of rows in two matrices are different");
110408401ef6SPierre Jolivet     PetscCheck(a->bs2 == b->bs2, PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Different block size");
11059566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->a, a->a, a->bs2 * a->i[a->mbs]));
11069566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
11073c896bc6SHong Zhang   } else {
11089566063dSJacob Faibussowitsch     PetscCall(MatGetRowUpperTriangular(A));
11099566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
11109566063dSJacob Faibussowitsch     PetscCall(MatRestoreRowUpperTriangular(A));
11113c896bc6SHong Zhang   }
11123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
11133c896bc6SHong Zhang }
11143c896bc6SHong Zhang 
1115d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJGetArray_SeqSBAIJ(Mat A, PetscScalar *array[])
1116d71ae5a4SJacob Faibussowitsch {
1117a6ece127SHong Zhang   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
11185fd66863SKarl Rupp 
1119a6ece127SHong Zhang   PetscFunctionBegin;
1120a6ece127SHong Zhang   *array = a->a;
11213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1122a6ece127SHong Zhang }
1123a6ece127SHong Zhang 
1124d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJRestoreArray_SeqSBAIJ(Mat A, PetscScalar *array[])
1125d71ae5a4SJacob Faibussowitsch {
1126a6ece127SHong Zhang   PetscFunctionBegin;
1127cda14afcSprj-   *array = NULL;
11283ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1129a6ece127SHong Zhang }
1130a6ece127SHong Zhang 
1131d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqSBAIJ(Mat Y, Mat X, PetscInt *nnz)
1132d71ae5a4SJacob Faibussowitsch {
1133b264fe52SHong Zhang   PetscInt      bs = Y->rmap->bs, mbs = Y->rmap->N / bs;
113452768537SHong Zhang   Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data;
113552768537SHong Zhang   Mat_SeqSBAIJ *y = (Mat_SeqSBAIJ *)Y->data;
113652768537SHong Zhang 
113752768537SHong Zhang   PetscFunctionBegin;
113852768537SHong Zhang   /* Set the number of nonzeros in the new matrix */
11399566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(mbs, x->i, x->j, y->i, y->j, nnz));
11403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
114152768537SHong Zhang }
114252768537SHong Zhang 
1143d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqSBAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
1144d71ae5a4SJacob Faibussowitsch {
114542ee4b1aSHong Zhang   Mat_SeqSBAIJ *x = (Mat_SeqSBAIJ *)X->data, *y = (Mat_SeqSBAIJ *)Y->data;
114631ce2d13SHong Zhang   PetscInt      bs = Y->rmap->bs, bs2 = bs * bs;
1147e838b9e7SJed Brown   PetscBLASInt  one = 1;
114842ee4b1aSHong Zhang 
114942ee4b1aSHong Zhang   PetscFunctionBegin;
1150134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
1151134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz && x->mbs == y->mbs ? PETSC_TRUE : PETSC_FALSE;
1152134adf20SPierre Jolivet     if (e) {
11539566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, x->mbs + 1, &e));
1154134adf20SPierre Jolivet       if (e) {
11559566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, x->i[x->mbs], &e));
1156134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
1157134adf20SPierre Jolivet       }
1158134adf20SPierre Jolivet     }
115954c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
1160134adf20SPierre Jolivet   }
116142ee4b1aSHong Zhang   if (str == SAME_NONZERO_PATTERN) {
1162f4df32b1SMatthew Knepley     PetscScalar  alpha = a;
1163c5df96a5SBarry Smith     PetscBLASInt bnz;
11649566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz * bs2, &bnz));
1165792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, x->a, &one, y->a, &one));
11669566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
1167ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
11689566063dSJacob Faibussowitsch     PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_TRUE));
11699566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
11709566063dSJacob Faibussowitsch     PetscCall(MatSetOption(X, MAT_GETROW_UPPERTRIANGULAR, PETSC_FALSE));
117142ee4b1aSHong Zhang   } else {
117252768537SHong Zhang     Mat       B;
117352768537SHong Zhang     PetscInt *nnz;
117454c59aa7SJacob Faibussowitsch     PetscCheck(bs == X->rmap->bs, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Matrices must have same block size");
11759566063dSJacob Faibussowitsch     PetscCall(MatGetRowUpperTriangular(X));
11769566063dSJacob Faibussowitsch     PetscCall(MatGetRowUpperTriangular(Y));
11779566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
11789566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
11799566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
11809566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, Y->rmap->n, Y->cmap->n, Y->rmap->N, Y->cmap->N));
11819566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, Y, Y));
11829566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
11839566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqSBAIJ(Y, X, nnz));
11849566063dSJacob Faibussowitsch     PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz));
118552768537SHong Zhang 
11869566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
118752768537SHong Zhang 
11889566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
11899566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
11909566063dSJacob Faibussowitsch     PetscCall(MatRestoreRowUpperTriangular(X));
11919566063dSJacob Faibussowitsch     PetscCall(MatRestoreRowUpperTriangular(Y));
119242ee4b1aSHong Zhang   }
11933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
119442ee4b1aSHong Zhang }
119542ee4b1aSHong Zhang 
1196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg)
1197d71ae5a4SJacob Faibussowitsch {
1198efcf0fc3SBarry Smith   PetscFunctionBegin;
1199efcf0fc3SBarry Smith   *flg = PETSC_TRUE;
12003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1201efcf0fc3SBarry Smith }
1202efcf0fc3SBarry Smith 
1203d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsStructurallySymmetric_SeqSBAIJ(Mat A, PetscBool *flg)
1204d71ae5a4SJacob Faibussowitsch {
1205efcf0fc3SBarry Smith   PetscFunctionBegin;
1206efcf0fc3SBarry Smith   *flg = PETSC_TRUE;
12073ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1208efcf0fc3SBarry Smith }
1209efcf0fc3SBarry Smith 
1210d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqSBAIJ(Mat A, PetscReal tol, PetscBool *flg)
1211d71ae5a4SJacob Faibussowitsch {
1212efcf0fc3SBarry Smith   PetscFunctionBegin;
1213efcf0fc3SBarry Smith   *flg = PETSC_FALSE;
12143ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1215efcf0fc3SBarry Smith }
1216efcf0fc3SBarry Smith 
1217d71ae5a4SJacob Faibussowitsch PetscErrorCode MatConjugate_SeqSBAIJ(Mat A)
1218d71ae5a4SJacob Faibussowitsch {
12192726fb6dSPierre Jolivet #if defined(PETSC_USE_COMPLEX)
12202726fb6dSPierre Jolivet   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
12212726fb6dSPierre Jolivet   PetscInt      i, nz = a->bs2 * a->i[a->mbs];
12222726fb6dSPierre Jolivet   MatScalar    *aa = a->a;
12232726fb6dSPierre Jolivet 
12242726fb6dSPierre Jolivet   PetscFunctionBegin;
12252726fb6dSPierre Jolivet   for (i = 0; i < nz; i++) aa[i] = PetscConj(aa[i]);
12262726fb6dSPierre Jolivet #else
12272726fb6dSPierre Jolivet   PetscFunctionBegin;
12282726fb6dSPierre Jolivet #endif
12293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
12302726fb6dSPierre Jolivet }
12312726fb6dSPierre Jolivet 
1232d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqSBAIJ(Mat A)
1233d71ae5a4SJacob Faibussowitsch {
123499cafbc1SBarry Smith   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
123599cafbc1SBarry Smith   PetscInt      i, nz = a->bs2 * a->i[a->mbs];
1236dd6ea824SBarry Smith   MatScalar    *aa = a->a;
123799cafbc1SBarry Smith 
123899cafbc1SBarry Smith   PetscFunctionBegin;
123999cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
12403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
124199cafbc1SBarry Smith }
124299cafbc1SBarry Smith 
1243d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqSBAIJ(Mat A)
1244d71ae5a4SJacob Faibussowitsch {
124599cafbc1SBarry Smith   Mat_SeqSBAIJ *a = (Mat_SeqSBAIJ *)A->data;
124699cafbc1SBarry Smith   PetscInt      i, nz = a->bs2 * a->i[a->mbs];
1247dd6ea824SBarry Smith   MatScalar    *aa = a->a;
124899cafbc1SBarry Smith 
124999cafbc1SBarry Smith   PetscFunctionBegin;
125099cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
12513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
125299cafbc1SBarry Smith }
125399cafbc1SBarry Smith 
1254d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqSBAIJ(Mat A, PetscInt is_n, const PetscInt is_idx[], PetscScalar diag, Vec x, Vec b)
1255d71ae5a4SJacob Faibussowitsch {
12563bededecSBarry Smith   Mat_SeqSBAIJ      *baij = (Mat_SeqSBAIJ *)A->data;
12573bededecSBarry Smith   PetscInt           i, j, k, count;
12583bededecSBarry Smith   PetscInt           bs = A->rmap->bs, bs2 = baij->bs2, row, col;
12593bededecSBarry Smith   PetscScalar        zero = 0.0;
12603bededecSBarry Smith   MatScalar         *aa;
12613bededecSBarry Smith   const PetscScalar *xx;
12623bededecSBarry Smith   PetscScalar       *bb;
126356777dd2SBarry Smith   PetscBool         *zeroed, vecs = PETSC_FALSE;
12643bededecSBarry Smith 
12653bededecSBarry Smith   PetscFunctionBegin;
12663bededecSBarry Smith   /* fix right hand side if needed */
12673bededecSBarry Smith   if (x && b) {
12689566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
12699566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
127056777dd2SBarry Smith     vecs = PETSC_TRUE;
12713bededecSBarry Smith   }
12723bededecSBarry Smith 
12733bededecSBarry Smith   /* zero the columns */
12749566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
12753bededecSBarry Smith   for (i = 0; i < is_n; i++) {
1276aed4548fSBarry Smith     PetscCheck(is_idx[i] >= 0 && is_idx[i] < A->rmap->N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", is_idx[i]);
12773bededecSBarry Smith     zeroed[is_idx[i]] = PETSC_TRUE;
12783bededecSBarry Smith   }
127956777dd2SBarry Smith   if (vecs) {
128056777dd2SBarry Smith     for (i = 0; i < A->rmap->N; i++) {
128156777dd2SBarry Smith       row = i / bs;
128256777dd2SBarry Smith       for (j = baij->i[row]; j < baij->i[row + 1]; j++) {
128356777dd2SBarry Smith         for (k = 0; k < bs; k++) {
128456777dd2SBarry Smith           col = bs * baij->j[j] + k;
128556777dd2SBarry Smith           if (col <= i) continue;
128656777dd2SBarry Smith           aa = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k;
128726fbe8dcSKarl Rupp           if (!zeroed[i] && zeroed[col]) bb[i] -= aa[0] * xx[col];
128826fbe8dcSKarl Rupp           if (zeroed[i] && !zeroed[col]) bb[col] -= aa[0] * xx[i];
128956777dd2SBarry Smith         }
129056777dd2SBarry Smith       }
129156777dd2SBarry Smith     }
129226fbe8dcSKarl Rupp     for (i = 0; i < is_n; i++) bb[is_idx[i]] = diag * xx[is_idx[i]];
129356777dd2SBarry Smith   }
129456777dd2SBarry Smith 
12953bededecSBarry Smith   for (i = 0; i < A->rmap->N; i++) {
12963bededecSBarry Smith     if (!zeroed[i]) {
12973bededecSBarry Smith       row = i / bs;
12983bededecSBarry Smith       for (j = baij->i[row]; j < baij->i[row + 1]; j++) {
12993bededecSBarry Smith         for (k = 0; k < bs; k++) {
13003bededecSBarry Smith           col = bs * baij->j[j] + k;
13013bededecSBarry Smith           if (zeroed[col]) {
13023bededecSBarry Smith             aa    = ((MatScalar *)(baij->a)) + j * bs2 + (i % bs) + bs * k;
13033bededecSBarry Smith             aa[0] = 0.0;
13043bededecSBarry Smith           }
13053bededecSBarry Smith         }
13063bededecSBarry Smith       }
13073bededecSBarry Smith     }
13083bededecSBarry Smith   }
13099566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
131056777dd2SBarry Smith   if (vecs) {
13119566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
13129566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
131356777dd2SBarry Smith   }
13143bededecSBarry Smith 
13153bededecSBarry Smith   /* zero the rows */
13163bededecSBarry Smith   for (i = 0; i < is_n; i++) {
13173bededecSBarry Smith     row   = is_idx[i];
13183bededecSBarry Smith     count = (baij->i[row / bs + 1] - baij->i[row / bs]) * bs;
13193bededecSBarry Smith     aa    = ((MatScalar *)(baij->a)) + baij->i[row / bs] * bs2 + (row % bs);
13203bededecSBarry Smith     for (k = 0; k < count; k++) {
13213bededecSBarry Smith       aa[0] = zero;
13223bededecSBarry Smith       aa += bs;
13233bededecSBarry Smith     }
1324dbbe0bcdSBarry Smith     if (diag != 0.0) PetscUseTypeMethod(A, setvalues, 1, &row, 1, &row, &diag, INSERT_VALUES);
13253bededecSBarry Smith   }
13269566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqSBAIJ(A, MAT_FINAL_ASSEMBLY));
13273ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
13283bededecSBarry Smith }
13293bededecSBarry Smith 
1330d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqSBAIJ(Mat Y, PetscScalar a)
1331d71ae5a4SJacob Faibussowitsch {
13327d68702bSBarry Smith   Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)Y->data;
13337d68702bSBarry Smith 
13347d68702bSBarry Smith   PetscFunctionBegin;
133548a46eb9SPierre Jolivet   if (!Y->preallocated || !aij->nz) PetscCall(MatSeqSBAIJSetPreallocation(Y, Y->rmap->bs, 1, NULL));
13369566063dSJacob Faibussowitsch   PetscCall(MatShift_Basic(Y, a));
13373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
13387d68702bSBarry Smith }
13397d68702bSBarry Smith 
134049b5e25fSSatish Balay /* -------------------------------------------------------------------*/
13413964eb88SJed Brown static struct _MatOps MatOps_Values = {MatSetValues_SeqSBAIJ,
134249b5e25fSSatish Balay                                        MatGetRow_SeqSBAIJ,
134349b5e25fSSatish Balay                                        MatRestoreRow_SeqSBAIJ,
134449b5e25fSSatish Balay                                        MatMult_SeqSBAIJ_N,
134597304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqSBAIJ_N,
1346431c96f7SBarry Smith                                        MatMult_SeqSBAIJ_N, /* transpose versions are same as non-transpose versions */
1347e005ede5SBarry Smith                                        MatMultAdd_SeqSBAIJ_N,
1348f4259b30SLisandro Dalcin                                        NULL,
1349f4259b30SLisandro Dalcin                                        NULL,
1350f4259b30SLisandro Dalcin                                        NULL,
1351f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
1352f4259b30SLisandro Dalcin                                        NULL,
1353c078aec8SLisandro Dalcin                                        MatCholeskyFactor_SeqSBAIJ,
135441f059aeSBarry Smith                                        MatSOR_SeqSBAIJ,
135549b5e25fSSatish Balay                                        MatTranspose_SeqSBAIJ,
135697304618SKris Buschelman                                        /* 15*/ MatGetInfo_SeqSBAIJ,
135749b5e25fSSatish Balay                                        MatEqual_SeqSBAIJ,
135849b5e25fSSatish Balay                                        MatGetDiagonal_SeqSBAIJ,
135949b5e25fSSatish Balay                                        MatDiagonalScale_SeqSBAIJ,
136049b5e25fSSatish Balay                                        MatNorm_SeqSBAIJ,
1361f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
136249b5e25fSSatish Balay                                        MatAssemblyEnd_SeqSBAIJ,
136349b5e25fSSatish Balay                                        MatSetOption_SeqSBAIJ,
136449b5e25fSSatish Balay                                        MatZeroEntries_SeqSBAIJ,
1365f4259b30SLisandro Dalcin                                        /* 24*/ NULL,
1366f4259b30SLisandro Dalcin                                        NULL,
1367f4259b30SLisandro Dalcin                                        NULL,
1368f4259b30SLisandro Dalcin                                        NULL,
1369f4259b30SLisandro Dalcin                                        NULL,
1370*26cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
1371f4259b30SLisandro Dalcin                                        NULL,
1372f4259b30SLisandro Dalcin                                        NULL,
1373f4259b30SLisandro Dalcin                                        NULL,
1374f4259b30SLisandro Dalcin                                        NULL,
1375d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqSBAIJ,
1376f4259b30SLisandro Dalcin                                        NULL,
1377f4259b30SLisandro Dalcin                                        NULL,
1378f4259b30SLisandro Dalcin                                        NULL,
1379c84f5b01SHong Zhang                                        MatICCFactor_SeqSBAIJ,
1380d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqSBAIJ,
13817dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqSBAIJ,
138249b5e25fSSatish Balay                                        MatIncreaseOverlap_SeqSBAIJ,
138349b5e25fSSatish Balay                                        MatGetValues_SeqSBAIJ,
13843c896bc6SHong Zhang                                        MatCopy_SeqSBAIJ,
1385f4259b30SLisandro Dalcin                                        /* 44*/ NULL,
138649b5e25fSSatish Balay                                        MatScale_SeqSBAIJ,
13877d68702bSBarry Smith                                        MatShift_SeqSBAIJ,
1388f4259b30SLisandro Dalcin                                        NULL,
13893bededecSBarry Smith                                        MatZeroRowsColumns_SeqSBAIJ,
1390f4259b30SLisandro Dalcin                                        /* 49*/ NULL,
139149b5e25fSSatish Balay                                        MatGetRowIJ_SeqSBAIJ,
139249b5e25fSSatish Balay                                        MatRestoreRowIJ_SeqSBAIJ,
1393f4259b30SLisandro Dalcin                                        NULL,
1394f4259b30SLisandro Dalcin                                        NULL,
1395f4259b30SLisandro Dalcin                                        /* 54*/ NULL,
1396f4259b30SLisandro Dalcin                                        NULL,
1397f4259b30SLisandro Dalcin                                        NULL,
1398dc29a518SPierre Jolivet                                        MatPermute_SeqSBAIJ,
139949b5e25fSSatish Balay                                        MatSetValuesBlocked_SeqSBAIJ,
14007dae84e0SHong Zhang                                        /* 59*/ MatCreateSubMatrix_SeqSBAIJ,
1401f4259b30SLisandro Dalcin                                        NULL,
1402f4259b30SLisandro Dalcin                                        NULL,
1403f4259b30SLisandro Dalcin                                        NULL,
1404f4259b30SLisandro Dalcin                                        NULL,
1405f4259b30SLisandro Dalcin                                        /* 64*/ NULL,
1406f4259b30SLisandro Dalcin                                        NULL,
1407f4259b30SLisandro Dalcin                                        NULL,
1408f4259b30SLisandro Dalcin                                        NULL,
1409f4259b30SLisandro Dalcin                                        NULL,
1410d519adbfSMatthew Knepley                                        /* 69*/ MatGetRowMaxAbs_SeqSBAIJ,
1411f4259b30SLisandro Dalcin                                        NULL,
141228d58a37SPierre Jolivet                                        MatConvert_MPISBAIJ_Basic,
1413f4259b30SLisandro Dalcin                                        NULL,
1414f4259b30SLisandro Dalcin                                        NULL,
1415f4259b30SLisandro Dalcin                                        /* 74*/ NULL,
1416f4259b30SLisandro Dalcin                                        NULL,
1417f4259b30SLisandro Dalcin                                        NULL,
1418f4259b30SLisandro Dalcin                                        NULL,
1419f4259b30SLisandro Dalcin                                        NULL,
1420f4259b30SLisandro Dalcin                                        /* 79*/ NULL,
1421f4259b30SLisandro Dalcin                                        NULL,
1422f4259b30SLisandro Dalcin                                        NULL,
142397304618SKris Buschelman                                        MatGetInertia_SeqSBAIJ,
14245bba2384SShri Abhyankar                                        MatLoad_SeqSBAIJ,
1425d519adbfSMatthew Knepley                                        /* 84*/ MatIsSymmetric_SeqSBAIJ,
1426865e5f61SKris Buschelman                                        MatIsHermitian_SeqSBAIJ,
1427efcf0fc3SBarry Smith                                        MatIsStructurallySymmetric_SeqSBAIJ,
1428f4259b30SLisandro Dalcin                                        NULL,
1429f4259b30SLisandro Dalcin                                        NULL,
1430f4259b30SLisandro Dalcin                                        /* 89*/ NULL,
1431f4259b30SLisandro Dalcin                                        NULL,
1432f4259b30SLisandro Dalcin                                        NULL,
1433f4259b30SLisandro Dalcin                                        NULL,
1434f4259b30SLisandro Dalcin                                        NULL,
1435f4259b30SLisandro Dalcin                                        /* 94*/ NULL,
1436f4259b30SLisandro Dalcin                                        NULL,
1437f4259b30SLisandro Dalcin                                        NULL,
1438f4259b30SLisandro Dalcin                                        NULL,
1439f4259b30SLisandro Dalcin                                        NULL,
1440f4259b30SLisandro Dalcin                                        /* 99*/ NULL,
1441f4259b30SLisandro Dalcin                                        NULL,
1442f4259b30SLisandro Dalcin                                        NULL,
14432726fb6dSPierre Jolivet                                        MatConjugate_SeqSBAIJ,
1444f4259b30SLisandro Dalcin                                        NULL,
1445f4259b30SLisandro Dalcin                                        /*104*/ NULL,
144699cafbc1SBarry Smith                                        MatRealPart_SeqSBAIJ,
1447f5edf698SHong Zhang                                        MatImaginaryPart_SeqSBAIJ,
1448f5edf698SHong Zhang                                        MatGetRowUpperTriangular_SeqSBAIJ,
14492af78befSBarry Smith                                        MatRestoreRowUpperTriangular_SeqSBAIJ,
1450f4259b30SLisandro Dalcin                                        /*109*/ NULL,
1451f4259b30SLisandro Dalcin                                        NULL,
1452f4259b30SLisandro Dalcin                                        NULL,
1453f4259b30SLisandro Dalcin                                        NULL,
1454547795f9SHong Zhang                                        MatMissingDiagonal_SeqSBAIJ,
1455f4259b30SLisandro Dalcin                                        /*114*/ NULL,
1456f4259b30SLisandro Dalcin                                        NULL,
1457f4259b30SLisandro Dalcin                                        NULL,
1458f4259b30SLisandro Dalcin                                        NULL,
1459f4259b30SLisandro Dalcin                                        NULL,
1460f4259b30SLisandro Dalcin                                        /*119*/ NULL,
1461f4259b30SLisandro Dalcin                                        NULL,
1462f4259b30SLisandro Dalcin                                        NULL,
1463f4259b30SLisandro Dalcin                                        NULL,
1464f4259b30SLisandro Dalcin                                        NULL,
1465f4259b30SLisandro Dalcin                                        /*124*/ NULL,
1466f4259b30SLisandro Dalcin                                        NULL,
1467f4259b30SLisandro Dalcin                                        NULL,
1468f4259b30SLisandro Dalcin                                        NULL,
1469f4259b30SLisandro Dalcin                                        NULL,
1470f4259b30SLisandro Dalcin                                        /*129*/ NULL,
1471f4259b30SLisandro Dalcin                                        NULL,
1472f4259b30SLisandro Dalcin                                        NULL,
1473f4259b30SLisandro Dalcin                                        NULL,
1474f4259b30SLisandro Dalcin                                        NULL,
1475f4259b30SLisandro Dalcin                                        /*134*/ NULL,
1476f4259b30SLisandro Dalcin                                        NULL,
1477f4259b30SLisandro Dalcin                                        NULL,
1478f4259b30SLisandro Dalcin                                        NULL,
1479f4259b30SLisandro Dalcin                                        NULL,
148046533700Sstefano_zampini                                        /*139*/ MatSetBlockSizes_Default,
1481f4259b30SLisandro Dalcin                                        NULL,
1482f4259b30SLisandro Dalcin                                        NULL,
1483f4259b30SLisandro Dalcin                                        NULL,
1484f4259b30SLisandro Dalcin                                        NULL,
1485d70f29a3SPierre Jolivet                                        /*144*/ MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ,
1486d70f29a3SPierre Jolivet                                        NULL,
1487d70f29a3SPierre Jolivet                                        NULL,
148899a7f59eSMark Adams                                        NULL,
148999a7f59eSMark Adams                                        NULL,
14907fb60732SBarry Smith                                        NULL,
1491dec0b466SHong Zhang                                        /*150*/ NULL,
1492dec0b466SHong Zhang                                        NULL};
1493be1d678aSKris Buschelman 
1494d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqSBAIJ(Mat mat)
1495d71ae5a4SJacob Faibussowitsch {
14964afc71dfSHong Zhang   Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data;
1497d0f46423SBarry Smith   PetscInt      nz  = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2;
149849b5e25fSSatish Balay 
149949b5e25fSSatish Balay   PetscFunctionBegin;
150008401ef6SPierre Jolivet   PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
150149b5e25fSSatish Balay 
150249b5e25fSSatish Balay   /* allocate space for values if not already there */
150348a46eb9SPierre Jolivet   if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values));
150449b5e25fSSatish Balay 
150549b5e25fSSatish Balay   /* copy values over */
15069566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
15073ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
150849b5e25fSSatish Balay }
150949b5e25fSSatish Balay 
1510d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqSBAIJ(Mat mat)
1511d71ae5a4SJacob Faibussowitsch {
15124afc71dfSHong Zhang   Mat_SeqSBAIJ *aij = (Mat_SeqSBAIJ *)mat->data;
1513d0f46423SBarry Smith   PetscInt      nz  = aij->i[mat->rmap->N] * mat->rmap->bs * aij->bs2;
151449b5e25fSSatish Balay 
151549b5e25fSSatish Balay   PetscFunctionBegin;
151608401ef6SPierre Jolivet   PetscCheck(aij->nonew == 1, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
151728b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
151849b5e25fSSatish Balay 
151949b5e25fSSatish Balay   /* copy values over */
15209566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
15213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
152249b5e25fSSatish Balay }
152349b5e25fSSatish Balay 
1524d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSeqSBAIJSetPreallocation_SeqSBAIJ(Mat B, PetscInt bs, PetscInt nz, PetscInt *nnz)
1525d71ae5a4SJacob Faibussowitsch {
1526c464158bSHong Zhang   Mat_SeqSBAIJ *b = (Mat_SeqSBAIJ *)B->data;
15274dcd73b1SHong Zhang   PetscInt      i, mbs, nbs, bs2;
15282576faa2SJed Brown   PetscBool     skipallocation = PETSC_FALSE, flg = PETSC_FALSE, realalloc = PETSC_FALSE;
152949b5e25fSSatish Balay 
153049b5e25fSSatish Balay   PetscFunctionBegin;
15312576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
1532db4efbfdSBarry Smith 
15339566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSize(B, PetscAbs(bs)));
15349566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
15359566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
153608401ef6SPierre Jolivet   PetscCheck(B->rmap->N <= B->cmap->N, PETSC_COMM_SELF, PETSC_ERR_SUP, "SEQSBAIJ matrix cannot have more rows %" PetscInt_FMT " than columns %" PetscInt_FMT, B->rmap->N, B->cmap->N);
15379566063dSJacob Faibussowitsch   PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs));
1538899cda47SBarry Smith 
153921940c7eSstefano_zampini   B->preallocated = PETSC_TRUE;
154021940c7eSstefano_zampini 
1541d0f46423SBarry Smith   mbs = B->rmap->N / bs;
15424dcd73b1SHong Zhang   nbs = B->cmap->n / bs;
154349b5e25fSSatish Balay   bs2 = bs * bs;
154449b5e25fSSatish Balay 
1545aed4548fSBarry Smith   PetscCheck(mbs * bs == B->rmap->N && nbs * bs == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Number rows, cols must be divisible by blocksize");
154649b5e25fSSatish Balay 
1547ab93d7beSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
1548ab93d7beSBarry Smith     skipallocation = PETSC_TRUE;
1549ab93d7beSBarry Smith     nz             = 0;
1550ab93d7beSBarry Smith   }
1551ab93d7beSBarry Smith 
1552435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 3;
155308401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
155449b5e25fSSatish Balay   if (nnz) {
155549b5e25fSSatish Balay     for (i = 0; i < mbs; i++) {
155608401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
155708401ef6SPierre Jolivet       PetscCheck(nnz[i] <= nbs, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than block row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " block rowlength %" PetscInt_FMT, i, nnz[i], nbs);
155849b5e25fSSatish Balay     }
155949b5e25fSSatish Balay   }
156049b5e25fSSatish Balay 
1561db4efbfdSBarry Smith   B->ops->mult             = MatMult_SeqSBAIJ_N;
1562db4efbfdSBarry Smith   B->ops->multadd          = MatMultAdd_SeqSBAIJ_N;
1563db4efbfdSBarry Smith   B->ops->multtranspose    = MatMult_SeqSBAIJ_N;
1564db4efbfdSBarry Smith   B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_N;
156526fbe8dcSKarl Rupp 
15669566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL));
156749b5e25fSSatish Balay   if (!flg) {
156849b5e25fSSatish Balay     switch (bs) {
156949b5e25fSSatish Balay     case 1:
157049b5e25fSSatish Balay       B->ops->mult             = MatMult_SeqSBAIJ_1;
157149b5e25fSSatish Balay       B->ops->multadd          = MatMultAdd_SeqSBAIJ_1;
1572431c96f7SBarry Smith       B->ops->multtranspose    = MatMult_SeqSBAIJ_1;
1573431c96f7SBarry Smith       B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_1;
157449b5e25fSSatish Balay       break;
157549b5e25fSSatish Balay     case 2:
157649b5e25fSSatish Balay       B->ops->mult             = MatMult_SeqSBAIJ_2;
157749b5e25fSSatish Balay       B->ops->multadd          = MatMultAdd_SeqSBAIJ_2;
1578431c96f7SBarry Smith       B->ops->multtranspose    = MatMult_SeqSBAIJ_2;
1579431c96f7SBarry Smith       B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_2;
158049b5e25fSSatish Balay       break;
158149b5e25fSSatish Balay     case 3:
158249b5e25fSSatish Balay       B->ops->mult             = MatMult_SeqSBAIJ_3;
158349b5e25fSSatish Balay       B->ops->multadd          = MatMultAdd_SeqSBAIJ_3;
1584431c96f7SBarry Smith       B->ops->multtranspose    = MatMult_SeqSBAIJ_3;
1585431c96f7SBarry Smith       B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_3;
158649b5e25fSSatish Balay       break;
158749b5e25fSSatish Balay     case 4:
158849b5e25fSSatish Balay       B->ops->mult             = MatMult_SeqSBAIJ_4;
158949b5e25fSSatish Balay       B->ops->multadd          = MatMultAdd_SeqSBAIJ_4;
1590431c96f7SBarry Smith       B->ops->multtranspose    = MatMult_SeqSBAIJ_4;
1591431c96f7SBarry Smith       B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_4;
159249b5e25fSSatish Balay       break;
159349b5e25fSSatish Balay     case 5:
159449b5e25fSSatish Balay       B->ops->mult             = MatMult_SeqSBAIJ_5;
159549b5e25fSSatish Balay       B->ops->multadd          = MatMultAdd_SeqSBAIJ_5;
1596431c96f7SBarry Smith       B->ops->multtranspose    = MatMult_SeqSBAIJ_5;
1597431c96f7SBarry Smith       B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_5;
159849b5e25fSSatish Balay       break;
159949b5e25fSSatish Balay     case 6:
160049b5e25fSSatish Balay       B->ops->mult             = MatMult_SeqSBAIJ_6;
160149b5e25fSSatish Balay       B->ops->multadd          = MatMultAdd_SeqSBAIJ_6;
1602431c96f7SBarry Smith       B->ops->multtranspose    = MatMult_SeqSBAIJ_6;
1603431c96f7SBarry Smith       B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_6;
160449b5e25fSSatish Balay       break;
160549b5e25fSSatish Balay     case 7:
1606de53e5efSHong Zhang       B->ops->mult             = MatMult_SeqSBAIJ_7;
160749b5e25fSSatish Balay       B->ops->multadd          = MatMultAdd_SeqSBAIJ_7;
1608431c96f7SBarry Smith       B->ops->multtranspose    = MatMult_SeqSBAIJ_7;
1609431c96f7SBarry Smith       B->ops->multtransposeadd = MatMultAdd_SeqSBAIJ_7;
161049b5e25fSSatish Balay       break;
161149b5e25fSSatish Balay     }
161249b5e25fSSatish Balay   }
161349b5e25fSSatish Balay 
161449b5e25fSSatish Balay   b->mbs = mbs;
16154dcd73b1SHong Zhang   b->nbs = nbs;
1616ab93d7beSBarry Smith   if (!skipallocation) {
16172ee49352SLisandro Dalcin     if (!b->imax) {
16189566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(mbs, &b->imax, mbs, &b->ilen));
161926fbe8dcSKarl Rupp 
1620c760cd28SBarry Smith       b->free_imax_ilen = PETSC_TRUE;
16212ee49352SLisandro Dalcin     }
162249b5e25fSSatish Balay     if (!nnz) {
1623435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
162449b5e25fSSatish Balay       else if (nz <= 0) nz = 1;
16255d2a9ed1SStefano Zampini       nz = PetscMin(nbs, nz);
162626fbe8dcSKarl Rupp       for (i = 0; i < mbs; i++) b->imax[i] = nz;
16279566063dSJacob Faibussowitsch       PetscCall(PetscIntMultError(nz, mbs, &nz));
162849b5e25fSSatish Balay     } else {
1629c73702f5SBarry Smith       PetscInt64 nz64 = 0;
16309371c9d4SSatish Balay       for (i = 0; i < mbs; i++) {
16319371c9d4SSatish Balay         b->imax[i] = nnz[i];
16329371c9d4SSatish Balay         nz64 += nnz[i];
16339371c9d4SSatish Balay       }
16349566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
163549b5e25fSSatish Balay     }
16362ee49352SLisandro Dalcin     /* b->ilen will count nonzeros in each block row so far. */
163726fbe8dcSKarl Rupp     for (i = 0; i < mbs; i++) b->ilen[i] = 0;
16386c6c5352SBarry Smith     /* nz=(nz+mbs)/2; */ /* total diagonal and superdiagonal nonzero blocks */
163949b5e25fSSatish Balay 
164049b5e25fSSatish Balay     /* allocate the matrix space */
16419566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
16429566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs2 * nz, &b->a, nz, &b->j, B->rmap->N + 1, &b->i));
16439566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(b->a, nz * bs2));
16449566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(b->j, nz));
164526fbe8dcSKarl Rupp 
164649b5e25fSSatish Balay     b->singlemalloc = PETSC_TRUE;
164749b5e25fSSatish Balay 
164849b5e25fSSatish Balay     /* pointer to beginning of each row */
1649e60cf9a0SBarry Smith     b->i[0] = 0;
165026fbe8dcSKarl Rupp     for (i = 1; i < mbs + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
165126fbe8dcSKarl Rupp 
1652e6b907acSBarry Smith     b->free_a  = PETSC_TRUE;
1653e6b907acSBarry Smith     b->free_ij = PETSC_TRUE;
1654e811da20SHong Zhang   } else {
1655e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
1656e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
1657ab93d7beSBarry Smith   }
165849b5e25fSSatish Balay 
165949b5e25fSSatish Balay   b->bs2     = bs2;
16606c6c5352SBarry Smith   b->nz      = 0;
1661b32cb4a7SJed Brown   b->maxnz   = nz;
1662f4259b30SLisandro Dalcin   b->inew    = NULL;
1663f4259b30SLisandro Dalcin   b->jnew    = NULL;
1664f4259b30SLisandro Dalcin   b->anew    = NULL;
1665f4259b30SLisandro Dalcin   b->a2anew  = NULL;
16661a3463dfSHong Zhang   b->permute = PETSC_FALSE;
1667cb7b82ddSBarry Smith 
1668cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
1669cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
16709566063dSJacob Faibussowitsch   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
16713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1672c464158bSHong Zhang }
1673153ea458SHong Zhang 
1674d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ(Mat B, PetscInt bs, const PetscInt ii[], const PetscInt jj[], const PetscScalar V[])
1675d71ae5a4SJacob Faibussowitsch {
16760cd7f59aSBarry Smith   PetscInt     i, j, m, nz, anz, nz_max = 0, *nnz;
1677f4259b30SLisandro Dalcin   PetscScalar *values      = NULL;
167838f409ebSLisandro Dalcin   PetscBool    roworiented = ((Mat_SeqSBAIJ *)B->data)->roworiented;
16790cd7f59aSBarry Smith 
168038f409ebSLisandro Dalcin   PetscFunctionBegin;
168108401ef6SPierre Jolivet   PetscCheck(bs >= 1, PetscObjectComm((PetscObject)B), PETSC_ERR_ARG_OUTOFRANGE, "Invalid block size specified, must be positive but it is %" PetscInt_FMT, bs);
16829566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetBlockSize(B->rmap, bs));
16839566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetBlockSize(B->cmap, bs));
16849566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
16859566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
16869566063dSJacob Faibussowitsch   PetscCall(PetscLayoutGetBlockSize(B->rmap, &bs));
168738f409ebSLisandro Dalcin   m = B->rmap->n / bs;
168838f409ebSLisandro Dalcin 
1689aed4548fSBarry Smith   PetscCheck(!ii[0], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "ii[0] must be 0 but it is %" PetscInt_FMT, ii[0]);
16909566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
169138f409ebSLisandro Dalcin   for (i = 0; i < m; i++) {
169238f409ebSLisandro Dalcin     nz = ii[i + 1] - ii[i];
169308401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
16940cd7f59aSBarry Smith     anz = 0;
16950cd7f59aSBarry Smith     for (j = 0; j < nz; j++) {
16960cd7f59aSBarry Smith       /* count only values on the diagonal or above */
16970cd7f59aSBarry Smith       if (jj[ii[i] + j] >= i) {
16980cd7f59aSBarry Smith         anz = nz - j;
16990cd7f59aSBarry Smith         break;
17000cd7f59aSBarry Smith       }
17010cd7f59aSBarry Smith     }
17020cd7f59aSBarry Smith     nz_max = PetscMax(nz_max, anz);
17030cd7f59aSBarry Smith     nnz[i] = anz;
170438f409ebSLisandro Dalcin   }
17059566063dSJacob Faibussowitsch   PetscCall(MatSeqSBAIJSetPreallocation(B, bs, 0, nnz));
17069566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
170738f409ebSLisandro Dalcin 
170838f409ebSLisandro Dalcin   values = (PetscScalar *)V;
170948a46eb9SPierre Jolivet   if (!values) PetscCall(PetscCalloc1(bs * bs * nz_max, &values));
171038f409ebSLisandro Dalcin   for (i = 0; i < m; i++) {
171138f409ebSLisandro Dalcin     PetscInt        ncols = ii[i + 1] - ii[i];
171238f409ebSLisandro Dalcin     const PetscInt *icols = jj + ii[i];
171338f409ebSLisandro Dalcin     if (!roworiented || bs == 1) {
171438f409ebSLisandro Dalcin       const PetscScalar *svals = values + (V ? (bs * bs * ii[i]) : 0);
17159566063dSJacob Faibussowitsch       PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, ncols, icols, svals, INSERT_VALUES));
171638f409ebSLisandro Dalcin     } else {
171738f409ebSLisandro Dalcin       for (j = 0; j < ncols; j++) {
171838f409ebSLisandro Dalcin         const PetscScalar *svals = values + (V ? (bs * bs * (ii[i] + j)) : 0);
17199566063dSJacob Faibussowitsch         PetscCall(MatSetValuesBlocked_SeqSBAIJ(B, 1, &i, 1, &icols[j], svals, INSERT_VALUES));
172038f409ebSLisandro Dalcin       }
172138f409ebSLisandro Dalcin     }
172238f409ebSLisandro Dalcin   }
17239566063dSJacob Faibussowitsch   if (!V) PetscCall(PetscFree(values));
17249566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
17259566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
17269566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
17273ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
172838f409ebSLisandro Dalcin }
172938f409ebSLisandro Dalcin 
1730db4efbfdSBarry Smith /*
1731db4efbfdSBarry Smith    This is used to set the numeric factorization for both Cholesky and ICC symbolic factorization
1732db4efbfdSBarry Smith */
1733d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetNumericFactorization_inplace(Mat B, PetscBool natural)
1734d71ae5a4SJacob Faibussowitsch {
1735ace3abfcSBarry Smith   PetscBool flg = PETSC_FALSE;
1736db4efbfdSBarry Smith   PetscInt  bs  = B->rmap->bs;
1737db4efbfdSBarry Smith 
1738db4efbfdSBarry Smith   PetscFunctionBegin;
17399566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_no_unroll", &flg, NULL));
1740db4efbfdSBarry Smith   if (flg) bs = 8;
1741db4efbfdSBarry Smith 
1742db4efbfdSBarry Smith   if (!natural) {
1743db4efbfdSBarry Smith     switch (bs) {
1744d71ae5a4SJacob Faibussowitsch     case 1:
1745d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_inplace;
1746d71ae5a4SJacob Faibussowitsch       break;
1747d71ae5a4SJacob Faibussowitsch     case 2:
1748d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2;
1749d71ae5a4SJacob Faibussowitsch       break;
1750d71ae5a4SJacob Faibussowitsch     case 3:
1751d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3;
1752d71ae5a4SJacob Faibussowitsch       break;
1753d71ae5a4SJacob Faibussowitsch     case 4:
1754d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4;
1755d71ae5a4SJacob Faibussowitsch       break;
1756d71ae5a4SJacob Faibussowitsch     case 5:
1757d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5;
1758d71ae5a4SJacob Faibussowitsch       break;
1759d71ae5a4SJacob Faibussowitsch     case 6:
1760d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6;
1761d71ae5a4SJacob Faibussowitsch       break;
1762d71ae5a4SJacob Faibussowitsch     case 7:
1763d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7;
1764d71ae5a4SJacob Faibussowitsch       break;
1765d71ae5a4SJacob Faibussowitsch     default:
1766d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N;
1767d71ae5a4SJacob Faibussowitsch       break;
1768db4efbfdSBarry Smith     }
1769db4efbfdSBarry Smith   } else {
1770db4efbfdSBarry Smith     switch (bs) {
1771d71ae5a4SJacob Faibussowitsch     case 1:
1772d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace;
1773d71ae5a4SJacob Faibussowitsch       break;
1774d71ae5a4SJacob Faibussowitsch     case 2:
1775d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_2_NaturalOrdering;
1776d71ae5a4SJacob Faibussowitsch       break;
1777d71ae5a4SJacob Faibussowitsch     case 3:
1778d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_3_NaturalOrdering;
1779d71ae5a4SJacob Faibussowitsch       break;
1780d71ae5a4SJacob Faibussowitsch     case 4:
1781d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_4_NaturalOrdering;
1782d71ae5a4SJacob Faibussowitsch       break;
1783d71ae5a4SJacob Faibussowitsch     case 5:
1784d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_5_NaturalOrdering;
1785d71ae5a4SJacob Faibussowitsch       break;
1786d71ae5a4SJacob Faibussowitsch     case 6:
1787d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_6_NaturalOrdering;
1788d71ae5a4SJacob Faibussowitsch       break;
1789d71ae5a4SJacob Faibussowitsch     case 7:
1790d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_7_NaturalOrdering;
1791d71ae5a4SJacob Faibussowitsch       break;
1792d71ae5a4SJacob Faibussowitsch     default:
1793d71ae5a4SJacob Faibussowitsch       B->ops->choleskyfactornumeric = MatCholeskyFactorNumeric_SeqSBAIJ_N_NaturalOrdering;
1794d71ae5a4SJacob Faibussowitsch       break;
1795db4efbfdSBarry Smith     }
1796db4efbfdSBarry Smith   }
17973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1798db4efbfdSBarry Smith }
1799db4efbfdSBarry Smith 
1800cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqAIJ(Mat, MatType, MatReuse, Mat *);
1801cc2e6a90SBarry Smith PETSC_INTERN PetscErrorCode MatConvert_SeqSBAIJ_SeqBAIJ(Mat, MatType, MatReuse, Mat *);
1802d71ae5a4SJacob Faibussowitsch static PetscErrorCode       MatFactorGetSolverType_petsc(Mat A, MatSolverType *type)
1803d71ae5a4SJacob Faibussowitsch {
18044ac6704cSBarry Smith   PetscFunctionBegin;
18054ac6704cSBarry Smith   *type = MATSOLVERPETSC;
18063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18074ac6704cSBarry Smith }
1808d769727bSBarry Smith 
1809d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatGetFactor_seqsbaij_petsc(Mat A, MatFactorType ftype, Mat *B)
1810d71ae5a4SJacob Faibussowitsch {
1811d0f46423SBarry Smith   PetscInt n = A->rmap->n;
18125c9eb25fSBarry Smith 
18135c9eb25fSBarry Smith   PetscFunctionBegin;
18140e92d65fSHong Zhang #if defined(PETSC_USE_COMPLEX)
1815b94d7dedSBarry Smith   PetscCheck(A->hermitian != PETSC_BOOL3_TRUE || A->symmetric == PETSC_BOOL3_TRUE || (ftype != MAT_FACTOR_CHOLESKY && ftype != MAT_FACTOR_ICC), PETSC_COMM_SELF, PETSC_ERR_SUP, "Hermitian CHOLESKY or ICC Factor is not supported");
18160e92d65fSHong Zhang #endif
1817eb1ec7c1SStefano Zampini 
18189566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
18199566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, n, n, n, n));
18205c9eb25fSBarry Smith   if (ftype == MAT_FACTOR_CHOLESKY || ftype == MAT_FACTOR_ICC) {
18219566063dSJacob Faibussowitsch     PetscCall(MatSetType(*B, MATSEQSBAIJ));
18229566063dSJacob Faibussowitsch     PetscCall(MatSeqSBAIJSetPreallocation(*B, A->rmap->bs, MAT_SKIP_ALLOCATION, NULL));
182326fbe8dcSKarl Rupp 
18247b056e98SHong Zhang     (*B)->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_SeqSBAIJ;
1825c6d0d4f0SHong Zhang     (*B)->ops->iccfactorsymbolic      = MatICCFactorSymbolic_SeqSBAIJ;
18269566063dSJacob Faibussowitsch     PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_CHOLESKY]));
18279566063dSJacob Faibussowitsch     PetscCall(PetscStrallocpy(MATORDERINGNATURAL, (char **)&(*B)->preferredordering[MAT_FACTOR_ICC]));
1828e32f2f54SBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "Factor type not supported");
182900c67f3bSHong Zhang 
1830d5f3da31SBarry Smith   (*B)->factortype     = ftype;
1831f73b0415SBarry Smith   (*B)->canuseordering = PETSC_TRUE;
18329566063dSJacob Faibussowitsch   PetscCall(PetscFree((*B)->solvertype));
18339566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &(*B)->solvertype));
18349566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)*B, "MatFactorGetSolverType_C", MatFactorGetSolverType_petsc));
18353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18365c9eb25fSBarry Smith }
18375c9eb25fSBarry Smith 
18388397e458SBarry Smith /*@C
183911a5261eSBarry Smith    MatSeqSBAIJGetArray - gives access to the array where the data for a `MATSEQSBAIJ` matrix is stored
18408397e458SBarry Smith 
18418397e458SBarry Smith    Not Collective
18428397e458SBarry Smith 
18438397e458SBarry Smith    Input Parameter:
184411a5261eSBarry Smith .  mat - a `MATSEQSBAIJ` matrix
18458397e458SBarry Smith 
18468397e458SBarry Smith    Output Parameter:
18478397e458SBarry Smith .   array - pointer to the data
18488397e458SBarry Smith 
18498397e458SBarry Smith    Level: intermediate
18508397e458SBarry Smith 
185111a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatSeqSBAIJRestoreArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()`
18528397e458SBarry Smith @*/
1853d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJGetArray(Mat A, PetscScalar **array)
1854d71ae5a4SJacob Faibussowitsch {
18558397e458SBarry Smith   PetscFunctionBegin;
1856cac4c232SBarry Smith   PetscUseMethod(A, "MatSeqSBAIJGetArray_C", (Mat, PetscScalar **), (A, array));
18573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18588397e458SBarry Smith }
18598397e458SBarry Smith 
18608397e458SBarry Smith /*@C
186111a5261eSBarry Smith    MatSeqSBAIJRestoreArray - returns access to the array where the data for a `MATSEQSBAIJ` matrix is stored obtained by `MatSeqSBAIJGetArray()`
18628397e458SBarry Smith 
18638397e458SBarry Smith    Not Collective
18648397e458SBarry Smith 
18658397e458SBarry Smith    Input Parameters:
1866a2b725a8SWilliam Gropp +  mat - a MATSEQSBAIJ matrix
1867a2b725a8SWilliam Gropp -  array - pointer to the data
18688397e458SBarry Smith 
18698397e458SBarry Smith    Level: intermediate
18708397e458SBarry Smith 
187111a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatSeqSBAIJGetArray()`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArray()`
18728397e458SBarry Smith @*/
1873d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJRestoreArray(Mat A, PetscScalar **array)
1874d71ae5a4SJacob Faibussowitsch {
18758397e458SBarry Smith   PetscFunctionBegin;
1876cac4c232SBarry Smith   PetscUseMethod(A, "MatSeqSBAIJRestoreArray_C", (Mat, PetscScalar **), (A, array));
18773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18788397e458SBarry Smith }
18798397e458SBarry Smith 
18800bad9183SKris Buschelman /*MC
1881fafad747SKris Buschelman   MATSEQSBAIJ - MATSEQSBAIJ = "seqsbaij" - A matrix type to be used for sequential symmetric block sparse matrices,
18820bad9183SKris Buschelman   based on block compressed sparse row format.  Only the upper triangular portion of the matrix is stored.
18830bad9183SKris Buschelman 
1884828413b8SBarry Smith   For complex numbers by default this matrix is symmetric, NOT Hermitian symmetric. To make it Hermitian symmetric you
188511a5261eSBarry Smith   can call `MatSetOption`(`Mat`, `MAT_HERMITIAN`).
1886828413b8SBarry Smith 
18870bad9183SKris Buschelman   Options Database Keys:
188811a5261eSBarry Smith   . -mat_type seqsbaij - sets the matrix type to "seqsbaij" during a call to `MatSetFromOptions()`
18890bad9183SKris Buschelman 
189095452b02SPatrick Sanan   Notes:
189195452b02SPatrick Sanan     By default if you insert values into the lower triangular part of the matrix they are simply ignored (since they are not
189211a5261eSBarry Smith      stored and it is assumed they symmetric to the upper triangular). If you call `MatSetOption`(`Mat`,`MAT_IGNORE_LOWER_TRIANGULAR`,`PETSC_FALSE`) or use
189371dad5bbSBarry Smith      the options database -mat_ignore_lower_triangular false it will generate an error if you try to set a value in the lower triangular portion.
189471dad5bbSBarry Smith 
1895476417e5SBarry Smith     The number of rows in the matrix must be less than or equal to the number of columns
189671dad5bbSBarry Smith 
18970bad9183SKris Buschelman   Level: beginner
18980bad9183SKris Buschelman 
189911a5261eSBarry Smith   .seealso: `MATSEQSBAIJ`, `MatCreateSeqSBAIJ()`, `MatType`, `MATMPISBAIJ`
19000bad9183SKris Buschelman M*/
1901d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqSBAIJ(Mat B)
1902d71ae5a4SJacob Faibussowitsch {
1903a23d5eceSKris Buschelman   Mat_SeqSBAIJ *b;
190413f74950SBarry Smith   PetscMPIInt   size;
1905ace3abfcSBarry Smith   PetscBool     no_unroll = PETSC_FALSE, no_inode = PETSC_FALSE;
1906a23d5eceSKris Buschelman 
1907a23d5eceSKris Buschelman   PetscFunctionBegin;
19089566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
190908401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Comm must be of size 1");
1910a23d5eceSKris Buschelman 
19114dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
1912a23d5eceSKris Buschelman   B->data = (void *)b;
19139566063dSJacob Faibussowitsch   PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps)));
191426fbe8dcSKarl Rupp 
1915a23d5eceSKris Buschelman   B->ops->destroy    = MatDestroy_SeqSBAIJ;
1916a23d5eceSKris Buschelman   B->ops->view       = MatView_SeqSBAIJ;
1917f4259b30SLisandro Dalcin   b->row             = NULL;
1918f4259b30SLisandro Dalcin   b->icol            = NULL;
1919a23d5eceSKris Buschelman   b->reallocs        = 0;
1920f4259b30SLisandro Dalcin   b->saved_values    = NULL;
19210def2e27SBarry Smith   b->inode.limit     = 5;
19220def2e27SBarry Smith   b->inode.max_limit = 5;
1923a23d5eceSKris Buschelman 
1924a23d5eceSKris Buschelman   b->roworiented        = PETSC_TRUE;
1925a23d5eceSKris Buschelman   b->nonew              = 0;
1926f4259b30SLisandro Dalcin   b->diag               = NULL;
1927f4259b30SLisandro Dalcin   b->solve_work         = NULL;
1928f4259b30SLisandro Dalcin   b->mult_work          = NULL;
1929f4259b30SLisandro Dalcin   B->spptr              = NULL;
1930f2cbd3d5SJed Brown   B->info.nz_unneeded   = (PetscReal)b->maxnz * b->bs2;
1931a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
1932a23d5eceSKris Buschelman 
1933f4259b30SLisandro Dalcin   b->inew    = NULL;
1934f4259b30SLisandro Dalcin   b->jnew    = NULL;
1935f4259b30SLisandro Dalcin   b->anew    = NULL;
1936f4259b30SLisandro Dalcin   b->a2anew  = NULL;
1937a23d5eceSKris Buschelman   b->permute = PETSC_FALSE;
1938a23d5eceSKris Buschelman 
193971dad5bbSBarry Smith   b->ignore_ltriangular = PETSC_TRUE;
194026fbe8dcSKarl Rupp 
19419566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_ignore_lower_triangular", &b->ignore_ltriangular, NULL));
1942941593c8SHong Zhang 
1943f5edf698SHong Zhang   b->getrow_utriangular = PETSC_FALSE;
194426fbe8dcSKarl Rupp 
19459566063dSJacob Faibussowitsch   PetscCall(PetscOptionsGetBool(((PetscObject)B)->options, ((PetscObject)B)->prefix, "-mat_getrow_uppertriangular", &b->getrow_utriangular, NULL));
1946f5edf698SHong Zhang 
19479566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJGetArray_C", MatSeqSBAIJGetArray_SeqSBAIJ));
19489566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJRestoreArray_C", MatSeqSBAIJRestoreArray_SeqSBAIJ));
19499566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqSBAIJ));
19509566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqSBAIJ));
19519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetColumnIndices_C", MatSeqSBAIJSetColumnIndices_SeqSBAIJ));
19529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqaij_C", MatConvert_SeqSBAIJ_SeqAIJ));
19539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_seqbaij_C", MatConvert_SeqSBAIJ_SeqBAIJ));
19549566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocation_C", MatSeqSBAIJSetPreallocation_SeqSBAIJ));
19559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqSBAIJSetPreallocationCSR_C", MatSeqSBAIJSetPreallocationCSR_SeqSBAIJ));
19566214f412SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
19579566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_elemental_C", MatConvert_SeqSBAIJ_Elemental));
19586214f412SHong Zhang #endif
1959d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
19609566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqsbaij_scalapack_C", MatConvert_SBAIJ_ScaLAPACK));
1961d24d4204SJose E. Roman #endif
196223ce1328SBarry Smith 
1963b94d7dedSBarry Smith   B->symmetry_eternal            = PETSC_TRUE;
1964b94d7dedSBarry Smith   B->structural_symmetry_eternal = PETSC_TRUE;
1965b94d7dedSBarry Smith   B->symmetric                   = PETSC_BOOL3_TRUE;
1966b94d7dedSBarry Smith   B->structurally_symmetric      = PETSC_BOOL3_TRUE;
1967eb1ec7c1SStefano Zampini #if defined(PETSC_USE_COMPLEX)
1968b94d7dedSBarry Smith   B->hermitian = PETSC_BOOL3_FALSE;
1969eb1ec7c1SStefano Zampini #else
1970b94d7dedSBarry Smith   B->hermitian = PETSC_BOOL3_TRUE;
1971eb1ec7c1SStefano Zampini #endif
197213647f61SHong Zhang 
19739566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQSBAIJ));
19740def2e27SBarry Smith 
1975d0609cedSBarry Smith   PetscOptionsBegin(PetscObjectComm((PetscObject)B), ((PetscObject)B)->prefix, "Options for SEQSBAIJ matrix", "Mat");
19769566063dSJacob Faibussowitsch   PetscCall(PetscOptionsBool("-mat_no_unroll", "Do not optimize for inodes (slower)", NULL, no_unroll, &no_unroll, NULL));
197748a46eb9SPierre Jolivet   if (no_unroll) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_unroll\n"));
19789566063dSJacob Faibussowitsch   PetscCall(PetscOptionsBool("-mat_no_inode", "Do not optimize for inodes (slower)", NULL, no_inode, &no_inode, NULL));
19799566063dSJacob Faibussowitsch   if (no_inode) PetscCall(PetscInfo(B, "Not using Inode routines due to -mat_no_inode\n"));
19809566063dSJacob Faibussowitsch   PetscCall(PetscOptionsInt("-mat_inode_limit", "Do not use inodes larger then this value", NULL, b->inode.limit, &b->inode.limit, NULL));
1981d0609cedSBarry Smith   PetscOptionsEnd();
1982ace3abfcSBarry Smith   b->inode.use = (PetscBool)(!(no_unroll || no_inode));
19830def2e27SBarry Smith   if (b->inode.limit > b->inode.max_limit) b->inode.limit = b->inode.max_limit;
19843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1985a23d5eceSKris Buschelman }
1986a23d5eceSKris Buschelman 
1987a23d5eceSKris Buschelman /*@C
1988a23d5eceSKris Buschelman    MatSeqSBAIJSetPreallocation - Creates a sparse symmetric matrix in block AIJ (block
198911a5261eSBarry Smith    compressed row) `MATSEQSBAIJ` format.  For good matrix assembly performance the
1990a23d5eceSKris Buschelman    user should preallocate the matrix storage by setting the parameter nz
1991a23d5eceSKris Buschelman    (or the array nnz).  By setting these parameters accurately, performance
1992a23d5eceSKris Buschelman    during matrix assembly can be increased by more than a factor of 50.
1993a23d5eceSKris Buschelman 
1994c3339decSBarry Smith    Collective
1995a23d5eceSKris Buschelman 
1996a23d5eceSKris Buschelman    Input Parameters:
19971c4f3114SJed Brown +  B - the symmetric matrix
199811a5261eSBarry Smith .  bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row
199911a5261eSBarry Smith           blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with `MatCreateVecs()`
2000a23d5eceSKris Buschelman .  nz - number of block nonzeros per block row (same for all rows)
2001a23d5eceSKris Buschelman -  nnz - array containing the number of block nonzeros in the upper triangular plus
20020298fd71SBarry Smith          diagonal portion of each block (possibly different for each block row) or NULL
2003a23d5eceSKris Buschelman 
2004a23d5eceSKris Buschelman    Options Database Keys:
2005a2b725a8SWilliam Gropp +   -mat_no_unroll - uses code that does not unroll the loops in the
2006a23d5eceSKris Buschelman                      block calculations (much slower)
2007a2b725a8SWilliam Gropp -   -mat_block_size - size of the blocks to use (only works if a negative bs is passed in
2008a23d5eceSKris Buschelman 
2009a23d5eceSKris Buschelman    Level: intermediate
2010a23d5eceSKris Buschelman 
2011a23d5eceSKris Buschelman    Notes:
2012a23d5eceSKris Buschelman    Specify the preallocated storage with either nz or nnz (not both).
201311a5261eSBarry Smith    Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory
2014651615e1SBarry Smith    allocation.  See [Sparse Matrices](sec_matsparse) for details.
2015a23d5eceSKris Buschelman 
201611a5261eSBarry Smith    You can call `MatGetInfo()` to get information on how effective the preallocation was;
2017aa95bbe8SBarry Smith    for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
2018aa95bbe8SBarry Smith    You can also run with the option -info and look for messages with the string
2019aa95bbe8SBarry Smith    malloc in them to see if additional memory allocation was needed.
2020aa95bbe8SBarry Smith 
202149a6f317SBarry Smith    If the nnz parameter is given then the nz parameter is ignored
202249a6f317SBarry Smith 
2023651615e1SBarry Smith .seealso: [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()`
2024a23d5eceSKris Buschelman @*/
2025d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocation(Mat B, PetscInt bs, PetscInt nz, const PetscInt nnz[])
2026d71ae5a4SJacob Faibussowitsch {
2027a23d5eceSKris Buschelman   PetscFunctionBegin;
20286ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
20296ba663aaSJed Brown   PetscValidType(B, 1);
20306ba663aaSJed Brown   PetscValidLogicalCollectiveInt(B, bs, 2);
2031cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqSBAIJSetPreallocation_C", (Mat, PetscInt, PetscInt, const PetscInt[]), (B, bs, nz, nnz));
20323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2033a23d5eceSKris Buschelman }
203449b5e25fSSatish Balay 
203538f409ebSLisandro Dalcin /*@C
203611a5261eSBarry Smith    MatSeqSBAIJSetPreallocationCSR - Creates a sparse parallel matrix in `MATSEQSBAIJ` format using the given nonzero structure and (optional) numerical values
203738f409ebSLisandro Dalcin 
203838f409ebSLisandro Dalcin    Input Parameters:
20391c4f3114SJed Brown +  B - the matrix
2040eab78319SHong Zhang .  bs - size of block, the blocks are ALWAYS square.
204138f409ebSLisandro Dalcin .  i - the indices into j for the start of each local row (starts with zero)
204238f409ebSLisandro Dalcin .  j - the column indices for each local row (starts with zero) these must be sorted for each row
204338f409ebSLisandro Dalcin -  v - optional values in the matrix
204438f409ebSLisandro Dalcin 
2045664954b6SBarry Smith    Level: advanced
204638f409ebSLisandro Dalcin 
204738f409ebSLisandro Dalcin    Notes:
204811a5261eSBarry Smith    The order of the entries in values is specified by the `MatOption` `MAT_ROW_ORIENTED`.  For example, C programs
204911a5261eSBarry Smith    may want to use the default `MAT_ROW_ORIENTED` = `PETSC_TRUE` and use an array v[nnz][bs][bs] where the second index is
205038f409ebSLisandro Dalcin    over rows within a block and the last index is over columns within a block row.  Fortran programs will likely set
205111a5261eSBarry Smith    `MAT_ROW_ORIENTED` = `PETSC_FALSE` and use a Fortran array v(bs,bs,nnz) in which the first index is over rows within a
205238f409ebSLisandro Dalcin    block column and the second index is over columns within a block.
205338f409ebSLisandro Dalcin 
205450c5228eSBarry Smith    Any entries below the diagonal are ignored
20550cd7f59aSBarry Smith 
20560cd7f59aSBarry Smith    Though this routine has Preallocation() in the name it also sets the exact nonzero locations of the matrix entries
20570cd7f59aSBarry Smith    and usually the numerical values as well
2058664954b6SBarry Smith 
205911a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqSBAIJ()`, `MatSetValuesBlocked()`, `MatSeqSBAIJSetPreallocation()`, `MATSEQSBAIJ`
206038f409ebSLisandro Dalcin @*/
2061d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqSBAIJSetPreallocationCSR(Mat B, PetscInt bs, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
2062d71ae5a4SJacob Faibussowitsch {
206338f409ebSLisandro Dalcin   PetscFunctionBegin;
206438f409ebSLisandro Dalcin   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
206538f409ebSLisandro Dalcin   PetscValidType(B, 1);
206638f409ebSLisandro Dalcin   PetscValidLogicalCollectiveInt(B, bs, 2);
2067cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqSBAIJSetPreallocationCSR_C", (Mat, PetscInt, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, bs, i, j, v));
20683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
206938f409ebSLisandro Dalcin }
207038f409ebSLisandro Dalcin 
2071c464158bSHong Zhang /*@C
2072c464158bSHong Zhang    MatCreateSeqSBAIJ - Creates a sparse symmetric matrix in block AIJ (block
207311a5261eSBarry Smith    compressed row) `MATSEQSBAIJ` format.  For good matrix assembly performance the
2074c464158bSHong Zhang    user should preallocate the matrix storage by setting the parameter nz
2075c464158bSHong Zhang    (or the array nnz).  By setting these parameters accurately, performance
2076c464158bSHong Zhang    during matrix assembly can be increased by more than a factor of 50.
207749b5e25fSSatish Balay 
2078d083f849SBarry Smith    Collective
2079c464158bSHong Zhang 
2080c464158bSHong Zhang    Input Parameters:
208111a5261eSBarry Smith +  comm - MPI communicator, set to `PETSC_COMM_SELF`
208211a5261eSBarry Smith .  bs - size of block, the blocks are ALWAYS square. One can use `MatSetBlockSizes()` to set a different row and column blocksize but the row
2083bb7ae925SBarry Smith           blocksize always defines the size of the blocks. The column blocksize sets the blocksize of the vectors obtained with MatCreateVecs()
2084c464158bSHong Zhang .  m - number of rows, or number of columns
2085c464158bSHong Zhang .  nz - number of block nonzeros per block row (same for all rows)
2086744e8345SSatish Balay -  nnz - array containing the number of block nonzeros in the upper triangular plus
20870298fd71SBarry Smith          diagonal portion of each block (possibly different for each block row) or NULL
2088c464158bSHong Zhang 
2089c464158bSHong Zhang    Output Parameter:
2090c464158bSHong Zhang .  A - the symmetric matrix
2091c464158bSHong Zhang 
2092c464158bSHong Zhang    Options Database Keys:
2093a2b725a8SWilliam Gropp +   -mat_no_unroll - uses code that does not unroll the loops in the
2094c464158bSHong Zhang                      block calculations (much slower)
2095a2b725a8SWilliam Gropp -   -mat_block_size - size of the blocks to use
2096c464158bSHong Zhang 
2097c464158bSHong Zhang    Level: intermediate
2098c464158bSHong Zhang 
209911a5261eSBarry Smith    It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`,
2100f6f02116SRichard Tran Mills    MatXXXXSetPreallocation() paradigm instead of this routine directly.
210111a5261eSBarry Smith    [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`]
2102175b88e8SBarry Smith 
2103c464158bSHong Zhang    Notes:
21046d6d819aSHong Zhang    The number of rows and columns must be divisible by blocksize.
21056d6d819aSHong Zhang    This matrix type does not support complex Hermitian operation.
2106c464158bSHong Zhang 
2107c464158bSHong Zhang    Specify the preallocated storage with either nz or nnz (not both).
210811a5261eSBarry Smith    Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory
2109651615e1SBarry Smith    allocation.  See [Sparse Matrices](sec_matsparse) for details.
2110c464158bSHong Zhang 
211149a6f317SBarry Smith    If the nnz parameter is given then the nz parameter is ignored
211249a6f317SBarry Smith 
2113651615e1SBarry Smith .seealso: [Sparse Matrices](sec_matsparse), `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatCreateSBAIJ()`
2114c464158bSHong Zhang @*/
2115d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJ(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
2116d71ae5a4SJacob Faibussowitsch {
2117c464158bSHong Zhang   PetscFunctionBegin;
21189566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
21199566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
21209566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQSBAIJ));
21219566063dSJacob Faibussowitsch   PetscCall(MatSeqSBAIJSetPreallocation(*A, bs, nz, (PetscInt *)nnz));
21223ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
212349b5e25fSSatish Balay }
212449b5e25fSSatish Balay 
2125d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqSBAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
2126d71ae5a4SJacob Faibussowitsch {
212749b5e25fSSatish Balay   Mat           C;
212849b5e25fSSatish Balay   Mat_SeqSBAIJ *c, *a  = (Mat_SeqSBAIJ *)A->data;
2129b40805acSSatish Balay   PetscInt      i, mbs = a->mbs, nz = a->nz, bs2 = a->bs2;
213049b5e25fSSatish Balay 
213149b5e25fSSatish Balay   PetscFunctionBegin;
213208401ef6SPierre Jolivet   PetscCheck(a->i[mbs] == nz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Corrupt matrix");
213349b5e25fSSatish Balay 
2134f4259b30SLisandro Dalcin   *B = NULL;
21359566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
21369566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, A->rmap->N, A->cmap->n, A->rmap->N, A->cmap->n));
21379566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, A));
21389566063dSJacob Faibussowitsch   PetscCall(MatSetType(C, MATSEQSBAIJ));
2139692f9cbeSHong Zhang   c = (Mat_SeqSBAIJ *)C->data;
2140692f9cbeSHong Zhang 
2141273d9f13SBarry Smith   C->preallocated       = PETSC_TRUE;
2142d5f3da31SBarry Smith   C->factortype         = A->factortype;
2143f4259b30SLisandro Dalcin   c->row                = NULL;
2144f4259b30SLisandro Dalcin   c->icol               = NULL;
2145f4259b30SLisandro Dalcin   c->saved_values       = NULL;
2146a9817697SBarry Smith   c->keepnonzeropattern = a->keepnonzeropattern;
214749b5e25fSSatish Balay   C->assembled          = PETSC_TRUE;
214849b5e25fSSatish Balay 
21499566063dSJacob Faibussowitsch   PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
21509566063dSJacob Faibussowitsch   PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
215149b5e25fSSatish Balay   c->bs2 = a->bs2;
215249b5e25fSSatish Balay   c->mbs = a->mbs;
215349b5e25fSSatish Balay   c->nbs = a->nbs;
215449b5e25fSSatish Balay 
2155c760cd28SBarry Smith   if (cpvalues == MAT_SHARE_NONZERO_PATTERN) {
2156c760cd28SBarry Smith     c->imax           = a->imax;
2157c760cd28SBarry Smith     c->ilen           = a->ilen;
2158c760cd28SBarry Smith     c->free_imax_ilen = PETSC_FALSE;
2159c760cd28SBarry Smith   } else {
21609566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2((mbs + 1), &c->imax, (mbs + 1), &c->ilen));
216149b5e25fSSatish Balay     for (i = 0; i < mbs; i++) {
216249b5e25fSSatish Balay       c->imax[i] = a->imax[i];
216349b5e25fSSatish Balay       c->ilen[i] = a->ilen[i];
216449b5e25fSSatish Balay     }
2165c760cd28SBarry Smith     c->free_imax_ilen = PETSC_TRUE;
2166c760cd28SBarry Smith   }
216749b5e25fSSatish Balay 
216849b5e25fSSatish Balay   /* allocate the matrix space */
21694da8f245SBarry Smith   if (cpvalues == MAT_SHARE_NONZERO_PATTERN) {
21709566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(bs2 * nz, &c->a));
217144e1c64aSLisandro Dalcin     c->i            = a->i;
217244e1c64aSLisandro Dalcin     c->j            = a->j;
21734da8f245SBarry Smith     c->singlemalloc = PETSC_FALSE;
217444e1c64aSLisandro Dalcin     c->free_a       = PETSC_TRUE;
21754da8f245SBarry Smith     c->free_ij      = PETSC_FALSE;
21764da8f245SBarry Smith     c->parent       = A;
21779566063dSJacob Faibussowitsch     PetscCall(PetscObjectReference((PetscObject)A));
21789566063dSJacob Faibussowitsch     PetscCall(MatSetOption(A, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
21799566063dSJacob Faibussowitsch     PetscCall(MatSetOption(C, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
21804da8f245SBarry Smith   } else {
21819566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs2 * nz, &c->a, nz, &c->j, mbs + 1, &c->i));
21829566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(c->i, a->i, mbs + 1));
21834da8f245SBarry Smith     c->singlemalloc = PETSC_TRUE;
218444e1c64aSLisandro Dalcin     c->free_a       = PETSC_TRUE;
21854da8f245SBarry Smith     c->free_ij      = PETSC_TRUE;
21864da8f245SBarry Smith   }
218749b5e25fSSatish Balay   if (mbs > 0) {
218848a46eb9SPierre Jolivet     if (cpvalues != MAT_SHARE_NONZERO_PATTERN) PetscCall(PetscArraycpy(c->j, a->j, nz));
218949b5e25fSSatish Balay     if (cpvalues == MAT_COPY_VALUES) {
21909566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->a, a->a, bs2 * nz));
219149b5e25fSSatish Balay     } else {
21929566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->a, bs2 * nz));
219349b5e25fSSatish Balay     }
2194a1c3900fSBarry Smith     if (a->jshort) {
219544e1c64aSLisandro Dalcin       /* cannot share jshort, it is reallocated in MatAssemblyEnd_SeqSBAIJ() */
219644e1c64aSLisandro Dalcin       /* if the parent matrix is reassembled, this child matrix will never notice */
21979566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz, &c->jshort));
21989566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->jshort, a->jshort, nz));
219926fbe8dcSKarl Rupp 
22004da8f245SBarry Smith       c->free_jshort = PETSC_TRUE;
22014da8f245SBarry Smith     }
2202a1c3900fSBarry Smith   }
220349b5e25fSSatish Balay 
220449b5e25fSSatish Balay   c->roworiented = a->roworiented;
220549b5e25fSSatish Balay   c->nonew       = a->nonew;
220649b5e25fSSatish Balay 
220749b5e25fSSatish Balay   if (a->diag) {
2208c760cd28SBarry Smith     if (cpvalues == MAT_SHARE_NONZERO_PATTERN) {
2209c760cd28SBarry Smith       c->diag      = a->diag;
2210c760cd28SBarry Smith       c->free_diag = PETSC_FALSE;
2211c760cd28SBarry Smith     } else {
22129566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(mbs, &c->diag));
221326fbe8dcSKarl Rupp       for (i = 0; i < mbs; i++) c->diag[i] = a->diag[i];
2214c760cd28SBarry Smith       c->free_diag = PETSC_TRUE;
2215c760cd28SBarry Smith     }
221644e1c64aSLisandro Dalcin   }
22176c6c5352SBarry Smith   c->nz         = a->nz;
2218f2cbd3d5SJed Brown   c->maxnz      = a->nz; /* Since we allocate exactly the right amount */
2219f4259b30SLisandro Dalcin   c->solve_work = NULL;
2220f4259b30SLisandro Dalcin   c->mult_work  = NULL;
222126fbe8dcSKarl Rupp 
222249b5e25fSSatish Balay   *B = C;
22239566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
22243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
222549b5e25fSSatish Balay }
222649b5e25fSSatish Balay 
2227618cc2edSLisandro Dalcin /* Used for both SeqBAIJ and SeqSBAIJ matrices */
2228618cc2edSLisandro Dalcin #define MatLoad_SeqSBAIJ_Binary MatLoad_SeqBAIJ_Binary
2229618cc2edSLisandro Dalcin 
2230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqSBAIJ(Mat mat, PetscViewer viewer)
2231d71ae5a4SJacob Faibussowitsch {
22327f489da9SVaclav Hapla   PetscBool isbinary;
22332f480046SShri Abhyankar 
22342f480046SShri Abhyankar   PetscFunctionBegin;
22359566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
223628b400f6SJacob Faibussowitsch   PetscCheck(isbinary, PetscObjectComm((PetscObject)viewer), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)mat)->type_name);
22379566063dSJacob Faibussowitsch   PetscCall(MatLoad_SeqSBAIJ_Binary(mat, viewer));
22383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22392f480046SShri Abhyankar }
22402f480046SShri Abhyankar 
2241c75a6043SHong Zhang /*@
224211a5261eSBarry Smith      MatCreateSeqSBAIJWithArrays - Creates an sequential `MATSEQSBAIJ` matrix using matrix elements
2243c75a6043SHong Zhang               (upper triangular entries in CSR format) provided by the user.
2244c75a6043SHong Zhang 
2245d083f849SBarry Smith      Collective
2246c75a6043SHong Zhang 
2247c75a6043SHong Zhang    Input Parameters:
2248c75a6043SHong Zhang +  comm - must be an MPI communicator of size 1
2249c75a6043SHong Zhang .  bs - size of block
2250c75a6043SHong Zhang .  m - number of rows
2251c75a6043SHong Zhang .  n - number of columns
2252483a2f95SBarry Smith .  i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of block elements in that row block row of the matrix
2253c75a6043SHong Zhang .  j - column indices
2254c75a6043SHong Zhang -  a - matrix values
2255c75a6043SHong Zhang 
2256c75a6043SHong Zhang    Output Parameter:
2257c75a6043SHong Zhang .  mat - the matrix
2258c75a6043SHong Zhang 
2259dfb205c3SBarry Smith    Level: advanced
2260c75a6043SHong Zhang 
2261c75a6043SHong Zhang    Notes:
2262c75a6043SHong Zhang        The i, j, and a arrays are not copied by this routine, the user must free these arrays
2263c75a6043SHong Zhang     once the matrix is destroyed
2264c75a6043SHong Zhang 
2265c75a6043SHong Zhang        You cannot set new nonzero locations into this matrix, that will generate an error.
2266c75a6043SHong Zhang 
2267c75a6043SHong Zhang        The i and j indices are 0 based
2268c75a6043SHong Zhang 
226911a5261eSBarry Smith        When block size is greater than 1 the matrix values must be stored using the SBAIJ storage format (see the SBAIJ source code to determine this). For block size of 1
2270dfb205c3SBarry Smith        it is the regular CSR format excluding the lower triangular elements.
2271dfb205c3SBarry Smith 
227211a5261eSBarry Smith .seealso: `MATSEQSBAIJ`, `MatCreate()`, `MatCreateSBAIJ()`, `MatCreateSeqSBAIJ()`
2273c75a6043SHong Zhang @*/
2274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqSBAIJWithArrays(MPI_Comm comm, PetscInt bs, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
2275d71ae5a4SJacob Faibussowitsch {
2276c75a6043SHong Zhang   PetscInt      ii;
2277c75a6043SHong Zhang   Mat_SeqSBAIJ *sbaij;
2278c75a6043SHong Zhang 
2279c75a6043SHong Zhang   PetscFunctionBegin;
228008401ef6SPierre Jolivet   PetscCheck(bs == 1, PETSC_COMM_SELF, PETSC_ERR_SUP, "block size %" PetscInt_FMT " > 1 is not supported yet", bs);
2281aed4548fSBarry Smith   PetscCheck(m == 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
2282c75a6043SHong Zhang 
22839566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
22849566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
22859566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQSBAIJ));
22869566063dSJacob Faibussowitsch   PetscCall(MatSeqSBAIJSetPreallocation(*mat, bs, MAT_SKIP_ALLOCATION, NULL));
2287c75a6043SHong Zhang   sbaij = (Mat_SeqSBAIJ *)(*mat)->data;
22889566063dSJacob Faibussowitsch   PetscCall(PetscMalloc2(m, &sbaij->imax, m, &sbaij->ilen));
2289c75a6043SHong Zhang 
2290c75a6043SHong Zhang   sbaij->i = i;
2291c75a6043SHong Zhang   sbaij->j = j;
2292c75a6043SHong Zhang   sbaij->a = a;
229326fbe8dcSKarl Rupp 
2294c75a6043SHong Zhang   sbaij->singlemalloc   = PETSC_FALSE;
2295c75a6043SHong Zhang   sbaij->nonew          = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
2296e6b907acSBarry Smith   sbaij->free_a         = PETSC_FALSE;
2297e6b907acSBarry Smith   sbaij->free_ij        = PETSC_FALSE;
2298ddf7884eSMatthew Knepley   sbaij->free_imax_ilen = PETSC_TRUE;
2299c75a6043SHong Zhang 
2300c75a6043SHong Zhang   for (ii = 0; ii < m; ii++) {
2301c75a6043SHong Zhang     sbaij->ilen[ii] = sbaij->imax[ii] = i[ii + 1] - i[ii];
23026bdcaf15SBarry Smith     PetscCheck(i[ii + 1] >= i[ii], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
2303c75a6043SHong Zhang   }
230476bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
2305c75a6043SHong Zhang     for (ii = 0; ii < sbaij->i[m]; ii++) {
23066bdcaf15SBarry Smith       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
23076bdcaf15SBarry Smith       PetscCheck(j[ii] < n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index too large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
2308c75a6043SHong Zhang     }
230976bd3646SJed Brown   }
2310c75a6043SHong Zhang 
23119566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
23129566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
23133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2314c75a6043SHong Zhang }
2315d06b337dSHong Zhang 
2316d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqSBAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
2317d71ae5a4SJacob Faibussowitsch {
231859f5e6ceSHong Zhang   PetscFunctionBegin;
23199566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPISBAIJ(comm, inmat, n, scall, outmat));
23203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
232159f5e6ceSHong Zhang }
2322