xref: /petsc/src/mat/impls/aij/seq/aij.c (revision 62e5df077c11d978a6fe24205582b68a66e64d0b)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
1226cec326SBarry Smith #define TYPE AIJ
1326cec326SBarry Smith #define TYPE_BS
1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
1626cec326SBarry Smith #undef TYPE
1726cec326SBarry Smith #undef TYPE_BS
1826cec326SBarry Smith 
19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
20d71ae5a4SJacob Faibussowitsch {
214099cc6bSBarry Smith   PetscBool flg;
224099cc6bSBarry Smith   char      type[256];
234099cc6bSBarry Smith 
244099cc6bSBarry Smith   PetscFunctionBegin;
25d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
269566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
279566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
28d0609cedSBarry Smith   PetscOptionsEnd();
293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
304099cc6bSBarry Smith }
314099cc6bSBarry Smith 
32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
33d71ae5a4SJacob Faibussowitsch {
340716a85fSBarry Smith   PetscInt    i, m, n;
350716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
360716a85fSBarry Smith 
370716a85fSBarry Smith   PetscFunctionBegin;
389566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
399566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
400716a85fSBarry Smith   if (type == NORM_2) {
41ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
420716a85fSBarry Smith   } else if (type == NORM_1) {
43ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
440716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
45ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
46857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
47ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
48857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
49ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
506adde796SStefano Zampini   } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type");
510716a85fSBarry Smith 
520716a85fSBarry Smith   if (type == NORM_2) {
53a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
54857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
55a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
560716a85fSBarry Smith   }
573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
580716a85fSBarry Smith }
590716a85fSBarry Smith 
60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
61d71ae5a4SJacob Faibussowitsch {
623a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
633a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
643a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
653a062f41SBarry Smith   PetscInt       *rows;
663a062f41SBarry Smith 
673a062f41SBarry Smith   PetscFunctionBegin;
683a062f41SBarry Smith   for (i = 0; i < m; i++) {
69ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
703a062f41SBarry Smith   }
719566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
723a062f41SBarry Smith   cnt = 0;
733a062f41SBarry Smith   for (i = 0; i < m; i++) {
743a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
753a062f41SBarry Smith       rows[cnt] = i;
763a062f41SBarry Smith       cnt++;
773a062f41SBarry Smith     }
783a062f41SBarry Smith   }
799566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
813a062f41SBarry Smith }
823a062f41SBarry Smith 
83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
84d71ae5a4SJacob Faibussowitsch {
856ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
86fff043a9SJunchao Zhang   const MatScalar *aa;
876ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
88b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
896ce1633cSBarry Smith   PetscInt        *rows;
906ce1633cSBarry Smith 
916ce1633cSBarry Smith   PetscFunctionBegin;
929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
939566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
946ce1633cSBarry Smith   diag = a->diag;
956ce1633cSBarry Smith   for (i = 0; i < m; i++) {
96ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
976ce1633cSBarry Smith   }
989566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
996ce1633cSBarry Smith   cnt = 0;
1006ce1633cSBarry Smith   for (i = 0; i < m; i++) {
101ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
1026ce1633cSBarry Smith   }
103f1f41ecbSJed Brown   *nrows = cnt;
104f1f41ecbSJed Brown   *zrows = rows;
1059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
107f1f41ecbSJed Brown }
108f1f41ecbSJed Brown 
109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
110d71ae5a4SJacob Faibussowitsch {
111f1f41ecbSJed Brown   PetscInt nrows, *rows;
112f1f41ecbSJed Brown 
113f1f41ecbSJed Brown   PetscFunctionBegin;
1140298fd71SBarry Smith   *zrows = NULL;
1159566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1169566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1186ce1633cSBarry Smith }
1196ce1633cSBarry Smith 
120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
121d71ae5a4SJacob Faibussowitsch {
122b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
123b3a44c85SBarry Smith   const MatScalar *aa;
124b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
125b3a44c85SBarry Smith   const PetscInt  *ii;
126b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
127b3a44c85SBarry Smith 
128b3a44c85SBarry Smith   PetscFunctionBegin;
1299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
130f4259b30SLisandro Dalcin   *keptrows = NULL;
131b3a44c85SBarry Smith   ii        = a->i;
132b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
133b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
134b3a44c85SBarry Smith     if (!n) {
135b3a44c85SBarry Smith       cnt++;
136b3a44c85SBarry Smith       goto ok1;
137b3a44c85SBarry Smith     }
1382e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
139b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
140b3a44c85SBarry Smith     }
141b3a44c85SBarry Smith     cnt++;
142b3a44c85SBarry Smith   ok1:;
143b3a44c85SBarry Smith   }
1442e5835c6SStefano Zampini   if (!cnt) {
1459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1463ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1472e5835c6SStefano Zampini   }
1489566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
149b3a44c85SBarry Smith   cnt = 0;
150b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
151b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
152b3a44c85SBarry Smith     if (!n) continue;
1532e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
154b3a44c85SBarry Smith       if (aa[j] != 0.0) {
155b3a44c85SBarry Smith         rows[cnt++] = i;
156b3a44c85SBarry Smith         break;
157b3a44c85SBarry Smith       }
158b3a44c85SBarry Smith     }
159b3a44c85SBarry Smith   }
1609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1619566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
1623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
163b3a44c85SBarry Smith }
164b3a44c85SBarry Smith 
165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
166d71ae5a4SJacob Faibussowitsch {
16779299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)Y->data;
16899e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16999e65526SBarry Smith   const PetscInt    *diag;
1702e5835c6SStefano Zampini   MatScalar         *aa;
17199e65526SBarry Smith   const PetscScalar *v;
172ace3abfcSBarry Smith   PetscBool          missing;
17379299369SBarry Smith 
17479299369SBarry Smith   PetscFunctionBegin;
17509f38230SBarry Smith   if (Y->assembled) {
1769566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL));
17709f38230SBarry Smith     if (!missing) {
17879299369SBarry Smith       diag = aij->diag;
1799566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1809566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
18179299369SBarry Smith       if (is == INSERT_VALUES) {
182ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
18379299369SBarry Smith       } else {
184ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
18579299369SBarry Smith       }
1869566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1879566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
1883ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
18979299369SBarry Smith     }
1909566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
19109f38230SBarry Smith   }
1929566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
1933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
19409f38230SBarry Smith }
19579299369SBarry Smith 
196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
197d71ae5a4SJacob Faibussowitsch {
198416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19997f1f81fSBarry Smith   PetscInt    i, ishift;
20017ab2063SBarry Smith 
2013a40ed3dSBarry Smith   PetscFunctionBegin;
202f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
2033ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
204bfeeae90SHong Zhang   ishift = 0;
205b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
2069566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
207bfeeae90SHong Zhang   } else if (oshift == 1) {
2081a83f524SJed Brown     PetscInt *tia;
209d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2103b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2119566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2121a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2131a83f524SJed Brown     *ia = tia;
214ecc77c7aSBarry Smith     if (ja) {
2151a83f524SJed Brown       PetscInt *tja;
2169566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2171a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2181a83f524SJed Brown       *ja = tja;
219ecc77c7aSBarry Smith     }
2206945ee14SBarry Smith   } else {
221ecc77c7aSBarry Smith     *ia = a->i;
222ecc77c7aSBarry Smith     if (ja) *ja = a->j;
223a2ce50c7SBarry Smith   }
2243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225a2744918SBarry Smith }
226a2744918SBarry Smith 
227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
228d71ae5a4SJacob Faibussowitsch {
2293a40ed3dSBarry Smith   PetscFunctionBegin;
2303ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
231b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2329566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2339566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
234bcd2baecSBarry Smith   }
2353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23617ab2063SBarry Smith }
23717ab2063SBarry Smith 
238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
239d71ae5a4SJacob Faibussowitsch {
2403b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
241d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
24297f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2433b2fbd54SBarry Smith 
2443a40ed3dSBarry Smith   PetscFunctionBegin;
245899cda47SBarry Smith   *nn = n;
2463ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2473b2fbd54SBarry Smith   if (symmetric) {
2489566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2493b2fbd54SBarry Smith   } else {
2509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2533b2fbd54SBarry Smith     jj = a->j;
254ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2553b2fbd54SBarry Smith     cia[0] = oshift;
256ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2579566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2583b2fbd54SBarry Smith     jj = a->j;
259a93ec695SBarry Smith     for (row = 0; row < m; row++) {
260a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
261a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
262bfeeae90SHong Zhang         col = *jj++;
2632205254eSKarl Rupp 
2643b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2653b2fbd54SBarry Smith       }
2663b2fbd54SBarry Smith     }
2679566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2689371c9d4SSatish Balay     *ia = cia;
2699371c9d4SSatish Balay     *ja = cja;
2703b2fbd54SBarry Smith   }
2713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2723b2fbd54SBarry Smith }
2733b2fbd54SBarry Smith 
274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
275d71ae5a4SJacob Faibussowitsch {
2763a40ed3dSBarry Smith   PetscFunctionBegin;
2773ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2783b2fbd54SBarry Smith 
2799566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2809566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2823b2fbd54SBarry Smith }
2833b2fbd54SBarry Smith 
2847cee066cSHong Zhang /*
2857cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2867cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
287040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2887cee066cSHong Zhang */
289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
290d71ae5a4SJacob Faibussowitsch {
2917cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2927cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
293071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2947cee066cSHong Zhang   PetscInt       *cspidx;
295071fcb05SBarry Smith   const PetscInt *jj;
2967cee066cSHong Zhang 
2977cee066cSHong Zhang   PetscFunctionBegin;
2987cee066cSHong Zhang   *nn = n;
2993ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
300625f6d37SHong Zhang 
3019566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
3029566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
3039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
3049566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
3057cee066cSHong Zhang   jj = a->j;
306ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
3077cee066cSHong Zhang   cia[0] = oshift;
308ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3099566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3107cee066cSHong Zhang   jj = a->j;
3117cee066cSHong Zhang   for (row = 0; row < m; row++) {
3127cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3137cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3147cee066cSHong Zhang       col         = *jj++;
315071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
316071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
317071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3187cee066cSHong Zhang     }
3197cee066cSHong Zhang   }
3209566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
321071fcb05SBarry Smith   *ia    = cia;
322071fcb05SBarry Smith   *ja    = cja;
3237cee066cSHong Zhang   *spidx = cspidx;
3243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3257cee066cSHong Zhang }
3267cee066cSHong Zhang 
327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
328d71ae5a4SJacob Faibussowitsch {
3297cee066cSHong Zhang   PetscFunctionBegin;
3309566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3319566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3337cee066cSHong Zhang }
3347cee066cSHong Zhang 
335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
336d71ae5a4SJacob Faibussowitsch {
33787d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33887d4246cSBarry Smith   PetscInt    *ai = a->i;
339fff043a9SJunchao Zhang   PetscScalar *aa;
34087d4246cSBarry Smith 
34187d4246cSBarry Smith   PetscFunctionBegin;
3429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3439566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34687d4246cSBarry Smith }
34787d4246cSBarry Smith 
348bd04181cSBarry Smith /*
349bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
350bd04181cSBarry Smith 
351bd04181cSBarry Smith       -   a single row of values is set with each call
352bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
353bd04181cSBarry Smith       -   the values are always added to the matrix, not set
354bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
355bd04181cSBarry Smith 
3561f763a69SBarry Smith      This does NOT assume the global column indices are sorted
357bd04181cSBarry Smith 
3581f763a69SBarry Smith */
359bd04181cSBarry Smith 
360af0996ceSBarry Smith #include <petsc/private/isimpl.h>
361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
362d71ae5a4SJacob Faibussowitsch {
363189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3641f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3651f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3661f763a69SBarry Smith   PetscInt        lastcol = -1;
367fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
368189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
369189e4007SBarry Smith 
370fff043a9SJunchao Zhang   PetscFunctionBegin;
3719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
372f38dd0b8SBarry Smith   row  = ridx[im[0]];
3731f763a69SBarry Smith   rp   = aj + ai[row];
3741f763a69SBarry Smith   ap   = aa + ai[row];
3751f763a69SBarry Smith   nrow = ailen[row];
376189e4007SBarry Smith   low  = 0;
377189e4007SBarry Smith   high = nrow;
378189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
379189e4007SBarry Smith     col   = cidx[in[l]];
380f38dd0b8SBarry Smith     value = v[l];
381189e4007SBarry Smith 
382189e4007SBarry Smith     if (col <= lastcol) low = 0;
383189e4007SBarry Smith     else high = nrow;
384189e4007SBarry Smith     lastcol = col;
385189e4007SBarry Smith     while (high - low > 5) {
386189e4007SBarry Smith       t = (low + high) / 2;
387189e4007SBarry Smith       if (rp[t] > col) high = t;
388189e4007SBarry Smith       else low = t;
389189e4007SBarry Smith     }
390189e4007SBarry Smith     for (i = low; i < high; i++) {
391189e4007SBarry Smith       if (rp[i] == col) {
3921f763a69SBarry Smith         ap[i] += value;
393189e4007SBarry Smith         low = i + 1;
3941f763a69SBarry Smith         break;
395189e4007SBarry Smith       }
396189e4007SBarry Smith     }
397189e4007SBarry Smith   }
3989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3993ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
400189e4007SBarry Smith }
401189e4007SBarry Smith 
402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
403d71ae5a4SJacob Faibussowitsch {
404416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
405e2ee6c50SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
40697f1f81fSBarry Smith   PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
407e2ee6c50SBarry Smith   PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1;
408ce496241SStefano Zampini   MatScalar  *ap = NULL, value = 0.0, *aa;
409ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
410ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
41117ab2063SBarry Smith 
4123a40ed3dSBarry Smith   PetscFunctionBegin;
4139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
41417ab2063SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
415416022c9SBarry Smith     row = im[k];
4165ef9f2a5SBarry Smith     if (row < 0) continue;
4176bdcaf15SBarry Smith     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
4188e3a54c0SPierre Jolivet     rp = PetscSafePointerPlusOffset(aj, ai[row]);
4198e3a54c0SPierre Jolivet     if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]);
4209371c9d4SSatish Balay     rmax = imax[row];
4219371c9d4SSatish Balay     nrow = ailen[row];
422416022c9SBarry Smith     low  = 0;
423c71e6ed7SBarry Smith     high = nrow;
42417ab2063SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
4255ef9f2a5SBarry Smith       if (in[l] < 0) continue;
4266bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
427bfeeae90SHong Zhang       col = in[l];
428071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
429071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
43036db0b34SBarry Smith 
4312205254eSKarl Rupp       if (col <= lastcol) low = 0;
4322205254eSKarl Rupp       else high = nrow;
433e2ee6c50SBarry Smith       lastcol = col;
434416022c9SBarry Smith       while (high - low > 5) {
435416022c9SBarry Smith         t = (low + high) / 2;
436416022c9SBarry Smith         if (rp[t] > col) high = t;
437416022c9SBarry Smith         else low = t;
43817ab2063SBarry Smith       }
439416022c9SBarry Smith       for (i = low; i < high; i++) {
44017ab2063SBarry Smith         if (rp[i] > col) break;
44117ab2063SBarry Smith         if (rp[i] == col) {
442876c6284SHong Zhang           if (!A->structure_only) {
4430c0d7e18SFande Kong             if (is == ADD_VALUES) {
4440c0d7e18SFande Kong               ap[i] += value;
4450c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4469371c9d4SSatish Balay             } else ap[i] = value;
447720833daSHong Zhang           }
448e44c0bd4SBarry Smith           low = i + 1;
44917ab2063SBarry Smith           goto noinsert;
45017ab2063SBarry Smith         }
45117ab2063SBarry Smith       }
452dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
453c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
45408401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
455720833daSHong Zhang       if (A->structure_only) {
456876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
457720833daSHong Zhang       } else {
458fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
459720833daSHong Zhang       }
4609371c9d4SSatish Balay       N = nrow++ - 1;
4619371c9d4SSatish Balay       a->nz++;
4629371c9d4SSatish Balay       high++;
463416022c9SBarry Smith       /* shift up all the later entries in this row */
4649566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
46517ab2063SBarry Smith       rp[i] = col;
466580bdb30SBarry Smith       if (!A->structure_only) {
4679566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
468580bdb30SBarry Smith         ap[i] = value;
469580bdb30SBarry Smith       }
470416022c9SBarry Smith       low = i + 1;
471e44c0bd4SBarry Smith     noinsert:;
47217ab2063SBarry Smith     }
47317ab2063SBarry Smith     ailen[row] = nrow;
47417ab2063SBarry Smith   }
4759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
4763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
47717ab2063SBarry Smith }
47817ab2063SBarry Smith 
479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
480d71ae5a4SJacob Faibussowitsch {
48119b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
48219b08ed1SBarry Smith   PetscInt   *rp, k, row;
48319b08ed1SBarry Smith   PetscInt   *ai = a->i;
48419b08ed1SBarry Smith   PetscInt   *aj = a->j;
485fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
48619b08ed1SBarry Smith 
48719b08ed1SBarry Smith   PetscFunctionBegin;
48828b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
48908401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
490fff043a9SJunchao Zhang 
4919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
49219b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
49319b08ed1SBarry Smith     row = im[k];
49419b08ed1SBarry Smith     rp  = aj + ai[row];
4958e3a54c0SPierre Jolivet     ap  = PetscSafePointerPlusOffset(aa, ai[row]);
49619b08ed1SBarry Smith 
4979566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
49819b08ed1SBarry Smith     if (!A->structure_only) {
49919b08ed1SBarry Smith       if (v) {
5009566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
50119b08ed1SBarry Smith         v += n;
50219b08ed1SBarry Smith       } else {
5039566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
50419b08ed1SBarry Smith       }
50519b08ed1SBarry Smith     }
50619b08ed1SBarry Smith     a->ilen[row]  = n;
50719b08ed1SBarry Smith     a->imax[row]  = n;
50819b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
50919b08ed1SBarry Smith     a->nz += n;
51019b08ed1SBarry Smith   }
5119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51319b08ed1SBarry Smith }
51419b08ed1SBarry Smith 
51519b08ed1SBarry Smith /*@
51619b08ed1SBarry Smith   MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51719b08ed1SBarry Smith 
51819b08ed1SBarry Smith   Input Parameters:
51911a5261eSBarry Smith + A       - the `MATSEQAIJ` matrix
52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros
52119b08ed1SBarry Smith 
52219b08ed1SBarry Smith   Level: advanced
52319b08ed1SBarry Smith 
52419b08ed1SBarry Smith   Notes:
52519b08ed1SBarry Smith   This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
52611a5261eSBarry Smith   Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52719b08ed1SBarry Smith   as always with multiple matrix assemblies.
52819b08ed1SBarry Smith 
5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
53019b08ed1SBarry Smith @*/
531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
532d71ae5a4SJacob Faibussowitsch {
53319b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
53419b08ed1SBarry Smith 
53519b08ed1SBarry Smith   PetscFunctionBegin;
5369566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5379566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
53819b08ed1SBarry Smith   a->maxnz = nztotal;
5394dfa11a4SJacob Faibussowitsch   if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); }
54019b08ed1SBarry Smith   if (!a->ilen) {
5419566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
54219b08ed1SBarry Smith   } else {
5439566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
54419b08ed1SBarry Smith   }
54519b08ed1SBarry Smith 
54619b08ed1SBarry Smith   /* allocate the matrix space */
5479f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i));
5489f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j));
5499f0612e4SBarry Smith   a->free_ij = PETSC_TRUE;
55019b08ed1SBarry Smith   if (A->structure_only) {
55119b08ed1SBarry Smith     a->free_a = PETSC_FALSE;
55219b08ed1SBarry Smith   } else {
5539f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a));
55419b08ed1SBarry Smith     a->free_a = PETSC_TRUE;
55519b08ed1SBarry Smith   }
5569f0612e4SBarry Smith   a->i[0]           = 0;
55719b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
55819b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
5593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
56019b08ed1SBarry Smith }
56119b08ed1SBarry Smith 
562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
563d71ae5a4SJacob Faibussowitsch {
564071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
565071fcb05SBarry Smith   PetscInt   *rp, k, row;
566071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
567071fcb05SBarry Smith   PetscInt   *aj = a->j;
568fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
569071fcb05SBarry Smith 
570071fcb05SBarry Smith   PetscFunctionBegin;
5719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
572071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
573071fcb05SBarry Smith     row = im[k];
5746bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
575071fcb05SBarry Smith     rp = aj + ai[row];
576071fcb05SBarry Smith     ap = aa + ai[row];
57748a46eb9SPierre Jolivet     if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
578071fcb05SBarry Smith     if (!A->structure_only) {
579071fcb05SBarry Smith       if (v) {
5809566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
581071fcb05SBarry Smith         v += n;
582071fcb05SBarry Smith       } else {
5839566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
584071fcb05SBarry Smith       }
585071fcb05SBarry Smith     }
586071fcb05SBarry Smith     ailen[row] = n;
587071fcb05SBarry Smith     a->nz += n;
588071fcb05SBarry Smith   }
5899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
591071fcb05SBarry Smith }
592071fcb05SBarry Smith 
593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
594d71ae5a4SJacob Faibussowitsch {
5957eb43aa7SLois Curfman McInnes   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
59697f1f81fSBarry Smith   PetscInt        *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
59797f1f81fSBarry Smith   PetscInt        *ai = a->i, *ailen = a->ilen;
5984e208921SJed Brown   const MatScalar *ap, *aa;
5997eb43aa7SLois Curfman McInnes 
6003a40ed3dSBarry Smith   PetscFunctionBegin;
6014e208921SJed Brown   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
6027eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6037eb43aa7SLois Curfman McInnes     row = im[k];
6049371c9d4SSatish Balay     if (row < 0) {
6059371c9d4SSatish Balay       v += n;
6069371c9d4SSatish Balay       continue;
6079371c9d4SSatish Balay     } /* negative row */
60854c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6098e3a54c0SPierre Jolivet     rp   = PetscSafePointerPlusOffset(aj, ai[row]);
6108e3a54c0SPierre Jolivet     ap   = PetscSafePointerPlusOffset(aa, ai[row]);
6117eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6127eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6139371c9d4SSatish Balay       if (in[l] < 0) {
6149371c9d4SSatish Balay         v++;
6159371c9d4SSatish Balay         continue;
6169371c9d4SSatish Balay       } /* negative column */
61754c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
618bfeeae90SHong Zhang       col  = in[l];
6199371c9d4SSatish Balay       high = nrow;
6209371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6217eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6227eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6237eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6247eb43aa7SLois Curfman McInnes         else low = t;
6257eb43aa7SLois Curfman McInnes       }
6267eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6277eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6287eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
629b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6307eb43aa7SLois Curfman McInnes           goto finished;
6317eb43aa7SLois Curfman McInnes         }
6327eb43aa7SLois Curfman McInnes       }
63397e567efSBarry Smith       *v++ = 0.0;
6347eb43aa7SLois Curfman McInnes     finished:;
6357eb43aa7SLois Curfman McInnes     }
6367eb43aa7SLois Curfman McInnes   }
6374e208921SJed Brown   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
6383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6397eb43aa7SLois Curfman McInnes }
6407eb43aa7SLois Curfman McInnes 
641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
642d71ae5a4SJacob Faibussowitsch {
6433ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
644c898d852SStefano Zampini   const PetscScalar *av;
6453ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6463ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
64717ab2063SBarry Smith 
6483a40ed3dSBarry Smith   PetscFunctionBegin;
6499566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6502205254eSKarl Rupp 
6513ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6523ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6533ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6543ea6fe3dSLisandro Dalcin   nz = A->nz;
655416022c9SBarry Smith 
6563ea6fe3dSLisandro Dalcin   /* write matrix header */
6573ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6589371c9d4SSatish Balay   header[1] = M;
6599371c9d4SSatish Balay   header[2] = N;
6609371c9d4SSatish Balay   header[3] = nz;
6619566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
662416022c9SBarry Smith 
6633ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6649566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6653ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
666e457bb90SBarry Smith   if (PetscDefined(USE_DEBUG)) {
667e457bb90SBarry Smith     PetscInt mnz = 0;
668e457bb90SBarry Smith 
669e457bb90SBarry Smith     for (i = 0; i < m; i++) mnz += rowlens[i];
670e457bb90SBarry Smith     PetscCheck(nz == mnz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row lens %" PetscInt_FMT " do not sum to nz %" PetscInt_FMT, mnz, nz);
671e457bb90SBarry Smith   }
6729566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6739566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6743ea6fe3dSLisandro Dalcin   /* store column indices */
6759566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
676416022c9SBarry Smith   /* store nonzero values */
6779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6789566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
680b37d52dbSMark F. Adams 
6813ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6829566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6833ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
68417ab2063SBarry Smith }
685416022c9SBarry Smith 
686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
687d71ae5a4SJacob Faibussowitsch {
6887dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6897dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6907dc0baabSHong Zhang 
6917dc0baabSHong Zhang   PetscFunctionBegin;
6929566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6937dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6949566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
69548a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6969566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6977dc0baabSHong Zhang   }
6989566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
6993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
7007dc0baabSHong Zhang }
7017dc0baabSHong Zhang 
70209573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer);
703cd155464SBarry Smith 
704ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
705d71ae5a4SJacob Faibussowitsch {
706416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
707c898d852SStefano Zampini   const PetscScalar *av;
70860e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
709e060cb09SBarry Smith   const char        *name;
710f3ef73ceSBarry Smith   PetscViewerFormat  format;
71117ab2063SBarry Smith 
7123a40ed3dSBarry Smith   PetscFunctionBegin;
7137dc0baabSHong Zhang   if (A->structure_only) {
7149566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7153ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
7167dc0baabSHong Zhang   }
71743e49210SHong Zhang 
7189566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
719bd6a2ce3SJunchao Zhang   // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries
7203ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
7212e5835c6SStefano Zampini 
722c898d852SStefano Zampini   /* trigger copy to CPU if needed */
7239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
72571c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
72697f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
72760e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
728c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
729d00d2cf4SBarry Smith       nofinalvalue = 1;
730d00d2cf4SBarry Smith     }
7319566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7329566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7339566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
734fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7359566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
736fbfe6fa7SJed Brown #else
7379566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
738fbfe6fa7SJed Brown #endif
7399566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
74017ab2063SBarry Smith 
74117ab2063SBarry Smith     for (i = 0; i < m; i++) {
74260e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
743aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7449566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
74517ab2063SBarry Smith #else
7469566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
74717ab2063SBarry Smith #endif
74817ab2063SBarry Smith       }
74917ab2063SBarry Smith     }
750d00d2cf4SBarry Smith     if (nofinalvalue) {
751c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7529566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
753c337ccceSJed Brown #else
7549566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
755c337ccceSJed Brown #endif
756d00d2cf4SBarry Smith     }
7579566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7589566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7599566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
760fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
7619566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
76244cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7639566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
76460e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
765aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
76636db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7679566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76836db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7699566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
77036db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7719566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7726831982aSBarry Smith         }
77344cd7ae7SLois Curfman McInnes #else
7749566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
77544cd7ae7SLois Curfman McInnes #endif
77644cd7ae7SLois Curfman McInnes       }
7779566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77844cd7ae7SLois Curfman McInnes     }
7799566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
780fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
78197f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7829566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7839566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
784496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
785496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
78660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
787496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
788aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78936db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
790496be53dSLois Curfman McInnes #else
791496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
792496be53dSLois Curfman McInnes #endif
793496be53dSLois Curfman McInnes         }
794496be53dSLois Curfman McInnes       }
795496be53dSLois Curfman McInnes     }
7962e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7979566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
7982e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7992205254eSKarl Rupp       if (i + 4 < m) {
8009566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
8012205254eSKarl Rupp       } else if (i + 3 < m) {
8029566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
8032205254eSKarl Rupp       } else if (i + 2 < m) {
8049566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
8052205254eSKarl Rupp       } else if (i + 1 < m) {
8069566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
8072205254eSKarl Rupp       } else if (i < m) {
8089566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8092205254eSKarl Rupp       } else {
8109566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8112205254eSKarl Rupp       }
812496be53dSLois Curfman McInnes     }
8139566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8149566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
815496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8179566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
818496be53dSLois Curfman McInnes       }
8199566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
820496be53dSLois Curfman McInnes     }
8219566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
822496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
82360e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
824496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
825aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
82648a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
827496be53dSLois Curfman McInnes #else
8289566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
829496be53dSLois Curfman McInnes #endif
830496be53dSLois Curfman McInnes         }
831496be53dSLois Curfman McInnes       }
8329566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
833496be53dSLois Curfman McInnes     }
8349566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
835fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
83697f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
83787828ca2SBarry Smith     PetscScalar value;
83868f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83968f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
84068f1ed48SBarry Smith 
84168f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
84268f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
84368f1ed48SBarry Smith         realonly = PETSC_FALSE;
84468f1ed48SBarry Smith         break;
84568f1ed48SBarry Smith       }
84668f1ed48SBarry Smith     }
84768f1ed48SBarry Smith #endif
84802594712SBarry Smith 
8499566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
85002594712SBarry Smith     for (i = 0; i < m; i++) {
85102594712SBarry Smith       jcnt = 0;
852d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
853e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
85402594712SBarry Smith           value = a->a[cnt++];
855e24b481bSBarry Smith           jcnt++;
85602594712SBarry Smith         } else {
85702594712SBarry Smith           value = 0.0;
85802594712SBarry Smith         }
859aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
86068f1ed48SBarry Smith         if (realonly) {
8619566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
86268f1ed48SBarry Smith         } else {
8639566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
86468f1ed48SBarry Smith         }
86502594712SBarry Smith #else
8669566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
86702594712SBarry Smith #endif
86802594712SBarry Smith       }
8699566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
87002594712SBarry Smith     }
8719566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8723c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
873150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8749566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8769566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8773c215bfdSMatthew Knepley #else
8789566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8793c215bfdSMatthew Knepley #endif
8809566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8813c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
88260e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8833c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8849566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8853c215bfdSMatthew Knepley #else
8869566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8873c215bfdSMatthew Knepley #endif
8883c215bfdSMatthew Knepley       }
8893c215bfdSMatthew Knepley     }
8909566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8913a40ed3dSBarry Smith   } else {
8929566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
893d5f3da31SBarry Smith     if (A->factortype) {
89416cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8959566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
89616cd7e1dSShri Abhyankar         /* L part */
89760e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
89916cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9009566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
90116cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9029566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
90316cd7e1dSShri Abhyankar           } else {
9049566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
90516cd7e1dSShri Abhyankar           }
90616cd7e1dSShri Abhyankar #else
9079566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90816cd7e1dSShri Abhyankar #endif
90916cd7e1dSShri Abhyankar         }
91016cd7e1dSShri Abhyankar         /* diagonal */
91116cd7e1dSShri Abhyankar         j = a->diag[i];
91216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
91316cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
9149566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j])));
91516cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9169566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j]))));
91716cd7e1dSShri Abhyankar         } else {
9189566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j])));
91916cd7e1dSShri Abhyankar         }
92016cd7e1dSShri Abhyankar #else
9219566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j])));
92216cd7e1dSShri Abhyankar #endif
92316cd7e1dSShri Abhyankar 
92416cd7e1dSShri Abhyankar         /* U part */
92560e0710aSBarry Smith         for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
92616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
92716cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9289566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
92916cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9309566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
93116cd7e1dSShri Abhyankar           } else {
9329566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
93316cd7e1dSShri Abhyankar           }
93416cd7e1dSShri Abhyankar #else
9359566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
93616cd7e1dSShri Abhyankar #endif
93716cd7e1dSShri Abhyankar         }
9389566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
93916cd7e1dSShri Abhyankar       }
94016cd7e1dSShri Abhyankar     } else {
94117ab2063SBarry Smith       for (i = 0; i < m; i++) {
9429566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
94360e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
944aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
94536db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9469566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
94736db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9489566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9493a40ed3dSBarry Smith           } else {
9509566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
95117ab2063SBarry Smith           }
95217ab2063SBarry Smith #else
9539566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
95417ab2063SBarry Smith #endif
95517ab2063SBarry Smith         }
9569566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
95717ab2063SBarry Smith       }
95816cd7e1dSShri Abhyankar     }
9599566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
96017ab2063SBarry Smith   }
9619566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
963416022c9SBarry Smith }
964416022c9SBarry Smith 
9659804daf3SBarry Smith #include <petscdraw.h>
966ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
967d71ae5a4SJacob Faibussowitsch {
968480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
969416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
970383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
971383922c3SLisandro Dalcin   int                color;
972b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
973b0a32e0cSBarry Smith   PetscViewer        viewer;
974f3ef73ceSBarry Smith   PetscViewerFormat  format;
975fff043a9SJunchao Zhang   const PetscScalar *aa;
976cddf8d76SBarry Smith 
9773a40ed3dSBarry Smith   PetscFunctionBegin;
9789566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9799566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9809566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
981383922c3SLisandro Dalcin 
982416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
984fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
985d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9860513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
987b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
988416022c9SBarry Smith     for (i = 0; i < m; i++) {
9899371c9d4SSatish Balay       y_l = m - i - 1.0;
9909371c9d4SSatish Balay       y_r = y_l + 1.0;
991bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9929371c9d4SSatish Balay         x_l = a->j[j];
9939371c9d4SSatish Balay         x_r = x_l + 1.0;
994fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9959566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
996cddf8d76SBarry Smith       }
997cddf8d76SBarry Smith     }
998b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
999cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10009371c9d4SSatish Balay       y_l = m - i - 1.0;
10019371c9d4SSatish Balay       y_r = y_l + 1.0;
1002bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10039371c9d4SSatish Balay         x_l = a->j[j];
10049371c9d4SSatish Balay         x_r = x_l + 1.0;
1005fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
10069566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1007cddf8d76SBarry Smith       }
1008cddf8d76SBarry Smith     }
1009b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1010cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10119371c9d4SSatish Balay       y_l = m - i - 1.0;
10129371c9d4SSatish Balay       y_r = y_l + 1.0;
1013bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10149371c9d4SSatish Balay         x_l = a->j[j];
10159371c9d4SSatish Balay         x_r = x_l + 1.0;
1016fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10179566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1018416022c9SBarry Smith       }
1019416022c9SBarry Smith     }
1020d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10210513a670SBarry Smith   } else {
10220513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10230513a670SBarry Smith     /* first determine max of all nonzero values */
1024b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1025383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1026b0a32e0cSBarry Smith     PetscDraw popup;
10270513a670SBarry Smith 
10280513a670SBarry Smith     for (i = 0; i < nz; i++) {
1029fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10300513a670SBarry Smith     }
1031383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10329566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10339566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1034383922c3SLisandro Dalcin 
1035d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10360513a670SBarry Smith     for (i = 0; i < m; i++) {
1037383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1038383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1039bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1040383922c3SLisandro Dalcin         x_l   = a->j[j];
1041383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1042fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10439566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10440513a670SBarry Smith         count++;
10450513a670SBarry Smith       }
10460513a670SBarry Smith     }
1047d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10480513a670SBarry Smith   }
10499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
10503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1051480ef9eaSBarry Smith }
1052cddf8d76SBarry Smith 
10539804daf3SBarry Smith #include <petscdraw.h>
1054ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1055d71ae5a4SJacob Faibussowitsch {
1056b0a32e0cSBarry Smith   PetscDraw draw;
105736db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1058ace3abfcSBarry Smith   PetscBool isnull;
1059480ef9eaSBarry Smith 
1060480ef9eaSBarry Smith   PetscFunctionBegin;
10619566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10629566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
10633ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
1064480ef9eaSBarry Smith 
10659371c9d4SSatish Balay   xr = A->cmap->n;
10669371c9d4SSatish Balay   yr = A->rmap->n;
10679371c9d4SSatish Balay   h  = yr / 10.0;
10689371c9d4SSatish Balay   w  = xr / 10.0;
10699371c9d4SSatish Balay   xr += w;
10709371c9d4SSatish Balay   yr += h;
10719371c9d4SSatish Balay   xl = -w;
10729371c9d4SSatish Balay   yl = -h;
10739566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10749566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10759566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10769566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10779566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10783ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1079416022c9SBarry Smith }
1080416022c9SBarry Smith 
1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1082d71ae5a4SJacob Faibussowitsch {
1083ace3abfcSBarry Smith   PetscBool iascii, isbinary, isdraw;
1084416022c9SBarry Smith 
10853a40ed3dSBarry Smith   PetscFunctionBegin;
10869566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii));
10879566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10889566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10891baa6e33SBarry Smith   if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10901baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10911baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10929566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
109417ab2063SBarry Smith }
109519bcc07fSBarry Smith 
1096d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1097d71ae5a4SJacob Faibussowitsch {
1098416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1099580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
1100bc43efbbSJunchao Zhang   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n;
110154f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
11023447b6efSHong Zhang   PetscReal   ratio = 0.6;
110317ab2063SBarry Smith 
11043a40ed3dSBarry Smith   PetscFunctionBegin;
11053ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
11069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
1107b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
1108b215bc84SStefano Zampini     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */
11099566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11103ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1111b215bc84SStefano Zampini   }
111217ab2063SBarry Smith 
111343ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
111417ab2063SBarry Smith   for (i = 1; i < m; i++) {
1115416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
111617ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
111794a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111817ab2063SBarry Smith     if (fshift) {
1119bfeeae90SHong Zhang       ip = aj + ai[i];
1120bfeeae90SHong Zhang       ap = aa + ai[i];
112117ab2063SBarry Smith       N  = ailen[i];
11229566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
112348a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
112417ab2063SBarry Smith     }
112517ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
112617ab2063SBarry Smith   }
112717ab2063SBarry Smith   if (m) {
112817ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112917ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
113017ab2063SBarry Smith   }
113117ab2063SBarry Smith   /* reset ilen and imax for each row */
11327b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1133396832f4SHong Zhang   if (A->structure_only) {
11349566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11359566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1136396832f4SHong Zhang   } else { /* !A->structure_only */
113717ab2063SBarry Smith     for (i = 0; i < m; i++) {
113817ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11397b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
114017ab2063SBarry Smith     }
1141396832f4SHong Zhang   }
1142bfeeae90SHong Zhang   a->nz = ai[m];
1143aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
1144bc43efbbSJunchao Zhang   PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly
1145bc43efbbSJunchao Zhang   a->diagonaldense = PETSC_TRUE;
1146bc43efbbSJunchao Zhang   n                = PetscMin(A->rmap->n, A->cmap->n);
1147bc43efbbSJunchao Zhang   for (i = 0; i < n; i++) {
1148bc43efbbSJunchao Zhang     if (a->diag[i] >= ai[i + 1]) {
1149bc43efbbSJunchao Zhang       a->diagonaldense = PETSC_FALSE;
1150bc43efbbSJunchao Zhang       break;
1151bc43efbbSJunchao Zhang     }
1152bc43efbbSJunchao Zhang   }
11539566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11549566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11559566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11562205254eSKarl Rupp 
11578e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1158dd5f02e7SSatish Balay   a->reallocs         = 0;
11596712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
116036db0b34SBarry Smith   a->rmax             = rmax;
11614e220ebcSLois Curfman McInnes 
116248a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11639566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
116517ab2063SBarry Smith }
116617ab2063SBarry Smith 
1167ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1168d71ae5a4SJacob Faibussowitsch {
116999cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
117099cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11712e5835c6SStefano Zampini   MatScalar  *aa;
117299cafbc1SBarry Smith 
117399cafbc1SBarry Smith   PetscFunctionBegin;
11749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
117599cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11783ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
117999cafbc1SBarry Smith }
118099cafbc1SBarry Smith 
1181ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1182d71ae5a4SJacob Faibussowitsch {
118399cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
118499cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11852e5835c6SStefano Zampini   MatScalar  *aa;
118699cafbc1SBarry Smith 
118799cafbc1SBarry Smith   PetscFunctionBegin;
11889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
118999cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
119399cafbc1SBarry Smith }
119499cafbc1SBarry Smith 
1195d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1196d71ae5a4SJacob Faibussowitsch {
1197fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1198fff043a9SJunchao Zhang   MatScalar  *aa;
11993a40ed3dSBarry Smith 
12003a40ed3dSBarry Smith   PetscFunctionBegin;
12019566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
12029566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
12039566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
12049566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
12053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
120617ab2063SBarry Smith }
1207416022c9SBarry Smith 
1208d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1209d71ae5a4SJacob Faibussowitsch {
1210416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1211d5d45c9bSBarry Smith 
12123a40ed3dSBarry Smith   PetscFunctionBegin;
1213b4e2f619SBarry Smith   if (A->hash_active) {
1214e3c72094SPierre Jolivet     A->ops[0] = a->cops;
1215b4e2f619SBarry Smith     PetscCall(PetscHMapIJVDestroy(&a->ht));
1216b4e2f619SBarry Smith     PetscCall(PetscFree(a->dnz));
1217b4e2f619SBarry Smith     A->hash_active = PETSC_FALSE;
1218b4e2f619SBarry Smith   }
1219b4e2f619SBarry Smith 
12203ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz));
12219566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12229566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12239566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12249566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12259566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12269566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12279566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12289566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12299566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12309566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12319566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12329566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
12339566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12349566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
12359566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1236901853e0SKris Buschelman 
12376718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12386718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12396718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12406718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12416718818eSStefano Zampini      due to different matrix sizes */
12429566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12436718818eSStefano Zampini 
12449566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12452e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12462e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12479566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12489566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12499566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12509566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12532e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12542e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12552e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12562e956fe4SStefano Zampini #endif
12574222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12589566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12599566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12609566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12614222ddf1SHong Zhang #endif
1262d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
1263d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL));
1264d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL));
1265d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL));
1266d5e393b6SSuyash Tandon #endif
12673d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12689566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12693d0639e7SStefano Zampini #endif
12709566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1271af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12729566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1273af8000cdSHong Zhang #endif
1274d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
12759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1276d24d4204SJose E. Roman #endif
127763c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
128063c07aadSStefano Zampini #endif
12819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
12839566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
12849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
12852e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
12869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
12879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
12889566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
12899566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
12909566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
12919566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
12929566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
12939566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
12949566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
12959566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
12962e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
12972e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
12982e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
12992e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
13002e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
13012e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
13022e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
13033ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
130417ab2063SBarry Smith }
130517ab2063SBarry Smith 
1306d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1307d71ae5a4SJacob Faibussowitsch {
1308416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
13093a40ed3dSBarry Smith 
13103a40ed3dSBarry Smith   PetscFunctionBegin;
1311a65d3064SKris Buschelman   switch (op) {
1312d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1313d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1314d71ae5a4SJacob Faibussowitsch     break;
1315d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1316d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1317d71ae5a4SJacob Faibussowitsch     break;
1318d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1319d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1320d71ae5a4SJacob Faibussowitsch     break;
1321d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1322d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1323d71ae5a4SJacob Faibussowitsch     break;
1324d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1325d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1326d71ae5a4SJacob Faibussowitsch     break;
1327d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1328d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1329d71ae5a4SJacob Faibussowitsch     break;
1330d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1331d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1332d71ae5a4SJacob Faibussowitsch     break;
13333d472b54SHong Zhang   case MAT_SPD:
1334b1646e73SJed Brown   case MAT_SYMMETRIC:
1335b1646e73SJed Brown   case MAT_STRUCTURALLY_SYMMETRIC:
1336b1646e73SJed Brown   case MAT_HERMITIAN:
1337b1646e73SJed Brown   case MAT_SYMMETRY_ETERNAL:
1338957cac9fSHong Zhang   case MAT_STRUCTURE_ONLY:
1339b94d7dedSBarry Smith   case MAT_STRUCTURAL_SYMMETRY_ETERNAL:
1340b94d7dedSBarry Smith   case MAT_SPD_ETERNAL:
1341b94d7dedSBarry Smith     /* if the diagonal matrix is square it inherits some of the properties above */
13425021d80fSJed Brown     break;
13438c78258cSHong Zhang   case MAT_FORCE_DIAGONAL_ENTRIES:
1344a65d3064SKris Buschelman   case MAT_IGNORE_OFF_PROC_ENTRIES:
1345d71ae5a4SJacob Faibussowitsch   case MAT_USE_HASH_TABLE:
1346d71ae5a4SJacob Faibussowitsch     PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op]));
1347d71ae5a4SJacob Faibussowitsch     break;
1348d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1349d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1350d71ae5a4SJacob Faibussowitsch     break;
1351d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1352d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1353d71ae5a4SJacob Faibussowitsch     break;
1354071fcb05SBarry Smith   case MAT_SORTED_FULL:
1355071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1356071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1357071fcb05SBarry Smith     break;
1358d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1359d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1360d71ae5a4SJacob Faibussowitsch     break;
1361d71ae5a4SJacob Faibussowitsch   default:
1362d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op);
1363a65d3064SKris Buschelman   }
13643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
136517ab2063SBarry Smith }
136617ab2063SBarry Smith 
1367ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1368d71ae5a4SJacob Faibussowitsch {
1369416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1370fdc842d1SBarry Smith   PetscInt           i, j, n, *ai = a->i, *aj = a->j;
1371c898d852SStefano Zampini   PetscScalar       *x;
1372c898d852SStefano Zampini   const PetscScalar *aa;
137317ab2063SBarry Smith 
13743a40ed3dSBarry Smith   PetscFunctionBegin;
13759566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
137608401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1378d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1379d3e70bfaSHong Zhang     PetscInt *diag = a->diag;
13809566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
13812c990fa1SHong Zhang     for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13829566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13839566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13843ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
138535e7444dSHong Zhang   }
138635e7444dSHong Zhang 
13879566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
138835e7444dSHong Zhang   for (i = 0; i < n; i++) {
1389fdc842d1SBarry Smith     x[i] = 0.0;
139035e7444dSHong Zhang     for (j = ai[i]; j < ai[i + 1]; j++) {
139135e7444dSHong Zhang       if (aj[j] == i) {
139235e7444dSHong Zhang         x[i] = aa[j];
139317ab2063SBarry Smith         break;
139417ab2063SBarry Smith       }
139517ab2063SBarry Smith     }
139617ab2063SBarry Smith   }
13979566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
13989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
140017ab2063SBarry Smith }
140117ab2063SBarry Smith 
1402c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1403d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1404d71ae5a4SJacob Faibussowitsch {
1405416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
14065f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1407d9ca1df4SBarry Smith   PetscScalar       *y;
1408d9ca1df4SBarry Smith   const PetscScalar *x;
1409d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
14105c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
14115f22a7b3SSebastian Grimberg   const MatScalar  *v;
1412a77337e4SBarry Smith   PetscScalar       alpha;
1413d9ca1df4SBarry Smith   PetscInt          n, i, j;
1414d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14153447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1416ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14175c897100SBarry Smith #endif
141817ab2063SBarry Smith 
14193a40ed3dSBarry Smith   PetscFunctionBegin;
14209566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14219566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14229566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14245c897100SBarry Smith 
14255c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1426fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14275c897100SBarry Smith #else
14283447b6efSHong Zhang   if (usecprow) {
14293447b6efSHong Zhang     m    = cprow.nrows;
14303447b6efSHong Zhang     ii   = cprow.i;
14317b2bb3b9SHong Zhang     ridx = cprow.rindex;
14323447b6efSHong Zhang   } else {
14333447b6efSHong Zhang     ii = a->i;
14343447b6efSHong Zhang   }
143517ab2063SBarry Smith   for (i = 0; i < m; i++) {
14363447b6efSHong Zhang     idx = a->j + ii[i];
1437fff043a9SJunchao Zhang     v   = aa + ii[i];
14383447b6efSHong Zhang     n   = ii[i + 1] - ii[i];
14393447b6efSHong Zhang     if (usecprow) {
14407b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14413447b6efSHong Zhang     } else {
144217ab2063SBarry Smith       alpha = x[i];
14433447b6efSHong Zhang     }
144404fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
144517ab2063SBarry Smith   }
14465c897100SBarry Smith #endif
14479566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14489566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14499566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
145217ab2063SBarry Smith }
145317ab2063SBarry Smith 
1454d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1455d71ae5a4SJacob Faibussowitsch {
14565c897100SBarry Smith   PetscFunctionBegin;
14579566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14589566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14605c897100SBarry Smith }
14615c897100SBarry Smith 
1462c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
146378b84d54SShri Abhyankar 
1464d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1465d71ae5a4SJacob Faibussowitsch {
1466416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1467d9fead3dSBarry Smith   PetscScalar       *y;
146854f21887SBarry Smith   const PetscScalar *x;
14695914357eSBarry Smith   const MatScalar   *a_a;
1470003131ecSBarry Smith   PetscInt           m = A->rmap->n;
14715914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
1472ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
147317ab2063SBarry Smith 
1474b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
147597952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1476fee21e36SBarry Smith #endif
1477fee21e36SBarry Smith 
14783a40ed3dSBarry Smith   PetscFunctionBegin;
1479b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14809566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
14813ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1482b215bc84SStefano Zampini   }
14839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14849566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14859566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1486416022c9SBarry Smith   ii = a->i;
14874eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14889566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
148997952fefSHong Zhang     m    = a->compressedrow.nrows;
149097952fefSHong Zhang     ii   = a->compressedrow.i;
149197952fefSHong Zhang     ridx = a->compressedrow.rindex;
14925914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
14935914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
14945914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
14955914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
14965914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
14975914357eSBarry Smith       PetscScalar        sum = 0.0;
1498003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1499003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
150097952fefSHong Zhang       y[*ridx++] = sum;
150197952fefSHong Zhang     }
150297952fefSHong Zhang   } else { /* do not use compressed row format */
1503b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
15045914357eSBarry Smith     fortranmultaij_(&m, x, ii, a->j, a_a, y);
1505b05257ddSBarry Smith #else
15065914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
15075914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
15085914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
15095914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
15105914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
15115914357eSBarry Smith       PetscScalar        sum = 0.0;
1512003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
151317ab2063SBarry Smith       y[i] = sum;
151417ab2063SBarry Smith     }
15158d195f9aSBarry Smith #endif
1516b05257ddSBarry Smith   }
15179566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15189566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15199566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
152217ab2063SBarry Smith }
152317ab2063SBarry Smith 
1524ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1525ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1526d71ae5a4SJacob Faibussowitsch {
1527b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1528b434eb95SMatthew G. Knepley   PetscScalar       *y;
1529b434eb95SMatthew G. Knepley   const PetscScalar *x;
1530fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1531b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1532b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1533b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1534b434eb95SMatthew G. Knepley   PetscScalar        sum;
1535b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1536b434eb95SMatthew G. Knepley 
1537b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1538b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1539b434eb95SMatthew G. Knepley #endif
1540b434eb95SMatthew G. Knepley 
1541b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15439566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15449566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1545b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1546b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1547b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1548b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1549b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1550b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1551b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1552fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1553b434eb95SMatthew G. Knepley       sum = 0.0;
1554b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1555b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1556b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1557b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1558b434eb95SMatthew G. Knepley     }
1559b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15603d3eaba7SBarry Smith     ii = a->i;
1561b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1562b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1563b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1564fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1565b434eb95SMatthew G. Knepley       sum = 0.0;
1566b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1567b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1568b434eb95SMatthew G. Knepley       y[i] = sum;
1569b434eb95SMatthew G. Knepley     }
1570b434eb95SMatthew G. Knepley   }
15719566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15729566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15739566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15753ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1576b434eb95SMatthew G. Knepley }
1577b434eb95SMatthew G. Knepley 
1578ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1579ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1580d71ae5a4SJacob Faibussowitsch {
1581b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1582b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1583b434eb95SMatthew G. Knepley   const PetscScalar *x;
1584fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1585b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1586b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1587b434eb95SMatthew G. Knepley   PetscScalar        sum;
1588b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1589b434eb95SMatthew G. Knepley 
1590b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15929566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15939566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1594b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
159548a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1596b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1597b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1598b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1599b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1600b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1601b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1602fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1603b434eb95SMatthew G. Knepley       sum = y[*ridx];
1604b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1605b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1606b434eb95SMatthew G. Knepley     }
1607b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
16083d3eaba7SBarry Smith     ii = a->i;
1609b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1610b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1611b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1612fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1613b434eb95SMatthew G. Knepley       sum = y[i];
1614b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1615b434eb95SMatthew G. Knepley       z[i] = sum;
1616b434eb95SMatthew G. Knepley     }
1617b434eb95SMatthew G. Knepley   }
16189566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16199566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16209566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16223ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1623b434eb95SMatthew G. Knepley }
1624b434eb95SMatthew G. Knepley 
1625c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1626d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1627d71ae5a4SJacob Faibussowitsch {
1628416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1629f15663dcSBarry Smith   PetscScalar       *y, *z;
1630f15663dcSBarry Smith   const PetscScalar *x;
16315914357eSBarry Smith   const MatScalar   *a_a;
16325914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
16335914357eSBarry Smith   PetscInt           m        = A->rmap->n;
1634ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16359ea0dfa2SSatish Balay 
16363a40ed3dSBarry Smith   PetscFunctionBegin;
1637b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16389566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
16393ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1640b215bc84SStefano Zampini   }
16419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16429566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16439566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16444eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
164548a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
164697952fefSHong Zhang     m    = a->compressedrow.nrows;
164797952fefSHong Zhang     ii   = a->compressedrow.i;
164897952fefSHong Zhang     ridx = a->compressedrow.rindex;
16495914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16505914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16515914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16525914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16535914357eSBarry Smith       PetscScalar        sum = y[*ridx];
1654f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
165597952fefSHong Zhang       z[*ridx++] = sum;
165697952fefSHong Zhang     }
165797952fefSHong Zhang   } else { /* do not use compressed row format */
16583d3eaba7SBarry Smith     ii = a->i;
1659f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
16605914357eSBarry Smith     fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z);
1661f15663dcSBarry Smith #else
16625914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
16635914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16645914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16655914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16665914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16675914357eSBarry Smith       PetscScalar        sum = y[i];
1668f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
166917ab2063SBarry Smith       z[i] = sum;
167017ab2063SBarry Smith     }
167102ab625aSSatish Balay #endif
1672f15663dcSBarry Smith   }
16739566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16749566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16759566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
167817ab2063SBarry Smith }
167917ab2063SBarry Smith 
168017ab2063SBarry Smith /*
16810b4b7b1cSBarry Smith      Adds diagonal pointers to sparse matrix nonzero structure.
168217ab2063SBarry Smith */
1683d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
1684d71ae5a4SJacob Faibussowitsch {
1685416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1686d0f46423SBarry Smith   PetscInt    i, j, m = A->rmap->n;
1687c0c07093SJunchao Zhang   PetscBool   alreadySet = PETSC_TRUE;
168817ab2063SBarry Smith 
16893a40ed3dSBarry Smith   PetscFunctionBegin;
169009f38230SBarry Smith   if (!a->diag) {
16919566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &a->diag));
1692c0c07093SJunchao Zhang     alreadySet = PETSC_FALSE;
169309f38230SBarry Smith   }
1694d0f46423SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
1695c0c07093SJunchao Zhang     /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */
1696c0c07093SJunchao Zhang     if (alreadySet) {
1697c0c07093SJunchao Zhang       PetscInt pos = a->diag[i];
1698c0c07093SJunchao Zhang       if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue;
1699c0c07093SJunchao Zhang     }
1700c0c07093SJunchao Zhang 
170109f38230SBarry Smith     a->diag[i] = a->i[i + 1];
1702bfeeae90SHong Zhang     for (j = a->i[i]; j < a->i[i + 1]; j++) {
1703bfeeae90SHong Zhang       if (a->j[j] == i) {
170409f38230SBarry Smith         a->diag[i] = j;
170517ab2063SBarry Smith         break;
170617ab2063SBarry Smith       }
170717ab2063SBarry Smith     }
170817ab2063SBarry Smith   }
17093ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
171017ab2063SBarry Smith }
171117ab2063SBarry Smith 
1712ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1713d71ae5a4SJacob Faibussowitsch {
171461ecd0c6SBarry Smith   Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
171561ecd0c6SBarry Smith   const PetscInt *diag = (const PetscInt *)a->diag;
171661ecd0c6SBarry Smith   const PetscInt *ii   = (const PetscInt *)a->i;
171761ecd0c6SBarry Smith   PetscInt        i, *mdiag = NULL;
171861ecd0c6SBarry Smith   PetscInt        cnt = 0; /* how many diagonals are missing */
171961ecd0c6SBarry Smith 
172061ecd0c6SBarry Smith   PetscFunctionBegin;
172161ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
17229566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
17239566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
17243ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
172561ecd0c6SBarry Smith   }
172661ecd0c6SBarry Smith 
172761ecd0c6SBarry Smith   if (a->diagonaldense) {
172861ecd0c6SBarry Smith     cnt = 0;
172961ecd0c6SBarry Smith   } else {
17309566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
173161ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
1732349d3b71SJunchao Zhang       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
173361ecd0c6SBarry Smith         cnt++;
173461ecd0c6SBarry Smith         mdiag[i] = 1;
173561ecd0c6SBarry Smith       }
173661ecd0c6SBarry Smith     }
173761ecd0c6SBarry Smith   }
173861ecd0c6SBarry Smith   if (!cnt) {
17399566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
174061ecd0c6SBarry Smith   } else {
1741b6f2aa54SBarry Smith     PetscScalar       *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1742b6f2aa54SBarry Smith     PetscInt          *oldj = a->j, *oldi = a->i;
17439f0612e4SBarry Smith     PetscBool          free_a = a->free_a, free_ij = a->free_ij;
17446ea2a7edSJunchao Zhang     const PetscScalar *Aa;
17456ea2a7edSJunchao Zhang 
17466ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host
17476ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa));
174861ecd0c6SBarry Smith 
174961ecd0c6SBarry Smith     a->a = NULL;
175061ecd0c6SBarry Smith     a->j = NULL;
175161ecd0c6SBarry Smith     a->i = NULL;
175261ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
1753ad540459SPierre Jolivet     for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17549566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
175561ecd0c6SBarry Smith 
175661ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
175761ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
17589566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
175948a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1760447d62f5SStefano Zampini     }
17619566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17629566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
17639f0612e4SBarry Smith     if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda));
17649f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj));
17659f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi));
176661ecd0c6SBarry Smith   }
17679566063dSJacob Faibussowitsch   PetscCall(PetscFree(mdiag));
176861ecd0c6SBarry Smith   a->diagonaldense = PETSC_TRUE;
17693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
177061ecd0c6SBarry Smith }
177161ecd0c6SBarry Smith 
1772be5855fcSBarry Smith /*
1773be5855fcSBarry Smith      Checks for missing diagonals
1774be5855fcSBarry Smith */
1775d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d)
1776d71ae5a4SJacob Faibussowitsch {
1777be5855fcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
17787734d3b5SMatthew G. Knepley   PetscInt   *diag, *ii = a->i, i;
1779be5855fcSBarry Smith 
1780be5855fcSBarry Smith   PetscFunctionBegin;
178109f38230SBarry Smith   *missing = PETSC_FALSE;
17827734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
178309f38230SBarry Smith     *missing = PETSC_TRUE;
178409f38230SBarry Smith     if (d) *d = 0;
17859566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
178609f38230SBarry Smith   } else {
178701445905SHong Zhang     PetscInt n;
178801445905SHong Zhang     n    = PetscMin(A->rmap->n, A->cmap->n);
1789f1e2ffcdSBarry Smith     diag = a->diag;
179001445905SHong Zhang     for (i = 0; i < n; i++) {
17917734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
179209f38230SBarry Smith         *missing = PETSC_TRUE;
179309f38230SBarry Smith         if (d) *d = i;
17949566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i));
1795358d2f5dSShri Abhyankar         break;
179609f38230SBarry Smith       }
1797be5855fcSBarry Smith     }
1798be5855fcSBarry Smith   }
17993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1800be5855fcSBarry Smith }
1801be5855fcSBarry Smith 
18020da83c2eSBarry Smith #include <petscblaslapack.h>
18030da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
18040da83c2eSBarry Smith 
18050da83c2eSBarry Smith /*
18060da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
18070da83c2eSBarry Smith */
1808ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1809d71ae5a4SJacob Faibussowitsch {
18100da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
18110da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
18120da83c2eSBarry Smith   const PetscReal shift = 0.0;
18130da83c2eSBarry Smith   PetscInt        ipvt[5];
18144e208921SJed Brown   PetscCount      flops = 0;
18150da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
18160da83c2eSBarry Smith 
18170da83c2eSBarry Smith   PetscFunctionBegin;
18180da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
18190da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
182008401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1821ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
18229566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
182348a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
18240da83c2eSBarry Smith   ncnt = 0;
18250da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
18260da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
18279566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
18280da83c2eSBarry Smith     switch (bsizes[i]) {
1829d71ae5a4SJacob Faibussowitsch     case 1:
1830d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1831d71ae5a4SJacob Faibussowitsch       break;
18320da83c2eSBarry Smith     case 2:
18339566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
18340da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18359566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
18360da83c2eSBarry Smith       break;
18370da83c2eSBarry Smith     case 3:
18389566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
18390da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18409566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
18410da83c2eSBarry Smith       break;
18420da83c2eSBarry Smith     case 4:
18439566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
18440da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18459566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
18460da83c2eSBarry Smith       break;
18470da83c2eSBarry Smith     case 5:
18489566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
18490da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18509566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
18510da83c2eSBarry Smith       break;
18520da83c2eSBarry Smith     case 6:
18539566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
18540da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18559566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
18560da83c2eSBarry Smith       break;
18570da83c2eSBarry Smith     case 7:
18589566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
18590da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18609566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
18610da83c2eSBarry Smith       break;
18620da83c2eSBarry Smith     default:
18639566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
18640da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18659566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
18660da83c2eSBarry Smith     }
18670da83c2eSBarry Smith     ncnt += bsizes[i];
18680da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
1869baa50dc0SBrad Aagaard     flops += 2 * PetscPowInt64(bsizes[i], 3) / 3;
18700da83c2eSBarry Smith   }
18713ba16761SJacob Faibussowitsch   PetscCall(PetscLogFlops(flops));
187248a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18739566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18750da83c2eSBarry Smith }
18760da83c2eSBarry Smith 
1877422a814eSBarry Smith /*
1878422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1879422a814eSBarry Smith */
1880ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1881d71ae5a4SJacob Faibussowitsch {
188271f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1883d0f46423SBarry Smith   PetscInt         i, *diag, m = A->rmap->n;
18842e5835c6SStefano Zampini   const MatScalar *v;
188554f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
188671f1c65dSBarry Smith 
188771f1c65dSBarry Smith   PetscFunctionBegin;
18883ba16761SJacob Faibussowitsch   if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS);
18899566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
189071f1c65dSBarry Smith   diag = a->diag;
18914dfa11a4SJacob Faibussowitsch   if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); }
18922e5835c6SStefano Zampini 
189371f1c65dSBarry Smith   mdiag = a->mdiag;
189471f1c65dSBarry Smith   idiag = a->idiag;
18959566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1896422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
189771f1c65dSBarry Smith     for (i = 0; i < m; i++) {
189871f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1899899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1900899639b0SHong Zhang         if (PetscRealPart(fshift)) {
19019566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
19027b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
19037b6c816cSBarry Smith           A->factorerror_zeropivot_value = 0.0;
19047b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
190598921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
1906899639b0SHong Zhang       }
190771f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
190871f1c65dSBarry Smith     }
19099566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
191071f1c65dSBarry Smith   } else {
191171f1c65dSBarry Smith     for (i = 0; i < m; i++) {
191271f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
191371f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
191471f1c65dSBarry Smith     }
19159566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
191671f1c65dSBarry Smith   }
191771f1c65dSBarry Smith   a->idiagvalid = PETSC_TRUE;
19189566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
19193ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
192071f1c65dSBarry Smith }
192171f1c65dSBarry Smith 
1922d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1923d71ae5a4SJacob Faibussowitsch {
1924416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1925e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
19262e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
192754f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
19283d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
192997f1f81fSBarry Smith   const PetscInt    *idx, *diag;
193017ab2063SBarry Smith 
19313a40ed3dSBarry Smith   PetscFunctionBegin;
1932b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
19339566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
19343ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1935b215bc84SStefano Zampini   }
1936b965ef7fSBarry Smith   its = its * lits;
193791723122SBarry Smith 
193871f1c65dSBarry Smith   if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
19399566063dSJacob Faibussowitsch   if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift));
194071f1c65dSBarry Smith   a->fshift = fshift;
194171f1c65dSBarry Smith   a->omega  = omega;
1942ed480e8bSBarry Smith 
194371f1c65dSBarry Smith   diag  = a->diag;
194471f1c65dSBarry Smith   t     = a->ssor_work;
1945ed480e8bSBarry Smith   idiag = a->idiag;
194671f1c65dSBarry Smith   mdiag = a->mdiag;
1947ed480e8bSBarry Smith 
19489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
19499566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
19509566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1951ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
195217ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
195317ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1954ed480e8bSBarry Smith     bs = b;
195517ab2063SBarry Smith     for (i = 0; i < m; i++) {
195671f1c65dSBarry Smith       d   = fshift + mdiag[i];
1957416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1958ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19592e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
196017ab2063SBarry Smith       sum = b[i] * d / omega;
1961003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
196217ab2063SBarry Smith       x[i] = sum;
196317ab2063SBarry Smith     }
19649566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19659566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19669566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
19679566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
19683ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
196917ab2063SBarry Smith   }
1970c783ea89SBarry Smith 
197108401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1972f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19734c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1974887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
197517ab2063SBarry Smith 
197617ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
197717ab2063SBarry Smith 
1978887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
197917ab2063SBarry Smith     */
198017ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
198117ab2063SBarry Smith 
198217ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
198317ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1984416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1985ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19862e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
198717ab2063SBarry Smith       sum = b[i];
1988e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1989ed480e8bSBarry Smith       x[i] = sum * idiag[i];
199017ab2063SBarry Smith     }
199117ab2063SBarry Smith 
199217ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19932e5835c6SStefano Zampini     v = aa;
19942205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
199517ab2063SBarry Smith 
199617ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1997ed480e8bSBarry Smith     ts   = t;
1998416022c9SBarry Smith     diag = a->diag;
199917ab2063SBarry Smith     for (i = 0; i < m; i++) {
2000416022c9SBarry Smith       n   = diag[i] - a->i[i];
2001ed480e8bSBarry Smith       idx = a->j + a->i[i];
20022e5835c6SStefano Zampini       v   = aa + a->i[i];
200317ab2063SBarry Smith       sum = t[i];
2004003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
2005ed480e8bSBarry Smith       t[i] = sum * idiag[i];
2006733d66baSBarry Smith       /*  x = x + t */
2007733d66baSBarry Smith       x[i] += t[i];
200817ab2063SBarry Smith     }
200917ab2063SBarry Smith 
20109566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
20119566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
20129566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
20133ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
201417ab2063SBarry Smith   }
201517ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
201617ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
201717ab2063SBarry Smith       for (i = 0; i < m; i++) {
2018416022c9SBarry Smith         n   = diag[i] - a->i[i];
2019ed480e8bSBarry Smith         idx = a->j + a->i[i];
20202e5835c6SStefano Zampini         v   = aa + a->i[i];
202117ab2063SBarry Smith         sum = b[i];
2022e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20235c99c7daSBarry Smith         t[i] = sum;
2024ed480e8bSBarry Smith         x[i] = sum * idiag[i];
202517ab2063SBarry Smith       }
20265c99c7daSBarry Smith       xb = t;
20279566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
20283a40ed3dSBarry Smith     } else xb = b;
202917ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
203017ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2031416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
2032ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
20332e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
203417ab2063SBarry Smith         sum = xb[i];
2035e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20365c99c7daSBarry Smith         if (xb == b) {
2037ed480e8bSBarry Smith           x[i] = sum * idiag[i];
20385c99c7daSBarry Smith         } else {
2039b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
204017ab2063SBarry Smith         }
20415c99c7daSBarry Smith       }
20429566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
204317ab2063SBarry Smith     }
204417ab2063SBarry Smith     its--;
204517ab2063SBarry Smith   }
204617ab2063SBarry Smith   while (its--) {
204717ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
204817ab2063SBarry Smith       for (i = 0; i < m; i++) {
2049b19a5dc2SMark Adams         /* lower */
2050b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
2051ed480e8bSBarry Smith         idx = a->j + a->i[i];
20522e5835c6SStefano Zampini         v   = aa + a->i[i];
205317ab2063SBarry Smith         sum = b[i];
2054e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2055b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
2056b19a5dc2SMark Adams         /* upper */
2057b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
2058b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
20592e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
2060b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2061b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
206217ab2063SBarry Smith       }
2063b19a5dc2SMark Adams       xb = t;
20649566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
2065b19a5dc2SMark Adams     } else xb = b;
206617ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
206717ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2068b19a5dc2SMark Adams         sum = xb[i];
2069b19a5dc2SMark Adams         if (xb == b) {
2070b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
2071416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
2072ed480e8bSBarry Smith           idx = a->j + a->i[i];
20732e5835c6SStefano Zampini           v   = aa + a->i[i];
2074e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2075ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2076b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2077b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2078b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20792e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2080b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2081b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
208217ab2063SBarry Smith         }
2083b19a5dc2SMark Adams       }
2084b19a5dc2SMark Adams       if (xb == b) {
20859566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2086b19a5dc2SMark Adams       } else {
20879566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2088b19a5dc2SMark Adams       }
208917ab2063SBarry Smith     }
209017ab2063SBarry Smith   }
20919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20929566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20939566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
20943ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
209517ab2063SBarry Smith }
209617ab2063SBarry Smith 
2097ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2098d71ae5a4SJacob Faibussowitsch {
2099416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
21004e220ebcSLois Curfman McInnes 
21013a40ed3dSBarry Smith   PetscFunctionBegin;
21024e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
21033966268fSBarry Smith   info->nz_allocated = a->maxnz;
21043966268fSBarry Smith   info->nz_used      = a->nz;
21053966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
21063966268fSBarry Smith   info->assemblies   = A->num_ass;
21073966268fSBarry Smith   info->mallocs      = A->info.mallocs;
21084dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2109d5f3da31SBarry Smith   if (A->factortype) {
21104e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
21114e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
21124e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
21134e220ebcSLois Curfman McInnes   } else {
21144e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
21154e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
21164e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
21174e220ebcSLois Curfman McInnes   }
21183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
211917ab2063SBarry Smith }
212017ab2063SBarry Smith 
2121ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2122d71ae5a4SJacob Faibussowitsch {
2123416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2124c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
212597b48c8fSBarry Smith   const PetscScalar *xx;
21262e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2127c7da8527SEric Chamberland   PetscInt           d = 0;
212817ab2063SBarry Smith 
21293a40ed3dSBarry Smith   PetscFunctionBegin;
213097b48c8fSBarry Smith   if (x && b) {
21319566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21329566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
213397b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2134aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2135447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
213697b48c8fSBarry Smith       bb[rows[i]] = diag * xx[rows[i]];
213797b48c8fSBarry Smith     }
21389566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21399566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
214097b48c8fSBarry Smith   }
214197b48c8fSBarry Smith 
21429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2143a9817697SBarry Smith   if (a->keepnonzeropattern) {
2144f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2145aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21469566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2147f1e2ffcdSBarry Smith     }
2148f4df32b1SMatthew Knepley     if (diag != 0.0) {
2149c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2150c7da8527SEric Chamberland         d = rows[i];
2151447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
215208401ef6SPierre Jolivet         PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
2153c7da8527SEric Chamberland       }
2154f1e2ffcdSBarry Smith       for (i = 0; i < N; i++) {
2155447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
21562e5835c6SStefano Zampini         aa[a->diag[rows[i]]] = diag;
2157f1e2ffcdSBarry Smith       }
2158f1e2ffcdSBarry Smith     }
2159f1e2ffcdSBarry Smith   } else {
2160f4df32b1SMatthew Knepley     if (diag != 0.0) {
216117ab2063SBarry Smith       for (i = 0; i < N; i++) {
2162aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21637ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2164447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2165447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2166447d62f5SStefano Zampini           } else {
2167416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
21682e5835c6SStefano Zampini             aa[a->i[rows[i]]]   = diag;
2169bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2170447d62f5SStefano Zampini           }
2171447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
21729566063dSJacob Faibussowitsch           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
217317ab2063SBarry Smith         }
217417ab2063SBarry Smith       }
21753a40ed3dSBarry Smith     } else {
217617ab2063SBarry Smith       for (i = 0; i < N; i++) {
2177aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2178416022c9SBarry Smith         a->ilen[rows[i]] = 0;
217917ab2063SBarry Smith       }
218017ab2063SBarry Smith     }
2181e56f5c9eSBarry Smith     A->nonzerostate++;
2182f1e2ffcdSBarry Smith   }
21839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2184dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
218617ab2063SBarry Smith }
218717ab2063SBarry Smith 
2188ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2189d71ae5a4SJacob Faibussowitsch {
21906e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21916e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
21922b40b63fSBarry Smith   PetscBool          missing, *zeroed, vecs = PETSC_FALSE;
21936e169961SBarry Smith   const PetscScalar *xx;
21942e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
21956e169961SBarry Smith 
21966e169961SBarry Smith   PetscFunctionBegin;
21973ba16761SJacob Faibussowitsch   if (!N) PetscFunctionReturn(PETSC_SUCCESS);
21989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
21996e169961SBarry Smith   if (x && b) {
22009566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
22019566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
22022b40b63fSBarry Smith     vecs = PETSC_TRUE;
22036e169961SBarry Smith   }
22049566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
22056e169961SBarry Smith   for (i = 0; i < N; i++) {
2206aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
22078e3a54c0SPierre Jolivet     PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]]));
22082205254eSKarl Rupp 
22096e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
22106e169961SBarry Smith   }
22116e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
22126e169961SBarry Smith     if (!zeroed[i]) {
22136e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
22144cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
22152e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
22162e5835c6SStefano Zampini           aa[j] = 0.0;
22176e169961SBarry Smith         }
22186e169961SBarry Smith       }
22194cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i];
22206e169961SBarry Smith   }
22216e169961SBarry Smith   if (x && b) {
22229566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
22239566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
22246e169961SBarry Smith   }
22259566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
22266e169961SBarry Smith   if (diag != 0.0) {
22279566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d));
22281d5a398dSstefano_zampini     if (missing) {
22291d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
22304cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2231aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
22329566063dSJacob Faibussowitsch         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
22331d5a398dSstefano_zampini       }
22341d5a398dSstefano_zampini     } else {
2235ad540459SPierre Jolivet       for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag;
22366e169961SBarry Smith     }
22371d5a398dSstefano_zampini   }
22389566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2239dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
22403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22416e169961SBarry Smith }
22426e169961SBarry Smith 
2243d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2244d71ae5a4SJacob Faibussowitsch {
2245fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2246fff043a9SJunchao Zhang   const PetscScalar *aa;
224717ab2063SBarry Smith 
22483a40ed3dSBarry Smith   PetscFunctionBegin;
22499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2250416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
22518e3a54c0SPierre Jolivet   if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]);
225217ab2063SBarry Smith   if (idx) {
22535c0db29aSPierre Jolivet     if (*nz && a->j) *idx = a->j + a->i[row];
2254f4259b30SLisandro Dalcin     else *idx = NULL;
225517ab2063SBarry Smith   }
22569566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
22573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225817ab2063SBarry Smith }
225917ab2063SBarry Smith 
2260d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2261d71ae5a4SJacob Faibussowitsch {
22623a40ed3dSBarry Smith   PetscFunctionBegin;
22633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
226417ab2063SBarry Smith }
226517ab2063SBarry Smith 
2266ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2267d71ae5a4SJacob Faibussowitsch {
2268416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
22692e5835c6SStefano Zampini   const MatScalar *v;
227036db0b34SBarry Smith   PetscReal        sum = 0.0;
227197f1f81fSBarry Smith   PetscInt         i, j;
227217ab2063SBarry Smith 
22733a40ed3dSBarry Smith   PetscFunctionBegin;
22749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
227517ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2276570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2277570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2278792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2279570b7f6dSBarry Smith #else
2280416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22819371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22829371c9d4SSatish Balay       v++;
228317ab2063SBarry Smith     }
22848f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2285570b7f6dSBarry Smith #endif
22869566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22873a40ed3dSBarry Smith   } else if (type == NORM_1) {
228836db0b34SBarry Smith     PetscReal *tmp;
228997f1f81fSBarry Smith     PetscInt  *jj = a->j;
22909566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp));
2291064f8208SBarry Smith     *nrm = 0.0;
2292416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22939371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22949371c9d4SSatish Balay       v++;
229517ab2063SBarry Smith     }
2296d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2297064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
229817ab2063SBarry Smith     }
22999566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
23009566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
23013a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2302064f8208SBarry Smith     *nrm = 0.0;
2303d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
23048e3a54c0SPierre Jolivet       const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]);
230517ab2063SBarry Smith       sum                   = 0.0;
2306416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
23079371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
23089371c9d4SSatish Balay         v2++;
230917ab2063SBarry Smith       }
2310064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
231117ab2063SBarry Smith     }
23129566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
2313f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
23149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
23153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
231617ab2063SBarry Smith }
231717ab2063SBarry Smith 
2318ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2319d71ae5a4SJacob Faibussowitsch {
23203d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
232154f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
23222e5835c6SStefano Zampini   const MatScalar *va, *vb;
232397f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2324cd0d46ebSvictorle 
2325cd0d46ebSvictorle   PetscFunctionBegin;
23269566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23279566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23285485867bSBarry Smith   if (ma != nb || na != mb) {
23295485867bSBarry Smith     *f = PETSC_FALSE;
23303ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23315485867bSBarry Smith   }
23329566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
23339566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
23349371c9d4SSatish Balay   aii = aij->i;
23359371c9d4SSatish Balay   bii = bij->i;
23369371c9d4SSatish Balay   adx = aij->j;
23379371c9d4SSatish Balay   bdx = bij->j;
23389566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23399566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2340cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2341cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2342cd0d46ebSvictorle 
2343cd0d46ebSvictorle   *f = PETSC_TRUE;
2344cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2345cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
234697f1f81fSBarry Smith       PetscInt    idc, idr;
23475485867bSBarry Smith       PetscScalar vc, vr;
2348cd0d46ebSvictorle       /* column/row index/value */
23495485867bSBarry Smith       idc = adx[aptr[i]];
23505485867bSBarry Smith       idr = bdx[bptr[idc]];
23515485867bSBarry Smith       vc  = va[aptr[i]];
23525485867bSBarry Smith       vr  = vb[bptr[idc]];
23535485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
23545485867bSBarry Smith         *f = PETSC_FALSE;
23555485867bSBarry Smith         goto done;
2356cd0d46ebSvictorle       } else {
23575485867bSBarry Smith         aptr[i]++;
23585485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2359cd0d46ebSvictorle       }
2360cd0d46ebSvictorle     }
2361cd0d46ebSvictorle   }
2362cd0d46ebSvictorle done:
23639566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23649566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
23669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
23673ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2368cd0d46ebSvictorle }
2369cd0d46ebSvictorle 
2370ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2371d71ae5a4SJacob Faibussowitsch {
23723d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
237354f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
237454f21887SBarry Smith   MatScalar  *va, *vb;
23751cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23761cbb95d3SBarry Smith 
23771cbb95d3SBarry Smith   PetscFunctionBegin;
23789566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23799566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23801cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23811cbb95d3SBarry Smith     *f = PETSC_FALSE;
23823ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23831cbb95d3SBarry Smith   }
23849371c9d4SSatish Balay   aii = aij->i;
23859371c9d4SSatish Balay   bii = bij->i;
23869371c9d4SSatish Balay   adx = aij->j;
23879371c9d4SSatish Balay   bdx = bij->j;
23889371c9d4SSatish Balay   va  = aij->a;
23899371c9d4SSatish Balay   vb  = bij->a;
23909566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23919566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23921cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23931cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23941cbb95d3SBarry Smith 
23951cbb95d3SBarry Smith   *f = PETSC_TRUE;
23961cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
23971cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
23981cbb95d3SBarry Smith       PetscInt    idc, idr;
23991cbb95d3SBarry Smith       PetscScalar vc, vr;
24001cbb95d3SBarry Smith       /* column/row index/value */
24011cbb95d3SBarry Smith       idc = adx[aptr[i]];
24021cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
24031cbb95d3SBarry Smith       vc  = va[aptr[i]];
24041cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
24051cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
24061cbb95d3SBarry Smith         *f = PETSC_FALSE;
24071cbb95d3SBarry Smith         goto done;
24081cbb95d3SBarry Smith       } else {
24091cbb95d3SBarry Smith         aptr[i]++;
24101cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
24111cbb95d3SBarry Smith       }
24121cbb95d3SBarry Smith     }
24131cbb95d3SBarry Smith   }
24141cbb95d3SBarry Smith done:
24159566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
24169566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
24173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24181cbb95d3SBarry Smith }
24191cbb95d3SBarry Smith 
2420d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2421d71ae5a4SJacob Faibussowitsch {
2422416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2423fff8e43fSBarry Smith   const PetscScalar *l, *r;
2424fff8e43fSBarry Smith   PetscScalar        x;
242554f21887SBarry Smith   MatScalar         *v;
2426fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2427fff8e43fSBarry Smith   const PetscInt    *jj;
242817ab2063SBarry Smith 
24293a40ed3dSBarry Smith   PetscFunctionBegin;
243017ab2063SBarry Smith   if (ll) {
24313ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
24323ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
24339566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
243408401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
24359566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
24369566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
243717ab2063SBarry Smith     for (i = 0; i < m; i++) {
243817ab2063SBarry Smith       x = l[i];
2439416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
24402205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
244117ab2063SBarry Smith     }
24429566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
24439566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
24449566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
244517ab2063SBarry Smith   }
244617ab2063SBarry Smith   if (rr) {
24479566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
244808401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
24499566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
24509566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
24512e5835c6SStefano Zampini     jj = a->j;
24522205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
24539566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
24549566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
24559566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
245617ab2063SBarry Smith   }
24579566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
24583ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
245917ab2063SBarry Smith }
246017ab2063SBarry Smith 
2461d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2462d71ae5a4SJacob Faibussowitsch {
2463db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2464d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
246597f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
24665d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
24672e5835c6SStefano Zampini   const PetscScalar *aa;
24685d0c19d7SBarry Smith   PetscInt           nrows, ncols;
246997f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
2470fb3c7e2dSJunchao Zhang   MatScalar         *a_new, *mat_a, *c_a;
2471416022c9SBarry Smith   Mat                C;
2472cdc6f3adSToby Isaac   PetscBool          stride;
247317ab2063SBarry Smith 
24743a40ed3dSBarry Smith   PetscFunctionBegin;
24759566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24769566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24779566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
247817ab2063SBarry Smith 
24799566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2480ff718158SBarry Smith   if (stride) {
24819566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2482ff718158SBarry Smith   } else {
2483ff718158SBarry Smith     first = 0;
2484ff718158SBarry Smith     step  = 0;
2485ff718158SBarry Smith   }
2486fee21e36SBarry Smith   if (stride && step == 1) {
248702834360SBarry Smith     /* special case of contiguous rows */
24889566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
248902834360SBarry Smith     /* loop over new rows determining lens and starting points */
249002834360SBarry Smith     for (i = 0; i < nrows; i++) {
2491bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2492a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2493a91a9bebSLisandro Dalcin       starts[i] = kstart;
249402834360SBarry Smith       for (k = kstart; k < kend; k++) {
2495bfeeae90SHong Zhang         if (aj[k] >= first) {
249602834360SBarry Smith           starts[i] = k;
249702834360SBarry Smith           break;
249802834360SBarry Smith         }
249902834360SBarry Smith       }
2500a2744918SBarry Smith       sum = 0;
250102834360SBarry Smith       while (k < kend) {
2502bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2503a2744918SBarry Smith         sum++;
250402834360SBarry Smith       }
2505a2744918SBarry Smith       lens[i] = sum;
250602834360SBarry Smith     }
250702834360SBarry Smith     /* create submatrix */
2508cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
250997f1f81fSBarry Smith       PetscInt n_cols, n_rows;
25109566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2511aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
25129566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
251308480c60SBarry Smith       C = *B;
25143a40ed3dSBarry Smith     } else {
25153bef6203SJed Brown       PetscInt rbs, cbs;
25169566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25179566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25189566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25199566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25209566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25219566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25229566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
252308480c60SBarry Smith     }
2524db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2525db02288aSLois Curfman McInnes 
252602834360SBarry Smith     /* loop over rows inserting into submatrix */
2527fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C
2528db02288aSLois Curfman McInnes     j_new = c->j;
2529db02288aSLois Curfman McInnes     i_new = c->i;
25309566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
253102834360SBarry Smith     for (i = 0; i < nrows; i++) {
2532a2744918SBarry Smith       ii    = starts[i];
2533a2744918SBarry Smith       lensi = lens[i];
2534810441c8SPierre Jolivet       if (lensi) {
2535ad540459SPierre Jolivet         for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
25369566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2537a2744918SBarry Smith         a_new += lensi;
2538810441c8SPierre Jolivet       }
2539a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2540a2744918SBarry Smith       c->ilen[i]   = lensi;
254102834360SBarry Smith     }
2542fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly
25439566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
25449566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
25453a40ed3dSBarry Smith   } else {
25469566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
25479566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
25489566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
25494dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
25506bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
25514dcab191SBarry Smith       smap[icol[i]] = i + 1;
25524dcab191SBarry Smith     }
25534dcab191SBarry Smith 
255402834360SBarry Smith     /* determine lens of each row */
255502834360SBarry Smith     for (i = 0; i < nrows; i++) {
2556bfeeae90SHong Zhang       kstart  = ai[irow[i]];
255702834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
255802834360SBarry Smith       lens[i] = 0;
255902834360SBarry Smith       for (k = kstart; k < kend; k++) {
2560ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
256102834360SBarry Smith       }
256202834360SBarry Smith     }
256317ab2063SBarry Smith     /* Create and fill new matrix */
2564a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2565ace3abfcSBarry Smith       PetscBool equal;
25660f5bd95cSBarry Smith 
256799141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2568aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
25699566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
2570fdfbdca6SPierre Jolivet       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros");
25719566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
257208480c60SBarry Smith       C = *B;
25733a40ed3dSBarry Smith     } else {
25743bef6203SJed Brown       PetscInt rbs, cbs;
25759566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25769566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25779566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25789566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
257937a5e0faSPierre Jolivet       if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs));
25809566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25819566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
258208480c60SBarry Smith     }
25839566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2584fb3c7e2dSJunchao Zhang 
2585f4f49eeaSPierre Jolivet     c = (Mat_SeqAIJ *)C->data;
2586fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C
258717ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
258899141d43SSatish Balay       row      = irow[i];
2589bfeeae90SHong Zhang       kstart   = ai[row];
259099141d43SSatish Balay       kend     = kstart + a->ilen[row];
2591bfeeae90SHong Zhang       mat_i    = c->i[i];
25928e3a54c0SPierre Jolivet       mat_j    = PetscSafePointerPlusOffset(c->j, mat_i);
25938e3a54c0SPierre Jolivet       mat_a    = PetscSafePointerPlusOffset(c_a, mat_i);
259499141d43SSatish Balay       mat_ilen = c->ilen + i;
259517ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2596bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2597ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
25982e5835c6SStefano Zampini           *mat_a++ = aa[k];
259999141d43SSatish Balay           (*mat_ilen)++;
260017ab2063SBarry Smith         }
260117ab2063SBarry Smith       }
260217ab2063SBarry Smith     }
26039566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
260402834360SBarry Smith     /* Free work space */
26059566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
26069566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
26079566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2608cdc6f3adSToby Isaac     /* sort */
2609cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2610cdc6f3adSToby Isaac       PetscInt ilen;
2611cdc6f3adSToby Isaac 
2612cdc6f3adSToby Isaac       mat_i = c->i[i];
26138e3a54c0SPierre Jolivet       mat_j = PetscSafePointerPlusOffset(c->j, mat_i);
26148e3a54c0SPierre Jolivet       mat_a = PetscSafePointerPlusOffset(c_a, mat_i);
2615cdc6f3adSToby Isaac       ilen  = c->ilen[i];
26169566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2617cdc6f3adSToby Isaac     }
2618fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a));
261902834360SBarry Smith   }
26208c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
26219566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2622305c6ccfSStefano Zampini #endif
26239566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
26249566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
262517ab2063SBarry Smith 
26269566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2627416022c9SBarry Smith   *B = C;
26283ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
262917ab2063SBarry Smith }
263017ab2063SBarry Smith 
2631ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2632d71ae5a4SJacob Faibussowitsch {
263382d44351SHong Zhang   Mat B;
263482d44351SHong Zhang 
263582d44351SHong Zhang   PetscFunctionBegin;
2636c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
26379566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
26389566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
26399566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
26409566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
26419566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
264282d44351SHong Zhang     *subMat = B;
2643c2d650bdSHong Zhang   } else {
26449566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2645c2d650bdSHong Zhang   }
26463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
264782d44351SHong Zhang }
264882d44351SHong Zhang 
2649ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2650d71ae5a4SJacob Faibussowitsch {
265163b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
265263b91edcSBarry Smith   Mat         outA;
2653ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
265463b91edcSBarry Smith 
26553a40ed3dSBarry Smith   PetscFunctionBegin;
265608401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
26571df811f5SHong Zhang 
26589566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
26599566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2660a871dcd8SBarry Smith 
266163b91edcSBarry Smith   outA             = inA;
2662d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26639566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
26649566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
26652205254eSKarl Rupp 
26669566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
26679566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
26682205254eSKarl Rupp 
2669c3122656SLisandro Dalcin   a->row = row;
26702205254eSKarl Rupp 
26719566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
26729566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
26732205254eSKarl Rupp 
2674c3122656SLisandro Dalcin   a->col = col;
267563b91edcSBarry Smith 
267636db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26779566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26789566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2679f0ec6fceSSatish Balay 
268094a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
26819566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work));
268294a9d846SBarry Smith   }
268363b91edcSBarry Smith 
26849566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(inA));
2685137fb511SHong Zhang   if (row_identity && col_identity) {
26869566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2687137fb511SHong Zhang   } else {
26889566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2689137fb511SHong Zhang   }
26903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2691a871dcd8SBarry Smith }
2692a871dcd8SBarry Smith 
2693d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2694d71ae5a4SJacob Faibussowitsch {
2695f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2696dfa0f9e5SStefano Zampini   PetscScalar *v;
2697c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
26983a40ed3dSBarry Smith 
26993a40ed3dSBarry Smith   PetscFunctionBegin;
27009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
27019566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2702792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
27039566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
27049566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
27059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(inA));
27063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2707f0b747eeSBarry Smith }
2708f0b747eeSBarry Smith 
2709d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2710d71ae5a4SJacob Faibussowitsch {
271116b64355SHong Zhang   PetscInt i;
271216b64355SHong Zhang 
271316b64355SHong Zhang   PetscFunctionBegin;
271416b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
27159566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
271616b64355SHong Zhang 
271748a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
27189566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
271916b64355SHong Zhang 
272016b64355SHong Zhang     if (submatj->rbuf1) {
27219566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
27229566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
272316b64355SHong Zhang     }
272416b64355SHong Zhang 
272548a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
27269566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
27279566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
272816b64355SHong Zhang   }
272916b64355SHong Zhang 
273016b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2731eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&submatj->rmap));
27329566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
27339566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
273416b64355SHong Zhang #else
27359566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
273616b64355SHong Zhang #endif
273716b64355SHong Zhang 
273816b64355SHong Zhang   if (!submatj->allcolumns) {
273916b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2740eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap));
274116b64355SHong Zhang #else
27429566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
274316b64355SHong Zhang #endif
274416b64355SHong Zhang   }
27459566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
274616b64355SHong Zhang 
27479566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
27483ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
274916b64355SHong Zhang }
275016b64355SHong Zhang 
2751d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2752d71ae5a4SJacob Faibussowitsch {
275316b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
27545c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
275516b64355SHong Zhang 
275616b64355SHong Zhang   PetscFunctionBegin;
27579566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
27589566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
27593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
276016b64355SHong Zhang }
276116b64355SHong Zhang 
276289a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
2763ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2764d71ae5a4SJacob Faibussowitsch {
27652d033e1fSHong Zhang   PetscInt     i;
27660fb991dcSHong Zhang   Mat          C;
27670fb991dcSHong Zhang   Mat_SeqAIJ  *c;
27680fb991dcSHong Zhang   Mat_SubSppt *submatj;
27692d033e1fSHong Zhang 
27702d033e1fSHong Zhang   PetscFunctionBegin;
27712d033e1fSHong Zhang   for (i = 0; i < n; i++) {
27720fb991dcSHong Zhang     C       = (*mat)[i];
27730fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
27740fb991dcSHong Zhang     submatj = c->submatis1;
27752d033e1fSHong Zhang     if (submatj) {
2776682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
277726cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27789566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27799566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27809566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27813faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27829566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27839566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27849566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2785682e4c99SStefano Zampini       }
27862d033e1fSHong Zhang     } else {
27879566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
27882d033e1fSHong Zhang     }
27892d033e1fSHong Zhang   }
279086e85357SHong Zhang 
279163a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
27929566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
279363a75b2aSHong Zhang 
27949566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
27953ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
27962d033e1fSHong Zhang }
27972d033e1fSHong Zhang 
2798ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2799d71ae5a4SJacob Faibussowitsch {
280097f1f81fSBarry Smith   PetscInt i;
2801cddf8d76SBarry Smith 
28023a40ed3dSBarry Smith   PetscFunctionBegin;
280348a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2804cddf8d76SBarry Smith 
280548a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
28063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2807cddf8d76SBarry Smith }
2808cddf8d76SBarry Smith 
2809ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2810d71ae5a4SJacob Faibussowitsch {
2811e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28129a88ca10SBarry Smith   PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
28135d0c19d7SBarry Smith   const PetscInt *idx;
28149a88ca10SBarry Smith   PetscInt        start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1;
2815f1af5d2fSBarry Smith   PetscBT         table;
2816bbd702dbSSatish Balay 
28173a40ed3dSBarry Smith   PetscFunctionBegin;
28189a88ca10SBarry Smith   m  = A->rmap->n / bs;
2819e4d965acSSatish Balay   ai = a->i;
2820bfeeae90SHong Zhang   aj = a->j;
28218a047759SSatish Balay 
282208401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
282306763907SSatish Balay 
28249566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
28259566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
282606763907SSatish Balay 
2827e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2828b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2829e4d965acSSatish Balay     isz = 0;
28309566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2831e4d965acSSatish Balay 
2832e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28339566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
28349566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2835e4d965acSSatish Balay 
28369a88ca10SBarry Smith     if (bs > 1) {
28379a88ca10SBarry Smith       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
28389a88ca10SBarry Smith       for (j = 0; j < n; ++j) {
28399a88ca10SBarry Smith         if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
28409a88ca10SBarry Smith       }
28419a88ca10SBarry Smith       PetscCall(ISRestoreIndices(is[i], &idx));
28429a88ca10SBarry Smith       PetscCall(ISDestroy(&is[i]));
28439a88ca10SBarry Smith 
28449a88ca10SBarry Smith       k = 0;
28459a88ca10SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
28469a88ca10SBarry Smith         n = isz;
28479a88ca10SBarry Smith         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
28489a88ca10SBarry Smith           for (ll = 0; ll < bs; ll++) {
28499a88ca10SBarry Smith             row   = bs * nidx[k] + ll;
28509a88ca10SBarry Smith             start = ai[row];
28519a88ca10SBarry Smith             end   = ai[row + 1];
28529a88ca10SBarry Smith             for (l = start; l < end; l++) {
28539a88ca10SBarry Smith               val = aj[l] / bs;
28549a88ca10SBarry Smith               if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
28559a88ca10SBarry Smith             }
28569a88ca10SBarry Smith           }
28579a88ca10SBarry Smith         }
28589a88ca10SBarry Smith       }
285957508eceSPierre Jolivet       PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i));
28609a88ca10SBarry Smith     } else {
2861dd097bc3SLois Curfman McInnes       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2862e4d965acSSatish Balay       for (j = 0; j < n; ++j) {
28632205254eSKarl Rupp         if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
28644dcbc457SBarry Smith       }
28659566063dSJacob Faibussowitsch       PetscCall(ISRestoreIndices(is[i], &idx));
28669566063dSJacob Faibussowitsch       PetscCall(ISDestroy(&is[i]));
2867e4d965acSSatish Balay 
286804a348a9SBarry Smith       k = 0;
286904a348a9SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
287004a348a9SBarry Smith         n = isz;
287106763907SSatish Balay         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2872e4d965acSSatish Balay           row   = nidx[k];
2873e4d965acSSatish Balay           start = ai[row];
2874e4d965acSSatish Balay           end   = ai[row + 1];
287504a348a9SBarry Smith           for (l = start; l < end; l++) {
2876efb16452SHong Zhang             val = aj[l];
28772205254eSKarl Rupp             if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2878e4d965acSSatish Balay           }
2879e4d965acSSatish Balay         }
2880e4d965acSSatish Balay       }
288157508eceSPierre Jolivet       PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i));
2882e4d965acSSatish Balay     }
28839a88ca10SBarry Smith   }
28849566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
28859566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
28863ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28874dcbc457SBarry Smith }
288817ab2063SBarry Smith 
2889ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2890d71ae5a4SJacob Faibussowitsch {
28910513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28923b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
28935d0c19d7SBarry Smith   const PetscInt *row, *col;
28945d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
289556cd22aeSBarry Smith   IS              icolp, irowp;
28960298fd71SBarry Smith   PetscInt       *cwork = NULL;
28970298fd71SBarry Smith   PetscScalar    *vwork = NULL;
28980513a670SBarry Smith 
28993a40ed3dSBarry Smith   PetscFunctionBegin;
29009566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
29019566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
29029566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
29039566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
29040513a670SBarry Smith 
29050513a670SBarry Smith   /* determine lengths of permuted rows */
29069566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
29072205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
29089566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
29099566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
29109566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
29119566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
29129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
29139566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
29140513a670SBarry Smith 
29159566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
29160513a670SBarry Smith   for (i = 0; i < m; i++) {
29179566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29182205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
29199566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
29209566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29210513a670SBarry Smith   }
29229566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
29232205254eSKarl Rupp 
29243c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
29252205254eSKarl Rupp 
29268c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
29279566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
29289fe5e383SStefano Zampini #endif
29299566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
29309566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
29319566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
29329566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
29339566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
29349566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
293548a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
29363ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29370513a670SBarry Smith }
29380513a670SBarry Smith 
2939d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2940d71ae5a4SJacob Faibussowitsch {
2941cb5b572fSBarry Smith   PetscFunctionBegin;
294233f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
294333f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2944be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2945be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
29462e5835c6SStefano Zampini     const PetscScalar *aa;
2947be6bf707SBarry Smith 
29489566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
294908401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
29509566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n]));
29519566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
29529566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
2953cb5b572fSBarry Smith   } else {
29549566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2955cb5b572fSBarry Smith   }
29563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2957cb5b572fSBarry Smith }
2958cb5b572fSBarry Smith 
2959d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2960d71ae5a4SJacob Faibussowitsch {
29616c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
29626e111a19SKarl Rupp 
29636c0721eeSBarry Smith   PetscFunctionBegin;
29646c0721eeSBarry Smith   *array = a->a;
29653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29666c0721eeSBarry Smith }
29676c0721eeSBarry Smith 
2968d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2969d71ae5a4SJacob Faibussowitsch {
29706c0721eeSBarry Smith   PetscFunctionBegin;
2971f38c1e66SStefano Zampini   *array = NULL;
29723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29736c0721eeSBarry Smith }
2974273d9f13SBarry Smith 
29758229c054SShri Abhyankar /*
29768229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29778229c054SShri Abhyankar    have different nonzero structure.
29788229c054SShri Abhyankar */
2979d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2980d71ae5a4SJacob Faibussowitsch {
2981b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2982ec7775f6SShri Abhyankar 
2983ec7775f6SShri Abhyankar   PetscFunctionBegin;
2984ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2985ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
29868e3a54c0SPierre Jolivet     const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]);
2987b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
2988b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
29898af7cee1SJed Brown     nnz[i] = 0;
29908af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
2991b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
2992b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
29938af7cee1SJed Brown       nnz[i]++;
29948af7cee1SJed Brown     }
29958af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
2996ec7775f6SShri Abhyankar   }
29973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2998ec7775f6SShri Abhyankar }
2999ec7775f6SShri Abhyankar 
3000d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
3001d71ae5a4SJacob Faibussowitsch {
3002b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
3003b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
3004b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
3005b264fe52SHong Zhang 
3006b264fe52SHong Zhang   PetscFunctionBegin;
3007b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
30089566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
30093ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3010b264fe52SHong Zhang }
3011b264fe52SHong Zhang 
3012d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
3013d71ae5a4SJacob Faibussowitsch {
3014ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
3015ac90fabeSBarry Smith 
3016ac90fabeSBarry Smith   PetscFunctionBegin;
3017134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
3018134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
3019134adf20SPierre Jolivet     if (e) {
30209566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
302181fa06acSBarry Smith       if (e) {
30229566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
3023134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
302481fa06acSBarry Smith       }
302581fa06acSBarry Smith     }
302654c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
302781fa06acSBarry Smith   }
3028ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
30292e5835c6SStefano Zampini     const PetscScalar *xa;
30302e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
303181fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
303281fa06acSBarry Smith 
30339566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
30349566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
30359566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
3036792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
30379566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
30389566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
30399566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
30409566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
30419566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
3042ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
30439566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
3044ac90fabeSBarry Smith   } else {
30458229c054SShri Abhyankar     Mat       B;
30468229c054SShri Abhyankar     PetscInt *nnz;
30479566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
30489566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
30499566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
30509566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
30519566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
30529566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
30539566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
30549566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
30559566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
30569bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
30579566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
3058ac90fabeSBarry Smith   }
30593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3060ac90fabeSBarry Smith }
3061ac90fabeSBarry Smith 
3062d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
3063d71ae5a4SJacob Faibussowitsch {
3064354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3065354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
3066354c94deSBarry Smith   PetscInt     i, nz;
3067354c94deSBarry Smith   PetscScalar *a;
3068354c94deSBarry Smith 
3069354c94deSBarry Smith   PetscFunctionBegin;
3070354c94deSBarry Smith   nz = aij->nz;
30719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
30722205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
30739566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
3074354c94deSBarry Smith #else
3075354c94deSBarry Smith   PetscFunctionBegin;
3076354c94deSBarry Smith #endif
30773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3078354c94deSBarry Smith }
3079354c94deSBarry Smith 
3080ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3081d71ae5a4SJacob Faibussowitsch {
3082e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3083d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3084e34fafa9SBarry Smith   PetscReal        atmp;
3085985db425SBarry Smith   PetscScalar     *x;
3086ce496241SStefano Zampini   const MatScalar *aa, *av;
3087e34fafa9SBarry Smith 
3088e34fafa9SBarry Smith   PetscFunctionBegin;
308928b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
30909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3091ce496241SStefano Zampini   aa = av;
3092e34fafa9SBarry Smith   ai = a->i;
3093e34fafa9SBarry Smith   aj = a->j;
3094e34fafa9SBarry Smith 
30959566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
30969566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
309708401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3098e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
30999371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31009371c9d4SSatish Balay     ai++;
3101*62e5df07SMark Adams     x[i] = 0;
3102e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3103985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
31049371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
31059371c9d4SSatish Balay         x[i] = atmp;
31069371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31079371c9d4SSatish Balay       }
31089371c9d4SSatish Balay       aa++;
31099371c9d4SSatish Balay       aj++;
3110985db425SBarry Smith     }
3111985db425SBarry Smith   }
31129566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31143ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3115985db425SBarry Smith }
3116985db425SBarry Smith 
3117eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v)
3118eede4a3fSMark Adams {
3119eede4a3fSMark Adams   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3120eede4a3fSMark Adams   PetscInt         i, j, m = A->rmap->n, *ai, ncols, n;
3121eede4a3fSMark Adams   PetscScalar     *x;
3122eede4a3fSMark Adams   const MatScalar *aa, *av;
3123eede4a3fSMark Adams 
3124eede4a3fSMark Adams   PetscFunctionBegin;
3125eede4a3fSMark Adams   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3126eede4a3fSMark Adams   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3127eede4a3fSMark Adams   aa = av;
3128eede4a3fSMark Adams   ai = a->i;
3129eede4a3fSMark Adams 
3130eede4a3fSMark Adams   PetscCall(VecGetArrayWrite(v, &x));
3131eede4a3fSMark Adams   PetscCall(VecGetLocalSize(v, &n));
3132eede4a3fSMark Adams   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3133eede4a3fSMark Adams   for (i = 0; i < m; i++) {
3134eede4a3fSMark Adams     ncols = ai[1] - ai[0];
3135eede4a3fSMark Adams     ai++;
3136*62e5df07SMark Adams     x[i] = 0;
3137eede4a3fSMark Adams     for (j = 0; j < ncols; j++) {
3138eede4a3fSMark Adams       x[i] += PetscAbsScalar(*aa);
3139eede4a3fSMark Adams       aa++;
3140eede4a3fSMark Adams     }
3141eede4a3fSMark Adams   }
3142eede4a3fSMark Adams   PetscCall(VecRestoreArrayWrite(v, &x));
3143eede4a3fSMark Adams   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3144eede4a3fSMark Adams   PetscFunctionReturn(PETSC_SUCCESS);
3145eede4a3fSMark Adams }
3146eede4a3fSMark Adams 
3147ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3148d71ae5a4SJacob Faibussowitsch {
3149985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3150d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3151985db425SBarry Smith   PetscScalar     *x;
3152ce496241SStefano Zampini   const MatScalar *aa, *av;
3153985db425SBarry Smith 
3154985db425SBarry Smith   PetscFunctionBegin;
315528b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31569566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3157ce496241SStefano Zampini   aa = av;
3158985db425SBarry Smith   ai = a->i;
3159985db425SBarry Smith   aj = a->j;
3160985db425SBarry Smith 
31619566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31629566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
316308401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3164985db425SBarry Smith   for (i = 0; i < m; i++) {
31659371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31669371c9d4SSatish Balay     ai++;
3167d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31689371c9d4SSatish Balay       x[i] = *aa;
31699371c9d4SSatish Balay       if (idx) idx[i] = 0;
3170985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3171985db425SBarry Smith       x[i] = 0.0;
3172985db425SBarry Smith       if (idx) {
3173985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3174985db425SBarry Smith           if (aj[j] > j) {
3175985db425SBarry Smith             idx[i] = j;
3176985db425SBarry Smith             break;
3177985db425SBarry Smith           }
3178985db425SBarry Smith         }
31791a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31801a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3181985db425SBarry Smith       }
3182985db425SBarry Smith     }
3183985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31849371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31859371c9d4SSatish Balay         x[i] = *aa;
31869371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31879371c9d4SSatish Balay       }
31889371c9d4SSatish Balay       aa++;
31899371c9d4SSatish Balay       aj++;
3190985db425SBarry Smith     }
3191985db425SBarry Smith   }
31929566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31939566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31943ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3195985db425SBarry Smith }
3196985db425SBarry Smith 
3197ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3198d71ae5a4SJacob Faibussowitsch {
3199c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3200c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3201ce496241SStefano Zampini   PetscScalar     *x;
3202ce496241SStefano Zampini   const MatScalar *aa, *av;
3203c87e5d42SMatthew Knepley 
3204c87e5d42SMatthew Knepley   PetscFunctionBegin;
32059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3206ce496241SStefano Zampini   aa = av;
3207c87e5d42SMatthew Knepley   ai = a->i;
3208c87e5d42SMatthew Knepley   aj = a->j;
3209c87e5d42SMatthew Knepley 
32109566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32119566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
321208401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3213c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
32149371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32159371c9d4SSatish Balay     ai++;
3216f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
32179371c9d4SSatish Balay       x[i] = *aa;
32189371c9d4SSatish Balay       if (idx) idx[i] = 0;
3219f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3220f07e67edSHong Zhang       x[i] = 0.0;
3221f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3222289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3223f07e67edSHong Zhang           if (aj[j] > j) {
3224f07e67edSHong Zhang             idx[i] = j;
32252205254eSKarl Rupp             break;
32262205254eSKarl Rupp           }
3227289a08f5SMatthew Knepley         }
3228f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3229f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3230f07e67edSHong Zhang       }
3231289a08f5SMatthew Knepley     }
3232c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
32339371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
32349371c9d4SSatish Balay         x[i] = *aa;
32359371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32369371c9d4SSatish Balay       }
32379371c9d4SSatish Balay       aa++;
32389371c9d4SSatish Balay       aj++;
3239c87e5d42SMatthew Knepley     }
3240c87e5d42SMatthew Knepley   }
32419566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3244c87e5d42SMatthew Knepley }
3245c87e5d42SMatthew Knepley 
3246ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3247d71ae5a4SJacob Faibussowitsch {
3248985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3249d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3250d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3251985db425SBarry Smith   PetscScalar     *x;
3252ce496241SStefano Zampini   const MatScalar *aa, *av;
3253985db425SBarry Smith 
3254985db425SBarry Smith   PetscFunctionBegin;
325528b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
32569566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3257ce496241SStefano Zampini   aa = av;
3258985db425SBarry Smith   ai = a->i;
3259985db425SBarry Smith   aj = a->j;
3260985db425SBarry Smith 
32619566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32629566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
326308401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3264985db425SBarry Smith   for (i = 0; i < m; i++) {
32659371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32669371c9d4SSatish Balay     ai++;
3267d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
32689371c9d4SSatish Balay       x[i] = *aa;
32699371c9d4SSatish Balay       if (idx) idx[i] = 0;
3270985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3271985db425SBarry Smith       x[i] = 0.0;
3272985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3273985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3274985db425SBarry Smith           if (aj[j] > j) {
3275985db425SBarry Smith             idx[i] = j;
3276985db425SBarry Smith             break;
3277985db425SBarry Smith           }
3278985db425SBarry Smith         }
3279fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3280fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3281985db425SBarry Smith       }
3282985db425SBarry Smith     }
3283985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32849371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32859371c9d4SSatish Balay         x[i] = *aa;
32869371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32879371c9d4SSatish Balay       }
32889371c9d4SSatish Balay       aa++;
32899371c9d4SSatish Balay       aj++;
3290e34fafa9SBarry Smith     }
3291e34fafa9SBarry Smith   }
32929566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32939566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32943ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3295e34fafa9SBarry Smith }
3296bbead8a2SBarry Smith 
3297ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3298d71ae5a4SJacob Faibussowitsch {
3299bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
330033d57670SJed Brown   PetscInt        i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3301bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
33020da83c2eSBarry Smith   const PetscReal shift = 0.0;
33031a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3304bbead8a2SBarry Smith 
3305bbead8a2SBarry Smith   PetscFunctionBegin;
3306a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
33074a0d0026SBarry Smith   if (a->ibdiagvalid) {
33084a0d0026SBarry Smith     if (values) *values = a->ibdiag;
33093ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
33104a0d0026SBarry Smith   }
33119566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
33124dfa11a4SJacob Faibussowitsch   if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); }
3313bbead8a2SBarry Smith   diag = a->ibdiag;
3314bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3315bbead8a2SBarry Smith   /* factor and invert each block */
3316bbead8a2SBarry Smith   switch (bs) {
3317bbead8a2SBarry Smith   case 1:
3318bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33199566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3320ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3321ec1892c8SHong Zhang         if (allowzeropivot) {
33227b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33237b6c816cSBarry Smith           A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
33247b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
33259566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
332698921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
3327ec1892c8SHong Zhang       }
3328bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3329bbead8a2SBarry Smith     }
3330bbead8a2SBarry Smith     break;
3331bbead8a2SBarry Smith   case 2:
3332bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33339371c9d4SSatish Balay       ij[0] = 2 * i;
33349371c9d4SSatish Balay       ij[1] = 2 * i + 1;
33359566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
33369566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
33377b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33389566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3339bbead8a2SBarry Smith       diag += 4;
3340bbead8a2SBarry Smith     }
3341bbead8a2SBarry Smith     break;
3342bbead8a2SBarry Smith   case 3:
3343bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33449371c9d4SSatish Balay       ij[0] = 3 * i;
33459371c9d4SSatish Balay       ij[1] = 3 * i + 1;
33469371c9d4SSatish Balay       ij[2] = 3 * i + 2;
33479566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
33489566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
33497b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33509566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3351bbead8a2SBarry Smith       diag += 9;
3352bbead8a2SBarry Smith     }
3353bbead8a2SBarry Smith     break;
3354bbead8a2SBarry Smith   case 4:
3355bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33569371c9d4SSatish Balay       ij[0] = 4 * i;
33579371c9d4SSatish Balay       ij[1] = 4 * i + 1;
33589371c9d4SSatish Balay       ij[2] = 4 * i + 2;
33599371c9d4SSatish Balay       ij[3] = 4 * i + 3;
33609566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
33619566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
33627b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33639566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3364bbead8a2SBarry Smith       diag += 16;
3365bbead8a2SBarry Smith     }
3366bbead8a2SBarry Smith     break;
3367bbead8a2SBarry Smith   case 5:
3368bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33699371c9d4SSatish Balay       ij[0] = 5 * i;
33709371c9d4SSatish Balay       ij[1] = 5 * i + 1;
33719371c9d4SSatish Balay       ij[2] = 5 * i + 2;
33729371c9d4SSatish Balay       ij[3] = 5 * i + 3;
33739371c9d4SSatish Balay       ij[4] = 5 * i + 4;
33749566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
33759566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
33767b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33779566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3378bbead8a2SBarry Smith       diag += 25;
3379bbead8a2SBarry Smith     }
3380bbead8a2SBarry Smith     break;
3381bbead8a2SBarry Smith   case 6:
3382bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33839371c9d4SSatish Balay       ij[0] = 6 * i;
33849371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33859371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33869371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33879371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33889371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33899566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33909566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33917b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33929566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3393bbead8a2SBarry Smith       diag += 36;
3394bbead8a2SBarry Smith     }
3395bbead8a2SBarry Smith     break;
3396bbead8a2SBarry Smith   case 7:
3397bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33989371c9d4SSatish Balay       ij[0] = 7 * i;
33999371c9d4SSatish Balay       ij[1] = 7 * i + 1;
34009371c9d4SSatish Balay       ij[2] = 7 * i + 2;
34019371c9d4SSatish Balay       ij[3] = 7 * i + 3;
34029371c9d4SSatish Balay       ij[4] = 7 * i + 4;
34039371c9d4SSatish Balay       ij[5] = 7 * i + 5;
3404cdd8bf47SJunchao Zhang       ij[6] = 7 * i + 6;
34059566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
34069566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
34077b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34089566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3409bbead8a2SBarry Smith       diag += 49;
3410bbead8a2SBarry Smith     }
3411bbead8a2SBarry Smith     break;
3412bbead8a2SBarry Smith   default:
34139566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3414bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3415ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
34169566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
34179566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
34187b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34199566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3420bbead8a2SBarry Smith       diag += bs2;
3421bbead8a2SBarry Smith     }
34229566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3423bbead8a2SBarry Smith   }
3424bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
34253ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3426bbead8a2SBarry Smith }
3427bbead8a2SBarry Smith 
3428d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3429d71ae5a4SJacob Faibussowitsch {
343073a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3431fff043a9SJunchao Zhang   PetscScalar a, *aa;
343273a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
343373a71a0fSBarry Smith 
343473a71a0fSBarry Smith   PetscFunctionBegin;
343573a71a0fSBarry Smith   if (!x->assembled) {
34369566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
343773a71a0fSBarry Smith     for (i = 0; i < m; i++) {
343873a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
34399566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
344073a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
34419566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
344273a71a0fSBarry Smith       }
344373a71a0fSBarry Smith     }
3444e2ce353bSJunchao Zhang   } else {
34459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
34469566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
34479566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3448e2ce353bSJunchao Zhang   }
34499566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34509566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
345273a71a0fSBarry Smith }
345373a71a0fSBarry Smith 
3454679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3455d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3456d71ae5a4SJacob Faibussowitsch {
3457679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3458679944adSJunchao Zhang   PetscScalar a;
3459679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3460679944adSJunchao Zhang 
3461679944adSJunchao Zhang   PetscFunctionBegin;
3462679944adSJunchao Zhang   nskip = high - low;
34639566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3464679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3465679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3466679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
34679566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3468679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3469679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
34709566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3471679944adSJunchao Zhang     }
3472e2ce353bSJunchao Zhang   }
34739566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34749566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34753ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3476679944adSJunchao Zhang }
3477679944adSJunchao Zhang 
34780a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3479cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3480cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3481cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
348297304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34837c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34847c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3485f4259b30SLisandro Dalcin                                        NULL,
3486f4259b30SLisandro Dalcin                                        NULL,
3487f4259b30SLisandro Dalcin                                        NULL,
3488f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3489cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3490f4259b30SLisandro Dalcin                                        NULL,
349141f059aeSBarry Smith                                        MatSOR_SeqAIJ,
349291e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
349397304618SKris Buschelman                                        /*1 5*/ MatGetInfo_SeqAIJ,
3494cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3495cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3496cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3497cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3498f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3499cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3500cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3501cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3502d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3503f4259b30SLisandro Dalcin                                        NULL,
3504f4259b30SLisandro Dalcin                                        NULL,
3505f4259b30SLisandro Dalcin                                        NULL,
3506f4259b30SLisandro Dalcin                                        NULL,
350726cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
3508f4259b30SLisandro Dalcin                                        NULL,
3509f4259b30SLisandro Dalcin                                        NULL,
3510f4259b30SLisandro Dalcin                                        NULL,
3511f4259b30SLisandro Dalcin                                        NULL,
3512d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3513f4259b30SLisandro Dalcin                                        NULL,
3514f4259b30SLisandro Dalcin                                        NULL,
3515cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3516f4259b30SLisandro Dalcin                                        NULL,
3517d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
35187dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3519cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3520cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3521cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3522d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3523cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
35247d68702bSBarry Smith                                        MatShift_SeqAIJ,
352579299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
35266e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
352773a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
35283b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
35293b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
35303b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3531a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
353293dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3533f4259b30SLisandro Dalcin                                        NULL,
3534f4259b30SLisandro Dalcin                                        NULL,
3535cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3536f4259b30SLisandro Dalcin                                        NULL,
3537f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3538b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3539b9b97703SBarry Smith                                        MatView_SeqAIJ,
3540f4259b30SLisandro Dalcin                                        NULL,
3541f4259b30SLisandro Dalcin                                        NULL,
3542f4259b30SLisandro Dalcin                                        /* 64*/ NULL,
3543321b30b9SSatish Balay                                        MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3544f4259b30SLisandro Dalcin                                        NULL,
3545f4259b30SLisandro Dalcin                                        NULL,
3546f4259b30SLisandro Dalcin                                        NULL,
3547d519adbfSMatthew Knepley                                        /* 69*/ MatGetRowMaxAbs_SeqAIJ,
3548c87e5d42SMatthew Knepley                                        MatGetRowMinAbs_SeqAIJ,
3549f4259b30SLisandro Dalcin                                        NULL,
3550f4259b30SLisandro Dalcin                                        NULL,
3551f4259b30SLisandro Dalcin                                        NULL,
3552f4259b30SLisandro Dalcin                                        /* 74*/ NULL,
35533acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3554f4259b30SLisandro Dalcin                                        NULL,
3555f4259b30SLisandro Dalcin                                        NULL,
3556f4259b30SLisandro Dalcin                                        NULL,
35576ce1633cSBarry Smith                                        /* 79*/ MatFindZeroDiagonals_SeqAIJ,
3558f4259b30SLisandro Dalcin                                        NULL,
3559f4259b30SLisandro Dalcin                                        NULL,
3560f4259b30SLisandro Dalcin                                        NULL,
3561bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
35626cff0a6bSPierre Jolivet                                        /* 84*/ NULL,
35636cff0a6bSPierre Jolivet                                        NULL,
3564f4259b30SLisandro Dalcin                                        NULL,
3565f4259b30SLisandro Dalcin                                        NULL,
3566f4259b30SLisandro Dalcin                                        NULL,
3567f4259b30SLisandro Dalcin                                        /* 89*/ NULL,
3568f4259b30SLisandro Dalcin                                        NULL,
356926be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
3570f4259b30SLisandro Dalcin                                        NULL,
3571f4259b30SLisandro Dalcin                                        NULL,
35728fa4b5a6SHong Zhang                                        /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3573f4259b30SLisandro Dalcin                                        NULL,
3574f4259b30SLisandro Dalcin                                        NULL,
35756fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
3576f4259b30SLisandro Dalcin                                        NULL,
35774222ddf1SHong Zhang                                        /* 99*/ MatProductSetFromOptions_SeqAIJ,
3578f4259b30SLisandro Dalcin                                        NULL,
3579f4259b30SLisandro Dalcin                                        NULL,
358087d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
3581f4259b30SLisandro Dalcin                                        NULL,
3582d519adbfSMatthew Knepley                                        /*104*/ MatSetValuesRow_SeqAIJ,
358399cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3584f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3585f4259b30SLisandro Dalcin                                        NULL,
3586f4259b30SLisandro Dalcin                                        NULL,
3587cbd44569SHong Zhang                                        /*109*/ MatMatSolve_SeqAIJ,
3588f4259b30SLisandro Dalcin                                        NULL,
35892af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3590f4259b30SLisandro Dalcin                                        NULL,
3591599ef60dSHong Zhang                                        MatMissingDiagonal_SeqAIJ,
3592f4259b30SLisandro Dalcin                                        /*114*/ NULL,
3593f4259b30SLisandro Dalcin                                        NULL,
3594f4259b30SLisandro Dalcin                                        NULL,
3595f4259b30SLisandro Dalcin                                        NULL,
3596f4259b30SLisandro Dalcin                                        NULL,
3597f4259b30SLisandro Dalcin                                        /*119*/ NULL,
3598f4259b30SLisandro Dalcin                                        NULL,
3599f4259b30SLisandro Dalcin                                        NULL,
3600f4259b30SLisandro Dalcin                                        NULL,
3601b3a44c85SBarry Smith                                        MatGetMultiProcBlock_SeqAIJ,
36020716a85fSBarry Smith                                        /*124*/ MatFindNonzeroRows_SeqAIJ,
3603a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
360437868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
36050da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
3606f4259b30SLisandro Dalcin                                        NULL,
3607f4259b30SLisandro Dalcin                                        /*129*/ NULL,
3608f4259b30SLisandro Dalcin                                        NULL,
3609f4259b30SLisandro Dalcin                                        NULL,
361075648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3611b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
3612b9af6bddSHong Zhang                                        /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
36132b8ad9a3SHong Zhang                                        MatTransColoringApplyDenToSp_SeqAIJ,
3614f4259b30SLisandro Dalcin                                        NULL,
3615f4259b30SLisandro Dalcin                                        NULL,
36163964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
3617f4259b30SLisandro Dalcin                                        /*139*/ NULL,
3618f4259b30SLisandro Dalcin                                        NULL,
3619f4259b30SLisandro Dalcin                                        NULL,
36203a062f41SBarry Smith                                        MatFDColoringSetUp_SeqXAIJ,
36219c8f2541SHong Zhang                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
36224222ddf1SHong Zhang                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
36234222ddf1SHong Zhang                                        /*145*/ MatDestroySubMatrices_SeqAIJ,
3624f4259b30SLisandro Dalcin                                        NULL,
362572833a62Smarkadams4                                        NULL,
362672833a62Smarkadams4                                        MatCreateGraph_Simple_AIJ,
36272d776b49SBarry Smith                                        NULL,
3628dec0b466SHong Zhang                                        /*150*/ MatTransposeSymbolic_SeqAIJ,
3629eede4a3fSMark Adams                                        MatEliminateZeros_SeqAIJ,
36304cc2b5b5SPierre Jolivet                                        MatGetRowSumAbs_SeqAIJ,
363142ce410bSJunchao Zhang                                        NULL,
363242ce410bSJunchao Zhang                                        NULL,
36334cc2b5b5SPierre Jolivet                                        NULL};
363417ab2063SBarry Smith 
3635ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3636d71ae5a4SJacob Faibussowitsch {
3637bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
363897f1f81fSBarry Smith   PetscInt    i, nz, n;
3639bef8e0ddSBarry Smith 
3640bef8e0ddSBarry Smith   PetscFunctionBegin;
3641bef8e0ddSBarry Smith   nz = aij->maxnz;
3642d0f46423SBarry Smith   n  = mat->rmap->n;
3643ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3644bef8e0ddSBarry Smith   aij->nz = nz;
3645ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
36463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3647bef8e0ddSBarry Smith }
3648bef8e0ddSBarry Smith 
3649a3bb6f32SFande Kong /*
3650ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3651ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3652ddea5d60SJunchao Zhang  */
3653d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3654d71ae5a4SJacob Faibussowitsch {
3655a3bb6f32SFande Kong   Mat_SeqAIJ   *aij = (Mat_SeqAIJ *)mat->data;
3656eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1;
3657eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
365825b670f0SStefano Zampini   PetscInt      gid, lid, i, ec, nz = aij->nz;
365925b670f0SStefano Zampini   PetscInt     *garray, *jj = aij->j;
3660a3bb6f32SFande Kong 
3661a3bb6f32SFande Kong   PetscFunctionBegin;
3662a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
36634f572ea9SToby Isaac   PetscAssertPointer(mapping, 2);
3664a3bb6f32SFande Kong   /* use a table */
3665eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1));
3666a3bb6f32SFande Kong   ec = 0;
366725b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
366825b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
3669eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
3670a3bb6f32SFande Kong     if (!data) {
3671a3bb6f32SFande Kong       /* one based table */
3672c76ffc5fSJacob Faibussowitsch       PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec));
3673a3bb6f32SFande Kong     }
3674a3bb6f32SFande Kong   }
3675a3bb6f32SFande Kong   /* form array of columns we need */
36769566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
3677eec179cfSJacob Faibussowitsch   PetscHashIterBegin(gid1_lid1, tpos);
3678eec179cfSJacob Faibussowitsch   while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
3679eec179cfSJacob Faibussowitsch     PetscHashIterGetKey(gid1_lid1, tpos, gid);
3680eec179cfSJacob Faibussowitsch     PetscHashIterGetVal(gid1_lid1, tpos, lid);
3681eec179cfSJacob Faibussowitsch     PetscHashIterNext(gid1_lid1, tpos);
3682a3bb6f32SFande Kong     gid--;
3683a3bb6f32SFande Kong     lid--;
3684a3bb6f32SFande Kong     garray[lid] = gid;
3685a3bb6f32SFande Kong   }
36869566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
3687eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIClear(gid1_lid1));
3688c76ffc5fSJacob Faibussowitsch   for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1));
3689a3bb6f32SFande Kong   /* compact out the extra columns in B */
369025b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
369125b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
3692eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
3693a3bb6f32SFande Kong     lid--;
369425b670f0SStefano Zampini     jj[i] = lid;
3695a3bb6f32SFande Kong   }
36969566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
3697eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&gid1_lid1));
36989566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
36999566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
37009566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
37013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3702a3bb6f32SFande Kong }
3703a3bb6f32SFande Kong 
3704bef8e0ddSBarry Smith /*@
3705bef8e0ddSBarry Smith   MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3706bef8e0ddSBarry Smith   in the matrix.
3707bef8e0ddSBarry Smith 
3708bef8e0ddSBarry Smith   Input Parameters:
370911a5261eSBarry Smith + mat     - the `MATSEQAIJ` matrix
3710bef8e0ddSBarry Smith - indices - the column indices
3711bef8e0ddSBarry Smith 
371215091d37SBarry Smith   Level: advanced
371315091d37SBarry Smith 
3714bef8e0ddSBarry Smith   Notes:
3715bef8e0ddSBarry Smith   This can be called if you have precomputed the nonzero structure of the
3716bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
371711a5261eSBarry Smith   of the `MatSetValues()` operation.
3718bef8e0ddSBarry Smith 
3719bef8e0ddSBarry Smith   You MUST have set the correct numbers of nonzeros per row in the call to
372011a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the columns indices MUST be sorted.
3721bef8e0ddSBarry Smith 
372211a5261eSBarry Smith   MUST be called before any calls to `MatSetValues()`
3723bef8e0ddSBarry Smith 
3724b9617806SBarry Smith   The indices should start with zero, not one.
3725b9617806SBarry Smith 
37261cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
3727bef8e0ddSBarry Smith @*/
3728d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3729d71ae5a4SJacob Faibussowitsch {
3730bef8e0ddSBarry Smith   PetscFunctionBegin;
37310700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
37324f572ea9SToby Isaac   PetscAssertPointer(indices, 2);
3733cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
37343ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3735bef8e0ddSBarry Smith }
3736bef8e0ddSBarry Smith 
3737ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3738d71ae5a4SJacob Faibussowitsch {
3739be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3740d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3741be6bf707SBarry Smith 
3742be6bf707SBarry Smith   PetscFunctionBegin;
374328b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3744be6bf707SBarry Smith 
3745be6bf707SBarry Smith   /* allocate space for values if not already there */
37464dfa11a4SJacob Faibussowitsch   if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }
3747be6bf707SBarry Smith 
3748be6bf707SBarry Smith   /* copy values over */
37499566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
37503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3751be6bf707SBarry Smith }
3752be6bf707SBarry Smith 
3753be6bf707SBarry Smith /*@
375420f4b53cSBarry Smith   MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
3755be6bf707SBarry Smith   nonlinear portion.
3756be6bf707SBarry Smith 
3757c3339decSBarry Smith   Logically Collect
3758be6bf707SBarry Smith 
375927430b45SBarry Smith   Input Parameter:
376011a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3761be6bf707SBarry Smith 
376215091d37SBarry Smith   Level: advanced
376315091d37SBarry Smith 
37642920cce0SJacob Faibussowitsch   Example Usage:
376527430b45SBarry Smith .vb
37662ef1f0ffSBarry Smith     Using SNES
376727430b45SBarry Smith     Create Jacobian matrix
376827430b45SBarry Smith     Set linear terms into matrix
376927430b45SBarry Smith     Apply boundary conditions to matrix, at this time matrix must have
377027430b45SBarry Smith       final nonzero structure (i.e. setting the nonlinear terms and applying
377127430b45SBarry Smith       boundary conditions again will not change the nonzero structure
377227430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
377327430b45SBarry Smith     MatStoreValues(mat);
377427430b45SBarry Smith     Call SNESSetJacobian() with matrix
377527430b45SBarry Smith     In your Jacobian routine
377627430b45SBarry Smith       MatRetrieveValues(mat);
377727430b45SBarry Smith       Set nonlinear terms in matrix
3778be6bf707SBarry Smith 
377927430b45SBarry Smith     Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
378027430b45SBarry Smith     // build linear portion of Jacobian
378127430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
378227430b45SBarry Smith     MatStoreValues(mat);
378327430b45SBarry Smith     loop over nonlinear iterations
378427430b45SBarry Smith        MatRetrieveValues(mat);
378527430b45SBarry Smith        // call MatSetValues(mat,...) to set nonliner portion of Jacobian
378627430b45SBarry Smith        // call MatAssemblyBegin/End() on matrix
378727430b45SBarry Smith        Solve linear system with Jacobian
378827430b45SBarry Smith     endloop
378927430b45SBarry Smith .ve
3790be6bf707SBarry Smith 
3791be6bf707SBarry Smith   Notes:
3792da81f932SPierre Jolivet   Matrix must already be assembled before calling this routine
379311a5261eSBarry Smith   Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3794be6bf707SBarry Smith   calling this routine.
3795be6bf707SBarry Smith 
37960c468ba9SBarry Smith   When this is called multiple times it overwrites the previous set of stored values
37970c468ba9SBarry Smith   and does not allocated additional space.
37980c468ba9SBarry Smith 
3799fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
3800be6bf707SBarry Smith @*/
3801d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3802d71ae5a4SJacob Faibussowitsch {
3803be6bf707SBarry Smith   PetscFunctionBegin;
38040700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
380528b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
380628b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3807cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
38083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3809be6bf707SBarry Smith }
3810be6bf707SBarry Smith 
3811ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3812d71ae5a4SJacob Faibussowitsch {
3813be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3814d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3815be6bf707SBarry Smith 
3816be6bf707SBarry Smith   PetscFunctionBegin;
381728b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
381828b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3819be6bf707SBarry Smith   /* copy values over */
38209566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
38213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3822be6bf707SBarry Smith }
3823be6bf707SBarry Smith 
3824be6bf707SBarry Smith /*@
382520f4b53cSBarry Smith   MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`
3826be6bf707SBarry Smith 
3827c3339decSBarry Smith   Logically Collect
3828be6bf707SBarry Smith 
38292fe279fdSBarry Smith   Input Parameter:
383011a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3831be6bf707SBarry Smith 
383215091d37SBarry Smith   Level: advanced
383315091d37SBarry Smith 
38341cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
3835be6bf707SBarry Smith @*/
3836d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3837d71ae5a4SJacob Faibussowitsch {
3838be6bf707SBarry Smith   PetscFunctionBegin;
38390700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
384028b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
384128b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3842cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
38433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3844be6bf707SBarry Smith }
3845be6bf707SBarry Smith 
38465d83a8b1SBarry Smith /*@
384711a5261eSBarry Smith   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
38480d15e28bSLois Curfman McInnes   (the default parallel PETSc format).  For good matrix assembly performance
384920f4b53cSBarry Smith   the user should preallocate the matrix storage by setting the parameter `nz`
385020f4b53cSBarry Smith   (or the array `nnz`).
385117ab2063SBarry Smith 
3852d083f849SBarry Smith   Collective
3853db81eaa0SLois Curfman McInnes 
385417ab2063SBarry Smith   Input Parameters:
385511a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF`
385617ab2063SBarry Smith . m    - number of rows
385717ab2063SBarry Smith . n    - number of columns
385817ab2063SBarry Smith . nz   - number of nonzeros per row (same for all rows)
385951c19458SBarry Smith - nnz  - array containing the number of nonzeros in the various rows
38600298fd71SBarry Smith          (possibly different for each row) or NULL
386117ab2063SBarry Smith 
386217ab2063SBarry Smith   Output Parameter:
3863416022c9SBarry Smith . A - the matrix
386417ab2063SBarry Smith 
38652ef1f0ffSBarry Smith   Options Database Keys:
38662ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
38672ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38682ef1f0ffSBarry Smith 
38692ef1f0ffSBarry Smith   Level: intermediate
3870175b88e8SBarry Smith 
3871b259b22eSLois Curfman McInnes   Notes:
387277433607SBarry Smith   It is recommend to use `MatCreateFromOptions()` instead of this routine
387377433607SBarry Smith 
38742ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
387549a6f317SBarry Smith 
38762ef1f0ffSBarry Smith   The `MATSEQAIJ` format, also called
38772ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
38780002213bSLois Curfman McInnes   storage.  That is, the stored row and column indices can begin at
38792ef1f0ffSBarry Smith   either one (as in Fortran) or zero.
388017ab2063SBarry Smith 
388120f4b53cSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
38822ef1f0ffSBarry Smith   Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
388320f4b53cSBarry Smith   allocation.
388417ab2063SBarry Smith 
3885682d7d0cSBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
38864fca80b9SLois Curfman McInnes   improve numerical efficiency of matrix-vector products and solves. We
3887682d7d0cSBarry Smith   search for consecutive rows with the same nonzero structure, thereby
38886c7ebb05SLois Curfman McInnes   reusing matrix information to achieve increased efficiency.
38896c7ebb05SLois Curfman McInnes 
38901cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
389117ab2063SBarry Smith @*/
3892d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3893d71ae5a4SJacob Faibussowitsch {
38943a40ed3dSBarry Smith   PetscFunctionBegin;
38959566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
38969566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
38979566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
38989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
38993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3900273d9f13SBarry Smith }
3901273d9f13SBarry Smith 
39025d83a8b1SBarry Smith /*@
3903273d9f13SBarry Smith   MatSeqAIJSetPreallocation - For good matrix assembly performance
3904273d9f13SBarry Smith   the user should preallocate the matrix storage by setting the parameter nz
3905273d9f13SBarry Smith   (or the array nnz).  By setting these parameters accurately, performance
3906273d9f13SBarry Smith   during matrix assembly can be increased by more than a factor of 50.
3907273d9f13SBarry Smith 
3908d083f849SBarry Smith   Collective
3909273d9f13SBarry Smith 
3910273d9f13SBarry Smith   Input Parameters:
39111c4f3114SJed Brown + B   - The matrix
3912273d9f13SBarry Smith . nz  - number of nonzeros per row (same for all rows)
3913273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows
39140298fd71SBarry Smith          (possibly different for each row) or NULL
3915273d9f13SBarry Smith 
39162ef1f0ffSBarry Smith   Options Database Keys:
39172ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
39182ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
39192ef1f0ffSBarry Smith 
39202ef1f0ffSBarry Smith   Level: intermediate
39212ef1f0ffSBarry Smith 
3922273d9f13SBarry Smith   Notes:
39232ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
392449a6f317SBarry Smith 
392511a5261eSBarry Smith   The `MATSEQAIJ` format also called
39262ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
3927273d9f13SBarry Smith   storage.  That is, the stored row and column indices can begin at
3928273d9f13SBarry Smith   either one (as in Fortran) or zero.  See the users' manual for details.
3929273d9f13SBarry Smith 
39302ef1f0ffSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
39312ef1f0ffSBarry Smith   Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
39322ef1f0ffSBarry Smith   allocation.
3933273d9f13SBarry Smith 
393411a5261eSBarry Smith   You can call `MatGetInfo()` to get information on how effective the preallocation was;
3935aa95bbe8SBarry Smith   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3936aa95bbe8SBarry Smith   You can also run with the option -info and look for messages with the string
3937aa95bbe8SBarry Smith   malloc in them to see if additional memory allocation was needed.
3938aa95bbe8SBarry Smith 
393911a5261eSBarry Smith   Developer Notes:
394011a5261eSBarry Smith   Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3941a96a251dSBarry Smith   entries or columns indices
3942a96a251dSBarry Smith 
3943273d9f13SBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
3944273d9f13SBarry Smith   improve numerical efficiency of matrix-vector products and solves. We
3945273d9f13SBarry Smith   search for consecutive rows with the same nonzero structure, thereby
3946273d9f13SBarry Smith   reusing matrix information to achieve increased efficiency.
3947273d9f13SBarry Smith 
39481cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3949db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3950273d9f13SBarry Smith @*/
3951d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3952d71ae5a4SJacob Faibussowitsch {
3953a23d5eceSKris Buschelman   PetscFunctionBegin;
39546ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
39556ba663aaSJed Brown   PetscValidType(B, 1);
3956cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
39573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3958a23d5eceSKris Buschelman }
3959a23d5eceSKris Buschelman 
3960d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3961d71ae5a4SJacob Faibussowitsch {
3962ad79cf63SBarry Smith   Mat_SeqAIJ *b              = (Mat_SeqAIJ *)B->data;
39632576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
396497f1f81fSBarry Smith   PetscInt    i;
3965273d9f13SBarry Smith 
3966273d9f13SBarry Smith   PetscFunctionBegin;
3967ad79cf63SBarry Smith   if (B->hash_active) {
3968aea10558SJacob Faibussowitsch     B->ops[0] = b->cops;
3969ad79cf63SBarry Smith     PetscCall(PetscHMapIJVDestroy(&b->ht));
3970ad79cf63SBarry Smith     PetscCall(PetscFree(b->dnz));
3971ad79cf63SBarry Smith     B->hash_active = PETSC_FALSE;
3972ad79cf63SBarry Smith   }
39732576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3974a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3975c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3976c461c341SBarry Smith     nz             = 0;
3977c461c341SBarry Smith   }
39789566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
39799566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3980899cda47SBarry Smith 
3981435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
398208401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
39839f0612e4SBarry Smith   if (nnz) {
3984d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
398508401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
398608401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3987b73539f3SBarry Smith     }
3988b73539f3SBarry Smith   }
3989b73539f3SBarry Smith 
3990273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
3991ab93d7beSBarry Smith   if (!skipallocation) {
39924dfa11a4SJacob Faibussowitsch     if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); }
3993071fcb05SBarry Smith     if (!b->ilen) {
3994071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
39959566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
3996071fcb05SBarry Smith     } else {
39979566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
39982ee49352SLisandro Dalcin     }
3999aa624791SPierre Jolivet     if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre));
4000273d9f13SBarry Smith     if (!nnz) {
4001435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
4002c62bd62aSJed Brown       else if (nz < 0) nz = 1;
40035d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
4004d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
4005c43c4a61SBarry Smith       PetscCall(PetscIntMultError(nz, B->rmap->n, &nz));
4006273d9f13SBarry Smith     } else {
4007c73702f5SBarry Smith       PetscInt64 nz64 = 0;
40089371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
40099371c9d4SSatish Balay         b->imax[i] = nnz[i];
40109371c9d4SSatish Balay         nz64 += nnz[i];
40119371c9d4SSatish Balay       }
40129566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
4013273d9f13SBarry Smith     }
4014ab93d7beSBarry Smith 
4015273d9f13SBarry Smith     /* allocate the matrix space */
40169566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
40179f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j));
40189f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i));
40199f0612e4SBarry Smith     b->free_ij = PETSC_TRUE;
4020396832f4SHong Zhang     if (B->structure_only) {
40219f0612e4SBarry Smith       b->free_a = PETSC_FALSE;
4022396832f4SHong Zhang     } else {
40239f0612e4SBarry Smith       PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a));
40249f0612e4SBarry Smith       b->free_a = PETSC_TRUE;
4025396832f4SHong Zhang     }
4026bfeeae90SHong Zhang     b->i[0] = 0;
4027ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
4028c461c341SBarry Smith   } else {
4029e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
4030e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
4031c461c341SBarry Smith   }
4032273d9f13SBarry Smith 
4033846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
4034846b4da1SFande Kong     /* reserve user-requested sparsity */
40359566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
4036846b4da1SFande Kong   }
4037846b4da1SFande Kong 
4038273d9f13SBarry Smith   b->nz               = 0;
4039273d9f13SBarry Smith   b->maxnz            = nz;
4040273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
40411baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
4042cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
4043cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
40445519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
40455519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
40465519a089SJose E. Roman   */
40475519a089SJose E. Roman   B->nonzerostate++;
40483ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4049273d9f13SBarry Smith }
4050273d9f13SBarry Smith 
4051ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
4052d71ae5a4SJacob Faibussowitsch {
4053846b4da1SFande Kong   Mat_SeqAIJ *a;
4054a5bbaf83SFande Kong   PetscInt    i;
40551f14be2bSBarry Smith   PetscBool   skipreset;
4056846b4da1SFande Kong 
4057846b4da1SFande Kong   PetscFunctionBegin;
4058846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
405914d0e64fSAlex Lindsay 
406014d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
40613ba16761SJacob Faibussowitsch   if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS);
406214d0e64fSAlex Lindsay 
4063846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
40642c814fdeSFande Kong   /* if no saved info, we error out */
406528b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
40662c814fdeSFande Kong 
40671f14be2bSBarry Smith   PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation ");
40682c814fdeSFande Kong 
40691f14be2bSBarry Smith   PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset));
40701f14be2bSBarry Smith   if (!skipreset) {
40719566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
40729566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
4073846b4da1SFande Kong     a->i[0] = 0;
4074ad540459SPierre Jolivet     for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
4075846b4da1SFande Kong     A->preallocated     = PETSC_TRUE;
4076846b4da1SFande Kong     a->nz               = 0;
4077846b4da1SFande Kong     a->maxnz            = a->i[A->rmap->n];
4078846b4da1SFande Kong     A->info.nz_unneeded = (double)a->maxnz;
4079846b4da1SFande Kong     A->was_assembled    = PETSC_FALSE;
4080846b4da1SFande Kong     A->assembled        = PETSC_FALSE;
40811f14be2bSBarry Smith   }
40823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4083846b4da1SFande Kong }
4084846b4da1SFande Kong 
408558d36128SBarry Smith /*@
408611a5261eSBarry Smith   MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4087a1661176SMatthew Knepley 
4088a1661176SMatthew Knepley   Input Parameters:
4089a1661176SMatthew Knepley + B - the matrix
4090d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero)
4091d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row
4092d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided
4093a1661176SMatthew Knepley 
4094a1661176SMatthew Knepley   Level: developer
4095a1661176SMatthew Knepley 
40966a9b8d82SBarry Smith   Notes:
40972ef1f0ffSBarry Smith   The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
409858d36128SBarry Smith 
40996a9b8d82SBarry Smith   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
41006a9b8d82SBarry Smith   structure will be the union of all the previous nonzero structures.
41016a9b8d82SBarry Smith 
41026a9b8d82SBarry Smith   Developer Notes:
41032ef1f0ffSBarry Smith   An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and
41042ef1f0ffSBarry Smith   then just copies the `v` values directly with `PetscMemcpy()`.
41056a9b8d82SBarry Smith 
410611a5261eSBarry Smith   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
41076a9b8d82SBarry Smith 
4108fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()`
4109a1661176SMatthew Knepley @*/
4110d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4111d71ae5a4SJacob Faibussowitsch {
4112a1661176SMatthew Knepley   PetscFunctionBegin;
41130700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
41146ba663aaSJed Brown   PetscValidType(B, 1);
4115cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
41163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4117a1661176SMatthew Knepley }
4118a1661176SMatthew Knepley 
4119ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4120d71ae5a4SJacob Faibussowitsch {
4121a1661176SMatthew Knepley   PetscInt  i;
4122a1661176SMatthew Knepley   PetscInt  m, n;
4123a1661176SMatthew Knepley   PetscInt  nz;
41246a9b8d82SBarry Smith   PetscInt *nnz;
4125a1661176SMatthew Knepley 
4126a1661176SMatthew Knepley   PetscFunctionBegin;
4127aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4128779a8d59SSatish Balay 
41299566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
41309566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4131779a8d59SSatish Balay 
41329566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
41339566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4134a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4135b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
413608401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4137a1661176SMatthew Knepley     nnz[i] = nz;
4138a1661176SMatthew Knepley   }
41399566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
41409566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4141a1661176SMatthew Knepley 
41428e3a54c0SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES));
4143a1661176SMatthew Knepley 
41449566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
41459566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4146a1661176SMatthew Knepley 
41479566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
41483ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4149a1661176SMatthew Knepley }
4150a1661176SMatthew Knepley 
4151ad7e164aSPierre Jolivet /*@
41522ef1f0ffSBarry Smith   MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`.
4153ad7e164aSPierre Jolivet 
4154ad7e164aSPierre Jolivet   Input Parameters:
4155ad7e164aSPierre Jolivet + A     - left-hand side matrix
4156ad7e164aSPierre Jolivet . B     - right-hand side matrix
415711a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4158ad7e164aSPierre Jolivet 
4159ad7e164aSPierre Jolivet   Output Parameter:
41602ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B`
4161ad7e164aSPierre Jolivet 
4162ad7e164aSPierre Jolivet   Level: intermediate
4163ad7e164aSPierre Jolivet 
416411a5261eSBarry Smith   Note:
  `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed since the last call to `MatSeqAIJKron()`.
4166ad7e164aSPierre Jolivet 
41671cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4168ad7e164aSPierre Jolivet @*/
4169d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4170d71ae5a4SJacob Faibussowitsch {
4171ad7e164aSPierre Jolivet   PetscFunctionBegin;
4172ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4173ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4174ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4175ad7e164aSPierre Jolivet   PetscValidType(B, 2);
41764f572ea9SToby Isaac   PetscAssertPointer(C, 4);
4177ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4178ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4179ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4180ad7e164aSPierre Jolivet   }
4181cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
41823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4183ad7e164aSPierre Jolivet }
4184ad7e164aSPierre Jolivet 
4185ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4186d71ae5a4SJacob Faibussowitsch {
4187ad7e164aSPierre Jolivet   Mat                newmat;
4188ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4189ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4190ad7e164aSPierre Jolivet   PetscScalar       *v;
4191fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4192ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4193ad7e164aSPierre Jolivet   PetscBool          flg;
4194ad7e164aSPierre Jolivet 
4195ad7e164aSPierre Jolivet   PetscFunctionBegin;
419628b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
419728b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
419828b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
419928b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
42009566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
420128b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4202aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4203ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
42049566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
42059566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
42069566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
42079566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4208ad7e164aSPierre Jolivet     i[0] = 0;
4209ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4210ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4211ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4212ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4213ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4214ad7e164aSPierre Jolivet         }
4215ad7e164aSPierre Jolivet       }
4216ad7e164aSPierre Jolivet     }
42179566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4218ad7e164aSPierre Jolivet     *C = newmat;
42199566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4220ad7e164aSPierre Jolivet     nnz = 0;
4221ad7e164aSPierre Jolivet   }
42229566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
42239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
42249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4225ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4226ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4227ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4228ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4229ad7e164aSPierre Jolivet       }
4230ad7e164aSPierre Jolivet     }
4231ad7e164aSPierre Jolivet   }
42329566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
42339566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
42349566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
42353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4236ad7e164aSPierre Jolivet }
4237ad7e164aSPierre Jolivet 
4238c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4239af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4240170fe5c8SBarry Smith 
4241170fe5c8SBarry Smith /*
4242170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4243170fe5c8SBarry Smith 
4244170fe5c8SBarry Smith                n                       p                          p
42452da392ccSBarry Smith         [             ]       [             ]         [                 ]
42462da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
42472da392ccSBarry Smith         [             ]       [             ]         [                 ]
4248170fe5c8SBarry Smith 
4249170fe5c8SBarry Smith */
4250d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4251d71ae5a4SJacob Faibussowitsch {
4252170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4253170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4254170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
425586214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4256170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4257170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4258170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
425986214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
426086214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4261170fe5c8SBarry Smith 
4262170fe5c8SBarry Smith   PetscFunctionBegin;
4263d0f46423SBarry Smith   m = A->rmap->n;
4264d0f46423SBarry Smith   n = A->cmap->n;
4265d0f46423SBarry Smith   p = B->cmap->n;
4266170fe5c8SBarry Smith   a = sub_a->v;
4267170fe5c8SBarry Smith   b = sub_b->a;
4268170fe5c8SBarry Smith   c = sub_c->v;
426986214ceeSStefano Zampini   if (clda == m) {
42709566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
427186214ceeSStefano Zampini   } else {
427286214ceeSStefano Zampini     for (j = 0; j < p; j++)
42739371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
427486214ceeSStefano Zampini   }
4275170fe5c8SBarry Smith   ii  = sub_b->i;
4276170fe5c8SBarry Smith   idx = sub_b->j;
4277170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4278170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4279170fe5c8SBarry Smith     while (q-- > 0) {
428086214ceeSStefano Zampini       c_q = c + clda * (*idx);
428186214ceeSStefano Zampini       a_q = a + alda * i;
4282854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4283170fe5c8SBarry Smith       idx++;
4284170fe5c8SBarry Smith       b++;
4285170fe5c8SBarry Smith     }
4286170fe5c8SBarry Smith   }
42873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4288170fe5c8SBarry Smith }
4289170fe5c8SBarry Smith 
4290d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4291d71ae5a4SJacob Faibussowitsch {
4292d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
429386214ceeSStefano Zampini   PetscBool cisdense;
4294170fe5c8SBarry Smith 
4295170fe5c8SBarry Smith   PetscFunctionBegin;
429608401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
42979566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
42989566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
4299d5e393b6SSuyash Tandon   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, ""));
430048a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
43019566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4302d73949e8SHong Zhang 
43034222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
43043ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4305170fe5c8SBarry Smith }
4306170fe5c8SBarry Smith 
43070bad9183SKris Buschelman /*MC
4308fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
43090bad9183SKris Buschelman    based on compressed sparse row format.
43100bad9183SKris Buschelman 
43112ef1f0ffSBarry Smith    Options Database Key:
43120bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
43130bad9183SKris Buschelman 
43140bad9183SKris Buschelman    Level: beginner
43150bad9183SKris Buschelman 
43160cd7f59aSBarry Smith    Notes:
43172ef1f0ffSBarry Smith     `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values,
43180cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
43190cd7f59aSBarry Smith     in the matrix
43200cd7f59aSBarry Smith 
    `MatSetOption()`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this case no
432211a5261eSBarry Smith     space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored
43230cd7f59aSBarry Smith 
432411a5261eSBarry Smith   Developer Note:
43252ef1f0ffSBarry Smith     It would be nice if all matrix formats supported passing `NULL` in for the numerical values
43260cd7f59aSBarry Smith 
43271cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
43280bad9183SKris Buschelman M*/
43290bad9183SKris Buschelman 
4330ccd284c7SBarry Smith /*MC
4331ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4332ccd284c7SBarry Smith 
433311a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
433411a5261eSBarry Smith    and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
433511a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4336ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4337ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4338ccd284c7SBarry Smith 
43392ef1f0ffSBarry Smith    Options Database Key:
434011a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`
4341ccd284c7SBarry Smith 
43422ef1f0ffSBarry Smith   Level: beginner
43432ef1f0ffSBarry Smith 
434411a5261eSBarry Smith    Note:
434511a5261eSBarry Smith    Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when
4346ccd284c7SBarry Smith    enough exist.
4347ccd284c7SBarry Smith 
43481cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
4349ccd284c7SBarry Smith M*/
4350ccd284c7SBarry Smith 
4351ccd284c7SBarry Smith /*MC
4352ccd284c7SBarry Smith    MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.
4353ccd284c7SBarry Smith 
43542ef1f0ffSBarry Smith    Options Database Key:
43552ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`
43562ef1f0ffSBarry Smith 
43572ef1f0ffSBarry Smith   Level: beginner
43582ef1f0ffSBarry Smith 
43592ef1f0ffSBarry Smith    Note:
436011a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
436111a5261eSBarry Smith    and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
436211a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4363ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4364ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4365ccd284c7SBarry Smith 
.seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
4367ccd284c7SBarry Smith M*/
4368ccd284c7SBarry Smith 
43697906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
43707906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
43717906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
43727906f579SHong Zhang #endif
4373d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
4374d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4375d24d4204SJose E. Roman #endif
43767906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
43777906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
43787906f579SHong Zhang #endif
43797906f579SHong Zhang 
4380d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4381c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
43824222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
43837906f579SHong Zhang 
43848c778c55SBarry Smith /*@C
438511a5261eSBarry Smith   MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
43868c778c55SBarry Smith 
43878c778c55SBarry Smith   Not Collective
43888c778c55SBarry Smith 
43898c778c55SBarry Smith   Input Parameter:
4390fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
43918c778c55SBarry Smith 
43928c778c55SBarry Smith   Output Parameter:
43938c778c55SBarry Smith . array - pointer to the data
43948c778c55SBarry Smith 
43958c778c55SBarry Smith   Level: intermediate
43968c778c55SBarry Smith 
4397fe59aa6dSJacob Faibussowitsch   Fortran Notes:
43980ab4885dSBarry Smith   `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()`
43990ab4885dSBarry Smith 
44001cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
44018c778c55SBarry Smith @*/
44025d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[])
4403d71ae5a4SJacob Faibussowitsch {
4404d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44058c778c55SBarry Smith 
44068c778c55SBarry Smith   PetscFunctionBegin;
4407d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
44089566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4409d67d9f35SJunchao Zhang   } else {
4410d67d9f35SJunchao Zhang     *array = aij->a;
4411d67d9f35SJunchao Zhang   }
44123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4413d67d9f35SJunchao Zhang }
4414d67d9f35SJunchao Zhang 
4415d67d9f35SJunchao Zhang /*@C
441611a5261eSBarry Smith   MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4417d67d9f35SJunchao Zhang 
4418d67d9f35SJunchao Zhang   Not Collective
4419d67d9f35SJunchao Zhang 
4420d67d9f35SJunchao Zhang   Input Parameters:
4421fe59aa6dSJacob Faibussowitsch + A     - a `MATSEQAIJ` matrix
4422d67d9f35SJunchao Zhang - array - pointer to the data
4423d67d9f35SJunchao Zhang 
4424d67d9f35SJunchao Zhang   Level: intermediate
4425d67d9f35SJunchao Zhang 
4426fe59aa6dSJacob Faibussowitsch   Fortran Notes:
44270ab4885dSBarry Smith   `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()`
44280ab4885dSBarry Smith 
44291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()`
4430d67d9f35SJunchao Zhang @*/
44315d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[])
4432d71ae5a4SJacob Faibussowitsch {
4433d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4434d67d9f35SJunchao Zhang 
4435d67d9f35SJunchao Zhang   PetscFunctionBegin;
4436d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
44379566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4438d67d9f35SJunchao Zhang   } else {
4439d67d9f35SJunchao Zhang     *array = NULL;
4440d67d9f35SJunchao Zhang   }
44419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
44429566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
44433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44448c778c55SBarry Smith }
44458c778c55SBarry Smith 
444621e72a00SBarry Smith /*@C
444711a5261eSBarry Smith   MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
44488f1ea47aSStefano Zampini 
44490ab4885dSBarry Smith   Not Collective; No Fortran Support
44508f1ea47aSStefano Zampini 
44518f1ea47aSStefano Zampini   Input Parameter:
4452fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44538f1ea47aSStefano Zampini 
44548f1ea47aSStefano Zampini   Output Parameter:
44558f1ea47aSStefano Zampini . array - pointer to the data
44568f1ea47aSStefano Zampini 
44578f1ea47aSStefano Zampini   Level: intermediate
44588f1ea47aSStefano Zampini 
44591cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
44608f1ea47aSStefano Zampini @*/
44615d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[])
4462d71ae5a4SJacob Faibussowitsch {
4463d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44648f1ea47aSStefano Zampini 
44658f1ea47aSStefano Zampini   PetscFunctionBegin;
4466d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
44679566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4468d67d9f35SJunchao Zhang   } else {
4469d67d9f35SJunchao Zhang     *array = aij->a;
4470d67d9f35SJunchao Zhang   }
44713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44728f1ea47aSStefano Zampini }
44738f1ea47aSStefano Zampini 
44748f1ea47aSStefano Zampini /*@C
447511a5261eSBarry Smith   MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
44768f1ea47aSStefano Zampini 
44770ab4885dSBarry Smith   Not Collective; No Fortran Support
44788f1ea47aSStefano Zampini 
44798f1ea47aSStefano Zampini   Input Parameter:
4480fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44818f1ea47aSStefano Zampini 
44828f1ea47aSStefano Zampini   Output Parameter:
44838f1ea47aSStefano Zampini . array - pointer to the data
44848f1ea47aSStefano Zampini 
44858f1ea47aSStefano Zampini   Level: intermediate
44868f1ea47aSStefano Zampini 
44871cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
44888f1ea47aSStefano Zampini @*/
44895d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[])
4490d71ae5a4SJacob Faibussowitsch {
4491d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44928f1ea47aSStefano Zampini 
44938f1ea47aSStefano Zampini   PetscFunctionBegin;
4494d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
44959566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4496d67d9f35SJunchao Zhang   } else {
4497d67d9f35SJunchao Zhang     *array = NULL;
4498d67d9f35SJunchao Zhang   }
44993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4500d67d9f35SJunchao Zhang }
4501d67d9f35SJunchao Zhang 
4502d67d9f35SJunchao Zhang /*@C
450311a5261eSBarry Smith   MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4504d67d9f35SJunchao Zhang 
45050ab4885dSBarry Smith   Not Collective; No Fortran Support
4506d67d9f35SJunchao Zhang 
4507d67d9f35SJunchao Zhang   Input Parameter:
4508fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
4509d67d9f35SJunchao Zhang 
4510d67d9f35SJunchao Zhang   Output Parameter:
4511d67d9f35SJunchao Zhang . array - pointer to the data
4512d67d9f35SJunchao Zhang 
4513d67d9f35SJunchao Zhang   Level: intermediate
4514d67d9f35SJunchao Zhang 
45151cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
4516d67d9f35SJunchao Zhang @*/
45175d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[])
4518d71ae5a4SJacob Faibussowitsch {
4519d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4520d67d9f35SJunchao Zhang 
4521d67d9f35SJunchao Zhang   PetscFunctionBegin;
4522d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
45239566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4524d67d9f35SJunchao Zhang   } else {
4525d67d9f35SJunchao Zhang     *array = aij->a;
4526d67d9f35SJunchao Zhang   }
45279566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
45289566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
45293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4530d67d9f35SJunchao Zhang }
4531d67d9f35SJunchao Zhang 
4532d67d9f35SJunchao Zhang /*@C
4533d67d9f35SJunchao Zhang   MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead
4534d67d9f35SJunchao Zhang 
45350ab4885dSBarry Smith   Not Collective; No Fortran Support
4536d67d9f35SJunchao Zhang 
4537d67d9f35SJunchao Zhang   Input Parameter:
4538fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix
4539d67d9f35SJunchao Zhang 
4540d67d9f35SJunchao Zhang   Output Parameter:
4541d67d9f35SJunchao Zhang . array - pointer to the data
4542d67d9f35SJunchao Zhang 
4543d67d9f35SJunchao Zhang   Level: intermediate
4544d67d9f35SJunchao Zhang 
45451cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
4546d67d9f35SJunchao Zhang @*/
45475d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[])
4548d71ae5a4SJacob Faibussowitsch {
4549d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4550d67d9f35SJunchao Zhang 
4551d67d9f35SJunchao Zhang   PetscFunctionBegin;
4552d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
45539566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4554d67d9f35SJunchao Zhang   } else {
4555d67d9f35SJunchao Zhang     *array = NULL;
4556d67d9f35SJunchao Zhang   }
45573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45588f1ea47aSStefano Zampini }
45598f1ea47aSStefano Zampini 
45608f1ea47aSStefano Zampini /*@C
456111a5261eSBarry Smith   MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
45627ee59b9bSJunchao Zhang 
45630ab4885dSBarry Smith   Not Collective; No Fortran Support
45647ee59b9bSJunchao Zhang 
45657ee59b9bSJunchao Zhang   Input Parameter:
456611a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses
45677ee59b9bSJunchao Zhang 
45687ee59b9bSJunchao Zhang   Output Parameters:
45697ee59b9bSJunchao Zhang + i     - row map array of the matrix
45707ee59b9bSJunchao Zhang . j     - column index array of the matrix
45717ee59b9bSJunchao Zhang . a     - data array of the matrix
4572fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays
45737ee59b9bSJunchao Zhang 
4574fe59aa6dSJacob Faibussowitsch   Level: developer
45752ef1f0ffSBarry Smith 
45767ee59b9bSJunchao Zhang   Notes:
45772ef1f0ffSBarry Smith   Any of the output parameters can be `NULL`, in which case the corresponding value is not returned.
45787ee59b9bSJunchao Zhang   If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
45797ee59b9bSJunchao Zhang 
45807ee59b9bSJunchao Zhang   One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
45812ef1f0ffSBarry Smith   If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix.
45827ee59b9bSJunchao Zhang 
45831cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45847ee59b9bSJunchao Zhang @*/
45855d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype)
4586d71ae5a4SJacob Faibussowitsch {
45877ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
45887ee59b9bSJunchao Zhang 
45897ee59b9bSJunchao Zhang   PetscFunctionBegin;
45907ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
45917ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
45927ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
45937ee59b9bSJunchao Zhang   } else {
45947ee59b9bSJunchao Zhang     if (i) *i = aij->i;
45957ee59b9bSJunchao Zhang     if (j) *j = aij->j;
45967ee59b9bSJunchao Zhang     if (a) *a = aij->a;
45977ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
45987ee59b9bSJunchao Zhang   }
45993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
46007ee59b9bSJunchao Zhang }
46017ee59b9bSJunchao Zhang 
4602cc4c1da9SBarry Smith /*@
460321e72a00SBarry Smith   MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
460421e72a00SBarry Smith 
460521e72a00SBarry Smith   Not Collective
460621e72a00SBarry Smith 
460721e72a00SBarry Smith   Input Parameter:
4608fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
460921e72a00SBarry Smith 
461021e72a00SBarry Smith   Output Parameter:
461121e72a00SBarry Smith . nz - the maximum number of nonzeros in any row
461221e72a00SBarry Smith 
461321e72a00SBarry Smith   Level: intermediate
461421e72a00SBarry Smith 
46151cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
461621e72a00SBarry Smith @*/
4617d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4618d71ae5a4SJacob Faibussowitsch {
461921e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
462021e72a00SBarry Smith 
462121e72a00SBarry Smith   PetscFunctionBegin;
462221e72a00SBarry Smith   *nz = aij->rmax;
46233ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
462421e72a00SBarry Smith }
462521e72a00SBarry Smith 
46262c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data)
46272c4ab24aSJunchao Zhang {
46282c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data;
46294d86920dSPierre Jolivet 
46302c4ab24aSJunchao Zhang   PetscFunctionBegin;
46312c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->perm));
46322c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->jmap));
46332c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo));
46342c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
46352c4ab24aSJunchao Zhang }
46362c4ab24aSJunchao Zhang 
4637d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4638d71ae5a4SJacob Faibussowitsch {
4639394ed5ebSJunchao Zhang   MPI_Comm             comm;
4640394ed5ebSJunchao Zhang   PetscInt            *i, *j;
46410d88f7f4SJunchao Zhang   PetscInt             M, N, row, iprev;
4642394ed5ebSJunchao Zhang   PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4643394ed5ebSJunchao Zhang   PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
4644394ed5ebSJunchao Zhang   PetscInt            *Aj;
4645394ed5ebSJunchao Zhang   PetscScalar         *Aa;
4646f4f49eeaSPierre Jolivet   Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)mat->data;
4647cbc6b225SStefano Zampini   MatType              rtype;
4648394ed5ebSJunchao Zhang   PetscCount          *perm, *jmap;
46492c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
46500d88f7f4SJunchao Zhang   PetscBool            isorted;
46519f0612e4SBarry Smith   PetscBool            hypre;
46529f0612e4SBarry Smith   const char          *name;
4653394ed5ebSJunchao Zhang 
4654394ed5ebSJunchao Zhang   PetscFunctionBegin;
46559566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
46569566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4657e8729f6fSJunchao Zhang   i = coo_i;
4658e8729f6fSJunchao Zhang   j = coo_j;
46599566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
46600d88f7f4SJunchao Zhang 
46610d88f7f4SJunchao Zhang   /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */
46620d88f7f4SJunchao Zhang   isorted = PETSC_TRUE;
46630d88f7f4SJunchao Zhang   iprev   = PETSC_INT_MIN;
46640d88f7f4SJunchao Zhang   for (k = 0; k < coo_n; k++) {
4665394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
46660d88f7f4SJunchao Zhang     if (isorted) {
46670d88f7f4SJunchao Zhang       if (i[k] < iprev) isorted = PETSC_FALSE;
46680d88f7f4SJunchao Zhang       else iprev = i[k];
46690d88f7f4SJunchao Zhang     }
4670394ed5ebSJunchao Zhang     perm[k] = k;
4671394ed5ebSJunchao Zhang   }
4672394ed5ebSJunchao Zhang 
46730d88f7f4SJunchao Zhang   /* Sort by row if not already */
46740d88f7f4SJunchao Zhang   if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
4675651b1cf9SStefano Zampini 
4676651b1cf9SStefano Zampini   /* Advance k to the first row with a non-negative index */
4677651b1cf9SStefano Zampini   for (k = 0; k < coo_n; k++)
46789371c9d4SSatish Balay     if (i[k] >= 0) break;
4679394ed5ebSJunchao Zhang   nneg = k;
46809566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4681394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
468235cb6cd3SPierre Jolivet   jmap++;                                           /* Inc jmap by 1 for convenience */
4683394ed5ebSJunchao Zhang 
46849f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */
46859f0612e4SBarry Smith   PetscCall(PetscArrayzero(Ai, M + 1));
46869f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */
4687394ed5ebSJunchao Zhang 
4688651b1cf9SStefano Zampini   PetscCall(PetscObjectGetName((PetscObject)mat, &name));
4689651b1cf9SStefano Zampini   PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre));
4690651b1cf9SStefano Zampini 
4691394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
469235cb6cd3SPierre Jolivet   Ai++;  /* Inc by 1 for convenience */
4693394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4694394ed5ebSJunchao Zhang   while (k < coo_n) {
46950d88f7f4SJunchao Zhang     PetscBool strictly_sorted; // this row is strictly sorted?
46960d88f7f4SJunchao Zhang     PetscInt  jprev;
46970d88f7f4SJunchao Zhang 
46980d88f7f4SJunchao Zhang     /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */
4699394ed5ebSJunchao Zhang     row             = i[k];
47000d88f7f4SJunchao Zhang     start           = k;
47010d88f7f4SJunchao Zhang     jprev           = PETSC_INT_MIN;
47020d88f7f4SJunchao Zhang     strictly_sorted = PETSC_TRUE;
47030d88f7f4SJunchao Zhang     while (k < coo_n && i[k] == row) {
47040d88f7f4SJunchao Zhang       if (strictly_sorted) {
47050d88f7f4SJunchao Zhang         if (j[k] <= jprev) strictly_sorted = PETSC_FALSE;
47060d88f7f4SJunchao Zhang         else jprev = j[k];
47070d88f7f4SJunchao Zhang       }
47080d88f7f4SJunchao Zhang       k++;
47090d88f7f4SJunchao Zhang     }
4710394ed5ebSJunchao Zhang     end = k;
47110d88f7f4SJunchao Zhang 
4712651b1cf9SStefano Zampini     /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
4713651b1cf9SStefano Zampini     if (hypre) {
47141690c2aeSBarry Smith       PetscInt  minj    = PETSC_INT_MAX;
4715651b1cf9SStefano Zampini       PetscBool hasdiag = PETSC_FALSE;
47160d88f7f4SJunchao Zhang 
47170d88f7f4SJunchao Zhang       if (strictly_sorted) { // fast path to swap the first and the diag
47180d88f7f4SJunchao Zhang         PetscCount tmp;
47190d88f7f4SJunchao Zhang         for (p = start; p < end; p++) {
47200d88f7f4SJunchao Zhang           if (j[p] == row && p != start) {
47210d88f7f4SJunchao Zhang             j[p]        = j[start];
47220d88f7f4SJunchao Zhang             j[start]    = row;
47230d88f7f4SJunchao Zhang             tmp         = perm[start];
47240d88f7f4SJunchao Zhang             perm[start] = perm[p];
47250d88f7f4SJunchao Zhang             perm[p]     = tmp;
47260d88f7f4SJunchao Zhang             break;
47270d88f7f4SJunchao Zhang           }
47280d88f7f4SJunchao Zhang         }
47290d88f7f4SJunchao Zhang       } else {
4730651b1cf9SStefano Zampini         for (p = start; p < end; p++) {
4731651b1cf9SStefano Zampini           hasdiag = (PetscBool)(hasdiag || (j[p] == row));
4732651b1cf9SStefano Zampini           minj    = PetscMin(minj, j[p]);
4733651b1cf9SStefano Zampini         }
47340d88f7f4SJunchao Zhang 
4735651b1cf9SStefano Zampini         if (hasdiag) {
4736651b1cf9SStefano Zampini           for (p = start; p < end; p++) {
4737651b1cf9SStefano Zampini             if (j[p] == minj) j[p] = row;
4738651b1cf9SStefano Zampini             else if (j[p] == row) j[p] = minj;
4739651b1cf9SStefano Zampini           }
4740651b1cf9SStefano Zampini         }
4741651b1cf9SStefano Zampini       }
47420d88f7f4SJunchao Zhang     }
47430d88f7f4SJunchao Zhang     // sort by columns in a row
47440d88f7f4SJunchao Zhang     if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
4745651b1cf9SStefano Zampini 
47460d88f7f4SJunchao Zhang     if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q
47470d88f7f4SJunchao Zhang       for (p = start; p < end; p++, q++) {
47480d88f7f4SJunchao Zhang         Aj[q]   = j[p];
47490d88f7f4SJunchao Zhang         jmap[q] = 1;
47500d88f7f4SJunchao Zhang       }
47516497c311SBarry Smith       PetscCall(PetscIntCast(end - start, Ai + row));
47520d88f7f4SJunchao Zhang       nnz += Ai[row]; // q is already advanced
47530d88f7f4SJunchao Zhang     } else {
4754394ed5ebSJunchao Zhang       /* Find number of unique col entries in this row */
4755394ed5ebSJunchao Zhang       Aj[q]   = j[start]; /* Log the first nonzero in this row */
4756651b1cf9SStefano Zampini       jmap[q] = 1;        /* Number of repeats of this nonzero entry */
4757394ed5ebSJunchao Zhang       Ai[row] = 1;
4758394ed5ebSJunchao Zhang       nnz++;
4759394ed5ebSJunchao Zhang 
4760394ed5ebSJunchao Zhang       for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4761394ed5ebSJunchao Zhang         if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4762394ed5ebSJunchao Zhang           q++;
4763394ed5ebSJunchao Zhang           jmap[q] = 1;
4764394ed5ebSJunchao Zhang           Aj[q]   = j[p];
4765394ed5ebSJunchao Zhang           Ai[row]++;
4766394ed5ebSJunchao Zhang           nnz++;
4767394ed5ebSJunchao Zhang         } else {
4768394ed5ebSJunchao Zhang           jmap[q]++;
4769394ed5ebSJunchao Zhang         }
4770394ed5ebSJunchao Zhang       }
4771394ed5ebSJunchao Zhang       q++; /* Move to next row and thus next unique nonzero */
4772394ed5ebSJunchao Zhang     }
47730d88f7f4SJunchao Zhang   }
47740d88f7f4SJunchao Zhang 
4775394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4776394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
47770d88f7f4SJunchao Zhang   jmap--; // Back to the beginning of jmap[]
4778394ed5ebSJunchao Zhang   jmap[0] = 0;
4779394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
47800d88f7f4SJunchao Zhang 
47819f0612e4SBarry Smith   if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */
4782394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4783394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4784394ed5ebSJunchao Zhang 
47859566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
47869566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
47879566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4788394ed5ebSJunchao Zhang     jmap = jmap_new;
4789394ed5ebSJunchao Zhang 
47909f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new));
47919566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
47929f0612e4SBarry Smith     PetscCall(PetscShmgetDeallocateArray((void **)&Aj));
4793394ed5ebSJunchao Zhang     Aj = Aj_new;
4794394ed5ebSJunchao Zhang   }
4795394ed5ebSJunchao Zhang 
4796394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4797394ed5ebSJunchao Zhang     PetscCount *perm_new;
4798cbc6b225SStefano Zampini 
47999566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
48009566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
48019566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4802394ed5ebSJunchao Zhang     perm = perm_new;
4803394ed5ebSJunchao Zhang   }
4804394ed5ebSJunchao Zhang 
48059566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
48069f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa));
48079f0612e4SBarry Smith   PetscCall(PetscArrayzero(Aa, nnz));
48089566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4809394ed5ebSJunchao Zhang 
4810394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
48112c4ab24aSJunchao Zhang 
48122c4ab24aSJunchao Zhang   // Put the COO struct in a container and then attach that to the matrix
48132c4ab24aSJunchao Zhang   PetscCall(PetscMalloc1(1, &coo));
48146497c311SBarry Smith   PetscCall(PetscIntCast(nnz, &coo->nz));
48152c4ab24aSJunchao Zhang   coo->n    = coo_n;
48162c4ab24aSJunchao Zhang   coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
48172c4ab24aSJunchao Zhang   coo->jmap = jmap;         // of length nnz+1
48182c4ab24aSJunchao Zhang   coo->perm = perm;
481903e76207SPierre Jolivet   PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ));
48203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4821394ed5ebSJunchao Zhang }
4822394ed5ebSJunchao Zhang 
4823d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4824d71ae5a4SJacob Faibussowitsch {
4825394ed5ebSJunchao Zhang   Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
4826394ed5ebSJunchao Zhang   PetscCount           i, j, Annz = aseq->nz;
48272c4ab24aSJunchao Zhang   PetscCount          *perm, *jmap;
4828394ed5ebSJunchao Zhang   PetscScalar         *Aa;
48292c4ab24aSJunchao Zhang   PetscContainer       container;
48302c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4831394ed5ebSJunchao Zhang 
4832394ed5ebSJunchao Zhang   PetscFunctionBegin;
48332c4ab24aSJunchao Zhang   PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
48342c4ab24aSJunchao Zhang   PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
48352c4ab24aSJunchao Zhang   PetscCall(PetscContainerGetPointer(container, (void **)&coo));
48362c4ab24aSJunchao Zhang   perm = coo->perm;
48372c4ab24aSJunchao Zhang   jmap = coo->jmap;
48389566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4839394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4840b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4841b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4842b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4843394ed5ebSJunchao Zhang   }
48449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
48453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4846394ed5ebSJunchao Zhang }
4847394ed5ebSJunchao Zhang 
/* Prototypes of the optional device-backend converters; each is declared only when the corresponding backend is configured */
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_HIP)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *);
#endif
485702fe1965SBarry Smith 
4858d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4859d71ae5a4SJacob Faibussowitsch {
4860273d9f13SBarry Smith   Mat_SeqAIJ *b;
486138baddfdSBarry Smith   PetscMPIInt size;
4862273d9f13SBarry Smith 
4863273d9f13SBarry Smith   PetscFunctionBegin;
48649566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
486508401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4866273d9f13SBarry Smith 
48674dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
48682205254eSKarl Rupp 
4869b0a32e0cSBarry Smith   B->data   = (void *)b;
4870aea10558SJacob Faibussowitsch   B->ops[0] = MatOps_Values;
4871071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
48722205254eSKarl Rupp 
4873f4259b30SLisandro Dalcin   b->row                = NULL;
4874f4259b30SLisandro Dalcin   b->col                = NULL;
4875f4259b30SLisandro Dalcin   b->icol               = NULL;
4876b810aeb4SBarry Smith   b->reallocs           = 0;
487736db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4878f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4879416022c9SBarry Smith   b->nonew              = 0;
4880f4259b30SLisandro Dalcin   b->diag               = NULL;
4881f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4882f4259b30SLisandro Dalcin   B->spptr              = NULL;
4883f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4884f4259b30SLisandro Dalcin   b->idiag              = NULL;
4885f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4886f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
488771f1c65dSBarry Smith   b->omega              = 1.0;
488871f1c65dSBarry Smith   b->fshift             = 0.0;
488971f1c65dSBarry Smith   b->idiagvalid         = PETSC_FALSE;
4890bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4891a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
489217ab2063SBarry Smith 
48939566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4894d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
48959566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
48969566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4897b3866ffcSBarry Smith #endif
48989566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
48999566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
49009566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
49019566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
49029566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
49039566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
49049566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
49059779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
49069566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4907191b95cbSRichard Tran Mills #endif
490834b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
49099566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
49109566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49119566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
491202fe1965SBarry Smith #endif
4913d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4914d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
4915d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
4916d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
4917d5e393b6SSuyash Tandon #endif
49183d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
49199566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
49203d0639e7SStefano Zampini #endif
49219566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4922af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
49239566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4924af8000cdSHong Zhang #endif
4925d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
49269566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4927d24d4204SJose E. Roman #endif
492863c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
49299566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
49309566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
493163c07aadSStefano Zampini #endif
49329566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
49339566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
49349566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
49359566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
493614e4dea2SJose E. Roman   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ));
49379566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
49389566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
49399566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
49409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
49419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
49429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
49439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
49459566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
49469566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
49479566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
49489566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
49499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
49503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
495117ab2063SBarry Smith }
495217ab2063SBarry Smith 
4953b24902e0SBarry Smith /*
49543893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4955b24902e0SBarry Smith */
4956d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4957d71ae5a4SJacob Faibussowitsch {
49582a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4959071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
496017ab2063SBarry Smith 
49613a40ed3dSBarry Smith   PetscFunctionBegin;
4962aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4963273d9f13SBarry Smith 
4964d5f3da31SBarry Smith   C->factortype    = A->factortype;
4965f4259b30SLisandro Dalcin   c->row           = NULL;
4966f4259b30SLisandro Dalcin   c->col           = NULL;
4967f4259b30SLisandro Dalcin   c->icol          = NULL;
49686ad4291fSHong Zhang   c->reallocs      = 0;
4969bc43efbbSJunchao Zhang   c->diagonaldense = a->diagonaldense;
497017ab2063SBarry Smith 
497169272f91SPierre Jolivet   C->assembled = A->assembled;
497217ab2063SBarry Smith 
497369272f91SPierre Jolivet   if (A->preallocated) {
49749566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
49759566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4976eec197d1SBarry Smith 
497731fe6a7dSBarry Smith     if (!A->hash_active) {
49789566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->imax));
49799566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
49809566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->ilen));
49819566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));
498217ab2063SBarry Smith 
498317ab2063SBarry Smith       /* allocate the matrix space */
4984f77e22a1SHong Zhang       if (mallocmatspace) {
49859f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a));
49869f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j));
49879f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i));
49889566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->i, a->i, m + 1));
49899f0612e4SBarry Smith         c->free_a  = PETSC_TRUE;
49909f0612e4SBarry Smith         c->free_ij = PETSC_TRUE;
499117ab2063SBarry Smith         if (m > 0) {
49929566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
4993be6bf707SBarry Smith           if (cpvalues == MAT_COPY_VALUES) {
49942e5835c6SStefano Zampini             const PetscScalar *aa;
49952e5835c6SStefano Zampini 
49969566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
49979566063dSJacob Faibussowitsch             PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
49989566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
4999be6bf707SBarry Smith           } else {
50009566063dSJacob Faibussowitsch             PetscCall(PetscArrayzero(c->a, a->i[m]));
500117ab2063SBarry Smith           }
500208480c60SBarry Smith         }
5003f77e22a1SHong Zhang       }
500431fe6a7dSBarry Smith       C->preallocated = PETSC_TRUE;
500531fe6a7dSBarry Smith     } else {
500631fe6a7dSBarry Smith       PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix");
500731fe6a7dSBarry Smith       PetscCall(MatSetUp(C));
500831fe6a7dSBarry Smith     }
500917ab2063SBarry Smith 
50106ad4291fSHong Zhang     c->ignorezeroentries = a->ignorezeroentries;
5011416022c9SBarry Smith     c->roworiented       = a->roworiented;
5012416022c9SBarry Smith     c->nonew             = a->nonew;
5013416022c9SBarry Smith     if (a->diag) {
50149566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &c->diag));
50159566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt)));
5016071fcb05SBarry Smith     } else c->diag = NULL;
50172205254eSKarl Rupp 
5018f4259b30SLisandro Dalcin     c->solve_work         = NULL;
5019f4259b30SLisandro Dalcin     c->saved_values       = NULL;
5020f4259b30SLisandro Dalcin     c->idiag              = NULL;
5021f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
5022a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
50236ad4291fSHong Zhang 
5024893ad86cSHong Zhang     c->rmax  = a->rmax;
5025416022c9SBarry Smith     c->nz    = a->nz;
50268ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
5027754ec7b1SSatish Balay 
50286ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
50296ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
5030cd6b891eSBarry Smith     if (a->compressedrow.use) {
50316ad4291fSHong Zhang       i = a->compressedrow.nrows;
50329566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
50339566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
50349566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
503527ea64f8SHong Zhang     } else {
503627ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
50370298fd71SBarry Smith       c->compressedrow.i      = NULL;
50380298fd71SBarry Smith       c->compressedrow.rindex = NULL;
50396ad4291fSHong Zhang     }
5040ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
5041e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
50424846f1f5SKris Buschelman 
50439566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
504469272f91SPierre Jolivet   }
50459566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
50463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
504717ab2063SBarry Smith }
504817ab2063SBarry Smith 
5049d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
5050d71ae5a4SJacob Faibussowitsch {
5051b24902e0SBarry Smith   PetscFunctionBegin;
50529566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
50539566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
505448a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
50559566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
50569566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
50573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5058b24902e0SBarry Smith }
5059b24902e0SBarry Smith 
5060d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
5061d71ae5a4SJacob Faibussowitsch {
506252f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
506352f91c60SVaclav Hapla 
506452f91c60SVaclav Hapla   PetscFunctionBegin;
506552f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
506652f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
5067c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
50689566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
50699566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
50709566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
507152f91c60SVaclav Hapla   if (isbinary) {
50729566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
507352f91c60SVaclav Hapla   } else if (ishdf5) {
507452f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
50759566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
507652f91c60SVaclav Hapla #else
507752f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
507852f91c60SVaclav Hapla #endif
507952f91c60SVaclav Hapla   } else {
508098921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
508152f91c60SVaclav Hapla   }
50823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
508352f91c60SVaclav Hapla }
508452f91c60SVaclav Hapla 
5085d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
5086d71ae5a4SJacob Faibussowitsch {
50873ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
50883ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
5089fbdbba38SShri Abhyankar 
5090fbdbba38SShri Abhyankar   PetscFunctionBegin;
50919566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
5092bbead8a2SBarry Smith 
50933ea6fe3dSLisandro Dalcin   /* read in matrix header */
50949566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
509508401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
50969371c9d4SSatish Balay   M  = header[1];
50979371c9d4SSatish Balay   N  = header[2];
50989371c9d4SSatish Balay   nz = header[3];
509908401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
510008401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
510108401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
5102fbdbba38SShri Abhyankar 
51033ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
51049566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
51053ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
51063ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
51073ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
51083ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
51093ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
51109566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
51119566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
51123ea6fe3dSLisandro Dalcin 
51133ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
51149566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5115aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51163ea6fe3dSLisandro Dalcin 
5117fbdbba38SShri Abhyankar   /* read in row lengths */
51189566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
51199566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
51203ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
51219371c9d4SSatish Balay   sum = 0;
51229371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
512308401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
51243ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
51259566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
51269566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5127aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51283ea6fe3dSLisandro Dalcin   /* store row lengths */
51299566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
51309566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
5131fbdbba38SShri Abhyankar 
51323ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
51339371c9d4SSatish Balay   a->i[0] = 0;
51349371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
51353ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
51369566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
51373ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
51389566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
5139fbdbba38SShri Abhyankar 
51409566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
51419566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
51423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5143fbdbba38SShri Abhyankar }
5144fbdbba38SShri Abhyankar 
5145d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
5146d71ae5a4SJacob Faibussowitsch {
51477264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
5148fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
5149eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5150eeffb40dSHong Zhang   PetscInt k;
5151eeffb40dSHong Zhang #endif
51527264ac53SSatish Balay 
51533a40ed3dSBarry Smith   PetscFunctionBegin;
5154bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
5155d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
5156ca44d042SBarry Smith     *flg = PETSC_FALSE;
51573ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
5158bcd2baecSBarry Smith   }
51597264ac53SSatish Balay 
51607264ac53SSatish Balay   /* if the a->i are the same */
51619566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
51623ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
51637264ac53SSatish Balay 
51647264ac53SSatish Balay   /* if a->j are the same */
51659566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
51663ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
5167bcd2baecSBarry Smith 
51689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
51699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5170bcd2baecSBarry Smith   /* if a->a are the same */
5171eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5172eeffb40dSHong Zhang   for (k = 0; k < a->nz; k++) {
5173fff043a9SJunchao Zhang     if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) {
5174eeffb40dSHong Zhang       *flg = PETSC_FALSE;
51753ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
5176eeffb40dSHong Zhang     }
5177eeffb40dSHong Zhang   }
5178eeffb40dSHong Zhang #else
51799566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
5180eeffb40dSHong Zhang #endif
51819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
51829566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
51833ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51847264ac53SSatish Balay }
518536db0b34SBarry Smith 
518605869f15SSatish Balay /*@
518711a5261eSBarry Smith   MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
518836db0b34SBarry Smith   provided by the user.
518936db0b34SBarry Smith 
5190d083f849SBarry Smith   Collective
519136db0b34SBarry Smith 
519236db0b34SBarry Smith   Input Parameters:
519336db0b34SBarry Smith + comm - must be an MPI communicator of size 1
519436db0b34SBarry Smith . m    - number of rows
519536db0b34SBarry Smith . n    - number of columns
5196483a2f95SBarry Smith . i    - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
519736db0b34SBarry Smith . j    - column indices
519836db0b34SBarry Smith - a    - matrix values
519936db0b34SBarry Smith 
520036db0b34SBarry Smith   Output Parameter:
520136db0b34SBarry Smith . mat - the matrix
520236db0b34SBarry Smith 
520336db0b34SBarry Smith   Level: intermediate
520436db0b34SBarry Smith 
520536db0b34SBarry Smith   Notes:
52062ef1f0ffSBarry Smith   The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
5207292fb18eSBarry Smith   once the matrix is destroyed and not before
520836db0b34SBarry Smith 
520936db0b34SBarry Smith   You cannot set new nonzero locations into this matrix, that will generate an error.
521036db0b34SBarry Smith 
52112ef1f0ffSBarry Smith   The `i` and `j` indices are 0 based
521236db0b34SBarry Smith 
5213a4552177SSatish Balay   The format which is used for the sparse matrix input, is equivalent to a
5214a4552177SSatish Balay   row-major ordering.. i.e for the following matrix, the input data expected is
52158eef79e4SBarry Smith   as shown
52162ef1f0ffSBarry Smith .vb
52172ef1f0ffSBarry Smith         1 0 0
52182ef1f0ffSBarry Smith         2 0 3
52192ef1f0ffSBarry Smith         4 5 6
5220a4552177SSatish Balay 
52212ef1f0ffSBarry Smith         i =  {0,1,3,6}  [size = nrow+1  = 3+1]
52222ef1f0ffSBarry Smith         j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
52232ef1f0ffSBarry Smith         v =  {1,2,3,4,5,6}  [size = 6]
52242ef1f0ffSBarry Smith .ve
5225a4552177SSatish Balay 
52261cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
522736db0b34SBarry Smith @*/
5228d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5229d71ae5a4SJacob Faibussowitsch {
5230cbcfb4deSHong Zhang   PetscInt    ii;
523136db0b34SBarry Smith   Mat_SeqAIJ *aij;
5232cbcfb4deSHong Zhang   PetscInt    jj;
523336db0b34SBarry Smith 
523436db0b34SBarry Smith   PetscFunctionBegin;
5235aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
52369566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52379566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52389566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
52399566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52409566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5241ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
52429566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
52439566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5244ab93d7beSBarry Smith 
524536db0b34SBarry Smith   aij->i       = i;
524636db0b34SBarry Smith   aij->j       = j;
524736db0b34SBarry Smith   aij->a       = a;
524836db0b34SBarry Smith   aij->nonew   = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5249e6b907acSBarry Smith   aij->free_a  = PETSC_FALSE;
5250e6b907acSBarry Smith   aij->free_ij = PETSC_FALSE;
525136db0b34SBarry Smith 
5252cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
525336db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
525476bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5255aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
52569985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
525708401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
525808401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
52599985e31cSBarry Smith       }
526036db0b34SBarry Smith     }
526176bd3646SJed Brown   }
526276bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
526336db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
526408401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5265da0802e2SStefano Zampini       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1);
526636db0b34SBarry Smith     }
526776bd3646SJed Brown   }
526836db0b34SBarry Smith 
52699566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52709566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
527236db0b34SBarry Smith }
5273cbc6b225SStefano Zampini 
5274f62e3866SBarry Smith /*@
527511a5261eSBarry Smith   MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
52768a0b0e6bSVictor Minden   provided by the user.
52778a0b0e6bSVictor Minden 
5278d083f849SBarry Smith   Collective
52798a0b0e6bSVictor Minden 
52808a0b0e6bSVictor Minden   Input Parameters:
52818a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1
52828a0b0e6bSVictor Minden . m    - number of rows
52838a0b0e6bSVictor Minden . n    - number of columns
52848a0b0e6bSVictor Minden . i    - row indices
52858a0b0e6bSVictor Minden . j    - column indices
52861230e6d1SVictor Minden . a    - matrix values
52871230e6d1SVictor Minden . nz   - number of nonzeros
52882ef1f0ffSBarry Smith - idx  - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
52898a0b0e6bSVictor Minden 
52908a0b0e6bSVictor Minden   Output Parameter:
52918a0b0e6bSVictor Minden . mat - the matrix
52928a0b0e6bSVictor Minden 
52938a0b0e6bSVictor Minden   Level: intermediate
52948a0b0e6bSVictor Minden 
5295f62e3866SBarry Smith   Example:
5296f62e3866SBarry Smith   For the following matrix, the input data expected is as shown (using 0 based indexing)
52979e99939fSJunchao Zhang .vb
52988a0b0e6bSVictor Minden         1 0 0
52998a0b0e6bSVictor Minden         2 0 3
53008a0b0e6bSVictor Minden         4 5 6
53018a0b0e6bSVictor Minden 
53028a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
53038a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
53048a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
53059e99939fSJunchao Zhang .ve
5306fe59aa6dSJacob Faibussowitsch 
53072ef1f0ffSBarry Smith   Note:
5308d7547e51SJunchao Zhang   Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5309d7547e51SJunchao Zhang   and are particularly useful in iterative applications.
53108a0b0e6bSVictor Minden 
53111cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
53128a0b0e6bSVictor Minden @*/
5313d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx)
5314d71ae5a4SJacob Faibussowitsch {
5315d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
53168a0b0e6bSVictor Minden 
53178a0b0e6bSVictor Minden   PetscFunctionBegin;
53189566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5319ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
53209566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
53219566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
53229566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
53239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
53241230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
53251230e6d1SVictor Minden     if (idx) {
53261230e6d1SVictor Minden       row = i[ii] - 1;
53271230e6d1SVictor Minden       col = j[ii] - 1;
53281230e6d1SVictor Minden     } else {
53291230e6d1SVictor Minden       row = i[ii];
53301230e6d1SVictor Minden       col = j[ii];
53318a0b0e6bSVictor Minden     }
53329566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
53338a0b0e6bSVictor Minden   }
53349566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
53359566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
53369566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
53373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53388a0b0e6bSVictor Minden }
533936db0b34SBarry Smith 
5340d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A)
5341d71ae5a4SJacob Faibussowitsch {
5342acf2f550SJed Brown   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
5343acf2f550SJed Brown 
5344acf2f550SJed Brown   PetscFunctionBegin;
5345acf2f550SJed Brown   a->idiagvalid  = PETSC_FALSE;
5346acf2f550SJed Brown   a->ibdiagvalid = PETSC_FALSE;
53472205254eSKarl Rupp 
53489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A));
53493ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5350acf2f550SJed Brown }
5351acf2f550SJed Brown 
5352d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
5353d71ae5a4SJacob Faibussowitsch {
53549c8f2541SHong Zhang   PetscFunctionBegin;
53559566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
53563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53579c8f2541SHong Zhang }
53589c8f2541SHong Zhang 
535981824310SBarry Smith /*
536053dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
536153dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
536253dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
536353dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
536453dd7562SDmitry Karpeev  */
5365d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5366d71ae5a4SJacob Faibussowitsch {
536753dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
536853dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
536953dd7562SDmitry Karpeev   PetscBool       seqaij;
537053dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
537153dd7562SDmitry Karpeev   PetscScalar     v;
537253dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
537353dd7562SDmitry Karpeev 
537453dd7562SDmitry Karpeev   PetscFunctionBegin;
53753ba16761SJacob Faibussowitsch   if (!B) PetscFunctionReturn(PETSC_SUCCESS);
537653dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
53779566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
537828b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
537953dd7562SDmitry Karpeev   if (rowemb) {
53809566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
538108401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
538253dd7562SDmitry Karpeev   } else {
538308401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
538453dd7562SDmitry Karpeev   }
538553dd7562SDmitry Karpeev   if (colemb) {
53869566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
538708401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
538853dd7562SDmitry Karpeev   } else {
538908401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
539053dd7562SDmitry Karpeev   }
539153dd7562SDmitry Karpeev 
5392f4f49eeaSPierre Jolivet   Baij = (Mat_SeqAIJ *)B->data;
539353dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
53949566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5395ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
53969566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
53979566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
539853dd7562SDmitry Karpeev   }
539948a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
540053dd7562SDmitry Karpeev   count      = 0;
540153dd7562SDmitry Karpeev   rowindices = NULL;
540253dd7562SDmitry Karpeev   colindices = NULL;
540348a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
540448a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
540553dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
540653dd7562SDmitry Karpeev     PetscInt row;
540753dd7562SDmitry Karpeev     row = i;
540853dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
540953dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
541053dd7562SDmitry Karpeev       PetscInt col;
541153dd7562SDmitry Karpeev       col = Baij->j[count];
541253dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
541353dd7562SDmitry Karpeev       v = Baij->a[count];
54149566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
541553dd7562SDmitry Karpeev       ++count;
541653dd7562SDmitry Karpeev     }
541753dd7562SDmitry Karpeev   }
541853dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
541953dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
542053dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
542153dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
542253dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
54233ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
542453dd7562SDmitry Karpeev }
542553dd7562SDmitry Karpeev 
542658c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep)
5427dec0b466SHong Zhang {
5428dec0b466SHong Zhang   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
5429dec0b466SHong Zhang   MatScalar  *aa = a->a;
5430dec0b466SHong Zhang   PetscInt    m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k;
5431dec0b466SHong Zhang   PetscInt   *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0;
5432dec0b466SHong Zhang 
5433dec0b466SHong Zhang   PetscFunctionBegin;
5434dec0b466SHong Zhang   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix");
5435dec0b466SHong Zhang   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
5436dec0b466SHong Zhang   for (i = 1; i <= m; i++) {
5437dec0b466SHong Zhang     /* move each nonzero entry back by the amount of zero slots (fshift) before it*/
5438dec0b466SHong Zhang     for (k = ai[i - 1]; k < ai[i]; k++) {
543958c11ad4SPierre Jolivet       if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++;
5440dec0b466SHong Zhang       else {
5441dec0b466SHong Zhang         if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1));
5442dec0b466SHong Zhang         aa[k - fshift] = aa[k];
5443dec0b466SHong Zhang         aj[k - fshift] = aj[k];
5444dec0b466SHong Zhang       }
5445dec0b466SHong Zhang     }
5446dec0b466SHong Zhang     ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration
5447dec0b466SHong Zhang     fshift_prev = fshift;
5448dec0b466SHong Zhang     /* reset ilen and imax for each row */
5449dec0b466SHong Zhang     ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1];
5450dec0b466SHong Zhang     a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0);
5451dec0b466SHong Zhang     rmax = PetscMax(rmax, ailen[i - 1]);
5452dec0b466SHong Zhang   }
5453312eded4SPierre Jolivet   if (fshift) {
5454dec0b466SHong Zhang     if (m) {
5455dec0b466SHong Zhang       ai[m] -= fshift;
5456dec0b466SHong Zhang       a->nz = ai[m];
5457dec0b466SHong Zhang     }
5458dec0b466SHong Zhang     PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz));
5459312eded4SPierre Jolivet     A->nonzerostate++;
5460dec0b466SHong Zhang     A->info.nz_unneeded += (PetscReal)fshift;
5461dec0b466SHong Zhang     a->rmax = rmax;
5462dec0b466SHong Zhang     if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A));
5463dec0b466SHong Zhang     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
5464dec0b466SHong Zhang     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
5465312eded4SPierre Jolivet   }
54663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5467dec0b466SHong Zhang }
5468dec0b466SHong Zhang 
54694099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
54704099cc6bSBarry Smith 
5471cc4c1da9SBarry Smith /*@
547211a5261eSBarry Smith   MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
54734099cc6bSBarry Smith 
5474c3339decSBarry Smith   Collective
54754099cc6bSBarry Smith 
54764099cc6bSBarry Smith   Input Parameters:
54774099cc6bSBarry Smith + mat    - the matrix object
54784099cc6bSBarry Smith - matype - matrix type
54794099cc6bSBarry Smith 
54804099cc6bSBarry Smith   Options Database Key:
54814e187271SRichard Tran Mills . -mat_seqaij_type  <method> - for example seqaijcrl
54824099cc6bSBarry Smith 
54834099cc6bSBarry Smith   Level: intermediate
54844099cc6bSBarry Smith 
5485fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`
54864099cc6bSBarry Smith @*/
5487d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5488d71ae5a4SJacob Faibussowitsch {
54894099cc6bSBarry Smith   PetscBool sametype;
54905f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
54914099cc6bSBarry Smith 
54924099cc6bSBarry Smith   PetscFunctionBegin;
54934099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
54949566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
54953ba16761SJacob Faibussowitsch   if (sametype) PetscFunctionReturn(PETSC_SUCCESS);
54964099cc6bSBarry Smith 
54979566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
54986adde796SStefano Zampini   PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
54999566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
55003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55014099cc6bSBarry Smith }
55024099cc6bSBarry Smith 
55034099cc6bSBarry Smith /*@C
550411a5261eSBarry Smith   MatSeqAIJRegister -  - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices
55054099cc6bSBarry Smith 
5506cc4c1da9SBarry Smith   Not Collective, No Fortran Support
55074099cc6bSBarry Smith 
55084099cc6bSBarry Smith   Input Parameters:
5509fe59aa6dSJacob Faibussowitsch + sname    - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
55104099cc6bSBarry Smith - function - routine to convert to subtype
55114099cc6bSBarry Smith 
55122ef1f0ffSBarry Smith   Level: advanced
55132ef1f0ffSBarry Smith 
55144099cc6bSBarry Smith   Notes:
551511a5261eSBarry Smith   `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers.
55164099cc6bSBarry Smith 
55174099cc6bSBarry Smith   Then, your matrix can be chosen with the procedural interface at runtime via the option
55184099cc6bSBarry Smith $     -mat_seqaij_type my_mat
55194099cc6bSBarry Smith 
55201cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()`
55214099cc6bSBarry Smith @*/
5522d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
5523d71ae5a4SJacob Faibussowitsch {
55244099cc6bSBarry Smith   PetscFunctionBegin;
55259566063dSJacob Faibussowitsch   PetscCall(MatInitializePackage());
55269566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
55273ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55284099cc6bSBarry Smith }
55294099cc6bSBarry Smith 
55304099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
55314099cc6bSBarry Smith 
55324099cc6bSBarry Smith /*@C
553311a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
55344099cc6bSBarry Smith 
55354099cc6bSBarry Smith   Not Collective
55364099cc6bSBarry Smith 
55374099cc6bSBarry Smith   Level: advanced
55384099cc6bSBarry Smith 
55392ef1f0ffSBarry Smith   Note:
55402ef1f0ffSBarry Smith   This registers the versions of `MATSEQAIJ` for GPUs
55412ef1f0ffSBarry Smith 
55421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()`
55434099cc6bSBarry Smith @*/
5544d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5545d71ae5a4SJacob Faibussowitsch {
55464099cc6bSBarry Smith   PetscFunctionBegin;
55473ba16761SJacob Faibussowitsch   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS);
55484099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
55494099cc6bSBarry Smith 
55509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
55519566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
55529566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
55539779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
55549566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5555485f9817SRichard Tran Mills #endif
55565063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
55579566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
55585063d097SStefano Zampini #endif
5559d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
5560d5e393b6SSuyash Tandon   PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
5561d5e393b6SSuyash Tandon #endif
55625063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
55639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
55645063d097SStefano Zampini #endif
55654099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
55669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
55674099cc6bSBarry Smith #endif
55683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55694099cc6bSBarry Smith }
557053dd7562SDmitry Karpeev 
557153dd7562SDmitry Karpeev /*
557281824310SBarry Smith     Special version for direct calls from Fortran
557381824310SBarry Smith */
557481824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS)
557581824310SBarry Smith   #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
557681824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
557781824310SBarry Smith   #define matsetvaluesseqaij_ matsetvaluesseqaij
557881824310SBarry Smith #endif
557981824310SBarry Smith 
/* Redefine the following macros so that they can be used in a function returning void */

/* Identical to PetscCallVoid, except it assigns to *_ierr */
55849566063dSJacob Faibussowitsch #undef PetscCall
55859371c9d4SSatish Balay #define PetscCall(...) \
55869371c9d4SSatish Balay   do { \
55875f80ce2aSJacob Faibussowitsch     PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \
558898921bdaSJacob Faibussowitsch     if (PetscUnlikely(ierr_msv_mpiaij)) { \
558998921bdaSJacob Faibussowitsch       *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \
559098921bdaSJacob Faibussowitsch       return; \
559198921bdaSJacob Faibussowitsch     } \
559298921bdaSJacob Faibussowitsch   } while (0)
559398921bdaSJacob Faibussowitsch 
559498921bdaSJacob Faibussowitsch #undef SETERRQ
55959371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \
55969371c9d4SSatish Balay   do { \
559798921bdaSJacob Faibussowitsch     *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
559898921bdaSJacob Faibussowitsch     return; \
559998921bdaSJacob Faibussowitsch   } while (0)
560081824310SBarry Smith 
5601d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5602d71ae5a4SJacob Faibussowitsch {
560381824310SBarry Smith   Mat         A = *AA;
560481824310SBarry Smith   PetscInt    m = *mm, n = *nn;
560581824310SBarry Smith   InsertMode  is = *isis;
560681824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
560781824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
560881824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
560981824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
561054f21887SBarry Smith   MatScalar  *ap, value, *aa;
5611ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5612ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
561381824310SBarry Smith 
561481824310SBarry Smith   PetscFunctionBegin;
56154994cf47SJed Brown   MatCheckPreallocated(A, 1);
561681824310SBarry Smith   imax  = a->imax;
561781824310SBarry Smith   ai    = a->i;
561881824310SBarry Smith   ailen = a->ilen;
561981824310SBarry Smith   aj    = a->j;
562081824310SBarry Smith   aa    = a->a;
562181824310SBarry Smith 
562281824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
562381824310SBarry Smith     row = im[k];
562481824310SBarry Smith     if (row < 0) continue;
56255f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
56269371c9d4SSatish Balay     rp   = aj + ai[row];
56279371c9d4SSatish Balay     ap   = aa + ai[row];
56289371c9d4SSatish Balay     rmax = imax[row];
56299371c9d4SSatish Balay     nrow = ailen[row];
563081824310SBarry Smith     low  = 0;
563181824310SBarry Smith     high = nrow;
563281824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
563381824310SBarry Smith       if (in[l] < 0) continue;
56345f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
563581824310SBarry Smith       col = in[l];
56362205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
56372205254eSKarl Rupp       else value = v[k + l * m];
56382205254eSKarl Rupp 
563981824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
564081824310SBarry Smith 
56412205254eSKarl Rupp       if (col <= lastcol) low = 0;
56422205254eSKarl Rupp       else high = nrow;
564381824310SBarry Smith       lastcol = col;
564481824310SBarry Smith       while (high - low > 5) {
564581824310SBarry Smith         t = (low + high) / 2;
564681824310SBarry Smith         if (rp[t] > col) high = t;
564781824310SBarry Smith         else low = t;
564881824310SBarry Smith       }
564981824310SBarry Smith       for (i = low; i < high; i++) {
565081824310SBarry Smith         if (rp[i] > col) break;
565181824310SBarry Smith         if (rp[i] == col) {
565281824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
565381824310SBarry Smith           else ap[i] = value;
565481824310SBarry Smith           goto noinsert;
565581824310SBarry Smith         }
565681824310SBarry Smith       }
565781824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
565881824310SBarry Smith       if (nonew == 1) goto noinsert;
56595f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5660fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
56619371c9d4SSatish Balay       N = nrow++ - 1;
56629371c9d4SSatish Balay       a->nz++;
56639371c9d4SSatish Balay       high++;
566481824310SBarry Smith       /* shift up all the later entries in this row */
566581824310SBarry Smith       for (ii = N; ii >= i; ii--) {
566681824310SBarry Smith         rp[ii + 1] = rp[ii];
566781824310SBarry Smith         ap[ii + 1] = ap[ii];
566881824310SBarry Smith       }
566981824310SBarry Smith       rp[i] = col;
567081824310SBarry Smith       ap[i] = value;
567181824310SBarry Smith     noinsert:;
567281824310SBarry Smith       low = i + 1;
567381824310SBarry Smith     }
567481824310SBarry Smith     ailen[row] = nrow;
567581824310SBarry Smith   }
567681824310SBarry Smith   PetscFunctionReturnVoid();
567781824310SBarry Smith }
567898921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No
567998921bdaSJacob Faibussowitsch  * other PETSc functions should be defined past this point, as it is impossible to recover the
568098921bdaSJacob Faibussowitsch  * original definitions */
56819566063dSJacob Faibussowitsch #undef PetscCall
568298921bdaSJacob Faibussowitsch #undef SETERRQ
5683