xref: /petsc/src/mat/impls/aij/seq/aij.c (revision b44f4de476a10dd52a698c0f9a8f47d015bd1e19)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
1226cec326SBarry Smith #define TYPE AIJ
1326cec326SBarry Smith #define TYPE_BS
1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
1626cec326SBarry Smith #undef TYPE
1726cec326SBarry Smith #undef TYPE_BS
1826cec326SBarry Smith 
19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
20d71ae5a4SJacob Faibussowitsch {
214099cc6bSBarry Smith   PetscBool flg;
224099cc6bSBarry Smith   char      type[256];
234099cc6bSBarry Smith 
244099cc6bSBarry Smith   PetscFunctionBegin;
25d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
269566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
279566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
28d0609cedSBarry Smith   PetscOptionsEnd();
293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
304099cc6bSBarry Smith }
314099cc6bSBarry Smith 
32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
33d71ae5a4SJacob Faibussowitsch {
340716a85fSBarry Smith   PetscInt    i, m, n;
350716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
360716a85fSBarry Smith 
370716a85fSBarry Smith   PetscFunctionBegin;
389566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
399566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
400716a85fSBarry Smith   if (type == NORM_2) {
41ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
420716a85fSBarry Smith   } else if (type == NORM_1) {
43ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
440716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
45ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
46857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
47ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
48857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
49ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
506adde796SStefano Zampini   } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type");
510716a85fSBarry Smith 
520716a85fSBarry Smith   if (type == NORM_2) {
53a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
54857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
55a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
560716a85fSBarry Smith   }
573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
580716a85fSBarry Smith }
590716a85fSBarry Smith 
60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
61d71ae5a4SJacob Faibussowitsch {
623a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
633a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
643a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
653a062f41SBarry Smith   PetscInt       *rows;
663a062f41SBarry Smith 
673a062f41SBarry Smith   PetscFunctionBegin;
683a062f41SBarry Smith   for (i = 0; i < m; i++) {
69ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
703a062f41SBarry Smith   }
719566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
723a062f41SBarry Smith   cnt = 0;
733a062f41SBarry Smith   for (i = 0; i < m; i++) {
743a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
753a062f41SBarry Smith       rows[cnt] = i;
763a062f41SBarry Smith       cnt++;
773a062f41SBarry Smith     }
783a062f41SBarry Smith   }
799566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
813a062f41SBarry Smith }
823a062f41SBarry Smith 
83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
84d71ae5a4SJacob Faibussowitsch {
856ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
86fff043a9SJunchao Zhang   const MatScalar *aa;
876ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
88b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
896ce1633cSBarry Smith   PetscInt        *rows;
906ce1633cSBarry Smith 
916ce1633cSBarry Smith   PetscFunctionBegin;
929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
939566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
946ce1633cSBarry Smith   diag = a->diag;
956ce1633cSBarry Smith   for (i = 0; i < m; i++) {
96ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
976ce1633cSBarry Smith   }
989566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
996ce1633cSBarry Smith   cnt = 0;
1006ce1633cSBarry Smith   for (i = 0; i < m; i++) {
101ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
1026ce1633cSBarry Smith   }
103f1f41ecbSJed Brown   *nrows = cnt;
104f1f41ecbSJed Brown   *zrows = rows;
1059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
107f1f41ecbSJed Brown }
108f1f41ecbSJed Brown 
109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
110d71ae5a4SJacob Faibussowitsch {
111f1f41ecbSJed Brown   PetscInt nrows, *rows;
112f1f41ecbSJed Brown 
113f1f41ecbSJed Brown   PetscFunctionBegin;
1140298fd71SBarry Smith   *zrows = NULL;
1159566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1169566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1186ce1633cSBarry Smith }
1196ce1633cSBarry Smith 
120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
121d71ae5a4SJacob Faibussowitsch {
122b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
123b3a44c85SBarry Smith   const MatScalar *aa;
124b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
125b3a44c85SBarry Smith   const PetscInt  *ii;
126b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
127b3a44c85SBarry Smith 
128b3a44c85SBarry Smith   PetscFunctionBegin;
1299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
130f4259b30SLisandro Dalcin   *keptrows = NULL;
131b3a44c85SBarry Smith   ii        = a->i;
132b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
133b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
134b3a44c85SBarry Smith     if (!n) {
135b3a44c85SBarry Smith       cnt++;
136b3a44c85SBarry Smith       goto ok1;
137b3a44c85SBarry Smith     }
1382e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
139b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
140b3a44c85SBarry Smith     }
141b3a44c85SBarry Smith     cnt++;
142b3a44c85SBarry Smith   ok1:;
143b3a44c85SBarry Smith   }
1442e5835c6SStefano Zampini   if (!cnt) {
1459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1463ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1472e5835c6SStefano Zampini   }
1489566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
149b3a44c85SBarry Smith   cnt = 0;
150b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
151b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
152b3a44c85SBarry Smith     if (!n) continue;
1532e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
154b3a44c85SBarry Smith       if (aa[j] != 0.0) {
155b3a44c85SBarry Smith         rows[cnt++] = i;
156b3a44c85SBarry Smith         break;
157b3a44c85SBarry Smith       }
158b3a44c85SBarry Smith     }
159b3a44c85SBarry Smith   }
1609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1619566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
1623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
163b3a44c85SBarry Smith }
164b3a44c85SBarry Smith 
165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
166d71ae5a4SJacob Faibussowitsch {
16779299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)Y->data;
16899e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16999e65526SBarry Smith   const PetscInt    *diag;
1702e5835c6SStefano Zampini   MatScalar         *aa;
17199e65526SBarry Smith   const PetscScalar *v;
172ace3abfcSBarry Smith   PetscBool          missing;
17379299369SBarry Smith 
17479299369SBarry Smith   PetscFunctionBegin;
17509f38230SBarry Smith   if (Y->assembled) {
1769566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL));
17709f38230SBarry Smith     if (!missing) {
17879299369SBarry Smith       diag = aij->diag;
1799566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1809566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
18179299369SBarry Smith       if (is == INSERT_VALUES) {
182ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
18379299369SBarry Smith       } else {
184ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
18579299369SBarry Smith       }
1869566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1879566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
1883ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
18979299369SBarry Smith     }
1909566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
19109f38230SBarry Smith   }
1929566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
1933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
19409f38230SBarry Smith }
19579299369SBarry Smith 
196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
197d71ae5a4SJacob Faibussowitsch {
198416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19997f1f81fSBarry Smith   PetscInt    i, ishift;
20017ab2063SBarry Smith 
2013a40ed3dSBarry Smith   PetscFunctionBegin;
202f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
2033ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
204bfeeae90SHong Zhang   ishift = 0;
205b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
2069566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
207bfeeae90SHong Zhang   } else if (oshift == 1) {
2081a83f524SJed Brown     PetscInt *tia;
209d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2103b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2119566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2121a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2131a83f524SJed Brown     *ia = tia;
214ecc77c7aSBarry Smith     if (ja) {
2151a83f524SJed Brown       PetscInt *tja;
2169566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2171a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2181a83f524SJed Brown       *ja = tja;
219ecc77c7aSBarry Smith     }
2206945ee14SBarry Smith   } else {
221ecc77c7aSBarry Smith     *ia = a->i;
222ecc77c7aSBarry Smith     if (ja) *ja = a->j;
223a2ce50c7SBarry Smith   }
2243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225a2744918SBarry Smith }
226a2744918SBarry Smith 
227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
228d71ae5a4SJacob Faibussowitsch {
2293a40ed3dSBarry Smith   PetscFunctionBegin;
2303ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
231b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2329566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2339566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
234bcd2baecSBarry Smith   }
2353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23617ab2063SBarry Smith }
23717ab2063SBarry Smith 
238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
239d71ae5a4SJacob Faibussowitsch {
2403b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
241d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
24297f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2433b2fbd54SBarry Smith 
2443a40ed3dSBarry Smith   PetscFunctionBegin;
245899cda47SBarry Smith   *nn = n;
2463ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2473b2fbd54SBarry Smith   if (symmetric) {
2489566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2493b2fbd54SBarry Smith   } else {
2509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2533b2fbd54SBarry Smith     jj = a->j;
254ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2553b2fbd54SBarry Smith     cia[0] = oshift;
256ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2579566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2583b2fbd54SBarry Smith     jj = a->j;
259a93ec695SBarry Smith     for (row = 0; row < m; row++) {
260a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
261a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
262bfeeae90SHong Zhang         col = *jj++;
2632205254eSKarl Rupp 
2643b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2653b2fbd54SBarry Smith       }
2663b2fbd54SBarry Smith     }
2679566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2689371c9d4SSatish Balay     *ia = cia;
2699371c9d4SSatish Balay     *ja = cja;
2703b2fbd54SBarry Smith   }
2713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2723b2fbd54SBarry Smith }
2733b2fbd54SBarry Smith 
274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
275d71ae5a4SJacob Faibussowitsch {
2763a40ed3dSBarry Smith   PetscFunctionBegin;
2773ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2783b2fbd54SBarry Smith 
2799566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2809566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2823b2fbd54SBarry Smith }
2833b2fbd54SBarry Smith 
2847cee066cSHong Zhang /*
2857cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2867cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
287040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2887cee066cSHong Zhang */
289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
290d71ae5a4SJacob Faibussowitsch {
2917cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2927cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
293071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2947cee066cSHong Zhang   PetscInt       *cspidx;
295071fcb05SBarry Smith   const PetscInt *jj;
2967cee066cSHong Zhang 
2977cee066cSHong Zhang   PetscFunctionBegin;
2987cee066cSHong Zhang   *nn = n;
2993ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
300625f6d37SHong Zhang 
3019566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
3029566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
3039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
3049566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
3057cee066cSHong Zhang   jj = a->j;
306ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
3077cee066cSHong Zhang   cia[0] = oshift;
308ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3099566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3107cee066cSHong Zhang   jj = a->j;
3117cee066cSHong Zhang   for (row = 0; row < m; row++) {
3127cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3137cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3147cee066cSHong Zhang       col         = *jj++;
315071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
316071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
317071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3187cee066cSHong Zhang     }
3197cee066cSHong Zhang   }
3209566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
321071fcb05SBarry Smith   *ia    = cia;
322071fcb05SBarry Smith   *ja    = cja;
3237cee066cSHong Zhang   *spidx = cspidx;
3243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3257cee066cSHong Zhang }
3267cee066cSHong Zhang 
327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
328d71ae5a4SJacob Faibussowitsch {
3297cee066cSHong Zhang   PetscFunctionBegin;
3309566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3319566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3337cee066cSHong Zhang }
3347cee066cSHong Zhang 
335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
336d71ae5a4SJacob Faibussowitsch {
33787d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33887d4246cSBarry Smith   PetscInt    *ai = a->i;
339fff043a9SJunchao Zhang   PetscScalar *aa;
34087d4246cSBarry Smith 
34187d4246cSBarry Smith   PetscFunctionBegin;
3429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3439566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34687d4246cSBarry Smith }
34787d4246cSBarry Smith 
348bd04181cSBarry Smith /*
349bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
350bd04181cSBarry Smith 
351bd04181cSBarry Smith       -   a single row of values is set with each call
352bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
353bd04181cSBarry Smith       -   the values are always added to the matrix, not set
354bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
355bd04181cSBarry Smith 
3561f763a69SBarry Smith      This does NOT assume the global column indices are sorted
357bd04181cSBarry Smith 
3581f763a69SBarry Smith */
359bd04181cSBarry Smith 
360af0996ceSBarry Smith #include <petsc/private/isimpl.h>
361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
362d71ae5a4SJacob Faibussowitsch {
363189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3641f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3651f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3661f763a69SBarry Smith   PetscInt        lastcol = -1;
367fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
368189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
369189e4007SBarry Smith 
370fff043a9SJunchao Zhang   PetscFunctionBegin;
3719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
372f38dd0b8SBarry Smith   row  = ridx[im[0]];
3731f763a69SBarry Smith   rp   = aj + ai[row];
3741f763a69SBarry Smith   ap   = aa + ai[row];
3751f763a69SBarry Smith   nrow = ailen[row];
376189e4007SBarry Smith   low  = 0;
377189e4007SBarry Smith   high = nrow;
378189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
379189e4007SBarry Smith     col   = cidx[in[l]];
380f38dd0b8SBarry Smith     value = v[l];
381189e4007SBarry Smith 
382189e4007SBarry Smith     if (col <= lastcol) low = 0;
383189e4007SBarry Smith     else high = nrow;
384189e4007SBarry Smith     lastcol = col;
385189e4007SBarry Smith     while (high - low > 5) {
386189e4007SBarry Smith       t = (low + high) / 2;
387189e4007SBarry Smith       if (rp[t] > col) high = t;
388189e4007SBarry Smith       else low = t;
389189e4007SBarry Smith     }
390189e4007SBarry Smith     for (i = low; i < high; i++) {
391189e4007SBarry Smith       if (rp[i] == col) {
3921f763a69SBarry Smith         ap[i] += value;
393189e4007SBarry Smith         low = i + 1;
3941f763a69SBarry Smith         break;
395189e4007SBarry Smith       }
396189e4007SBarry Smith     }
397189e4007SBarry Smith   }
3989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3993ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
400189e4007SBarry Smith }
401189e4007SBarry Smith 
/*
  MatSetValues_SeqAIJ - Inserts or adds an m-by-n logically dense block of values into the matrix.

  Input Parameters:
+ A  - the matrix
. m  - number of rows in the block
. im - row indices; negative entries are skipped, entries >= A->rmap->n raise an error
. n  - number of columns in the block
. in - column indices; negative entries are skipped, entries >= A->cmap->n raise an error
. v  - the values (may be NULL, in which case 0.0 is used), read as v[l + k * n] when a->roworiented
       is set and as v[k + l * m] otherwise
- is - ADD_VALUES to accumulate into existing entries, otherwise existing entries are overwritten

  Notes:
  When A->structure_only is set no numerical values are read or written.

  A location that is not yet present in the row is handled according to a->nonew: 1 drops it
  silently, -1 raises an error, any other value proceeds to the reallocation macro and the
  new entry is inserted at its sorted position.
*/
402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
403d71ae5a4SJacob Faibussowitsch {
404416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
405e2ee6c50SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
40697f1f81fSBarry Smith   PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
407e2ee6c50SBarry Smith   PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1;
408ce496241SStefano Zampini   MatScalar  *ap = NULL, value = 0.0, *aa;
409ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
410ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
41117ab2063SBarry Smith 
4123a40ed3dSBarry Smith   PetscFunctionBegin;
4139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
41417ab2063SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
415416022c9SBarry Smith     row = im[k];
4165ef9f2a5SBarry Smith     if (row < 0) continue;
4176bdcaf15SBarry Smith     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
    /* rp/ap point at the start of this row's column indices / values */
4188e3a54c0SPierre Jolivet     rp = PetscSafePointerPlusOffset(aj, ai[row]);
4198e3a54c0SPierre Jolivet     if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]);
    /* rmax: entry from imax[] for this row; nrow: entries currently stored in it */
4209371c9d4SSatish Balay     rmax = imax[row];
4219371c9d4SSatish Balay     nrow = ailen[row];
422416022c9SBarry Smith     low  = 0;
423c71e6ed7SBarry Smith     high = nrow;
42417ab2063SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
4255ef9f2a5SBarry Smith       if (in[l] < 0) continue;
4266bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
427bfeeae90SHong Zhang       col = in[l];
428071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
      /* with ignorezeroentries, off-diagonal zeros being added are skipped entirely */
429071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
43036db0b34SBarry Smith 
      /* keep the lower bound from the previous column when this column is larger, else restart it */
4312205254eSKarl Rupp       if (col <= lastcol) low = 0;
4322205254eSKarl Rupp       else high = nrow;
433e2ee6c50SBarry Smith       lastcol = col;
      /* bisect [low, high) until at most 5 candidates remain, then scan them linearly */
434416022c9SBarry Smith       while (high - low > 5) {
435416022c9SBarry Smith         t = (low + high) / 2;
436416022c9SBarry Smith         if (rp[t] > col) high = t;
437416022c9SBarry Smith         else low = t;
43817ab2063SBarry Smith       }
439416022c9SBarry Smith       for (i = low; i < high; i++) {
        /* first stored column larger than col: i is the insertion position */
44017ab2063SBarry Smith         if (rp[i] > col) break;
44117ab2063SBarry Smith         if (rp[i] == col) {
442876c6284SHong Zhang           if (!A->structure_only) {
4430c0d7e18SFande Kong             if (is == ADD_VALUES) {
4440c0d7e18SFande Kong               ap[i] += value;
4450c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4469371c9d4SSatish Balay             } else ap[i] = value;
447720833daSHong Zhang           }
448e44c0bd4SBarry Smith           low = i + 1;
44917ab2063SBarry Smith           goto noinsert;
45017ab2063SBarry Smith         }
45117ab2063SBarry Smith       }
      /* the location does not exist yet: decide whether a new nonzero may be created */
452dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
453c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
45408401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
      /* NOTE(review): the macros below are defined outside this file section; presumably they grow the
         storage when nrow has reached rmax and refresh the local pointers passed to them - confirm in aij.h */
455720833daSHong Zhang       if (A->structure_only) {
456876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
457720833daSHong Zhang       } else {
458fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
459720833daSHong Zhang       }
      /* N is the index of the last entry stored before the insertion; the row grows by one */
4609371c9d4SSatish Balay       N = nrow++ - 1;
4619371c9d4SSatish Balay       a->nz++;
4629371c9d4SSatish Balay       high++;
463416022c9SBarry Smith       /* shift up all the later entries in this row */
4649566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
46517ab2063SBarry Smith       rp[i] = col;
466580bdb30SBarry Smith       if (!A->structure_only) {
4679566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
468580bdb30SBarry Smith         ap[i] = value;
469580bdb30SBarry Smith       }
470416022c9SBarry Smith       low = i + 1;
471e44c0bd4SBarry Smith     noinsert:;
47217ab2063SBarry Smith     }
    /* publish the updated number of stored entries for this row */
47317ab2063SBarry Smith     ailen[row] = nrow;
47417ab2063SBarry Smith   }
4759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
4763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
47717ab2063SBarry Smith }
47817ab2063SBarry Smith 
479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
480d71ae5a4SJacob Faibussowitsch {
48119b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
48219b08ed1SBarry Smith   PetscInt   *rp, k, row;
48319b08ed1SBarry Smith   PetscInt   *ai = a->i;
48419b08ed1SBarry Smith   PetscInt   *aj = a->j;
485fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
48619b08ed1SBarry Smith 
48719b08ed1SBarry Smith   PetscFunctionBegin;
48828b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
48908401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
490fff043a9SJunchao Zhang 
4919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
49219b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
49319b08ed1SBarry Smith     row = im[k];
49419b08ed1SBarry Smith     rp  = aj + ai[row];
4958e3a54c0SPierre Jolivet     ap  = PetscSafePointerPlusOffset(aa, ai[row]);
49619b08ed1SBarry Smith 
4979566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
49819b08ed1SBarry Smith     if (!A->structure_only) {
49919b08ed1SBarry Smith       if (v) {
5009566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
50119b08ed1SBarry Smith         v += n;
50219b08ed1SBarry Smith       } else {
5039566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
50419b08ed1SBarry Smith       }
50519b08ed1SBarry Smith     }
50619b08ed1SBarry Smith     a->ilen[row]  = n;
50719b08ed1SBarry Smith     a->imax[row]  = n;
50819b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
50919b08ed1SBarry Smith     a->nz += n;
51019b08ed1SBarry Smith   }
5119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51319b08ed1SBarry Smith }
51419b08ed1SBarry Smith 
51519b08ed1SBarry Smith /*@
51619b08ed1SBarry Smith   MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51719b08ed1SBarry Smith 
51819b08ed1SBarry Smith   Input Parameters:
51911a5261eSBarry Smith + A       - the `MATSEQAIJ` matrix
52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros
52119b08ed1SBarry Smith 
52219b08ed1SBarry Smith   Level: advanced
52319b08ed1SBarry Smith 
52419b08ed1SBarry Smith   Notes:
52519b08ed1SBarry Smith   This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
52611a5261eSBarry Smith   Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52719b08ed1SBarry Smith   as always with multiple matrix assemblies.
52819b08ed1SBarry Smith 
5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
53019b08ed1SBarry Smith @*/
531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
532d71ae5a4SJacob Faibussowitsch {
53319b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
53419b08ed1SBarry Smith 
53519b08ed1SBarry Smith   PetscFunctionBegin;
5369566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5379566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
53819b08ed1SBarry Smith   a->maxnz = nztotal;
5394dfa11a4SJacob Faibussowitsch   if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); }
54019b08ed1SBarry Smith   if (!a->ilen) {
5419566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
54219b08ed1SBarry Smith   } else {
5439566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
54419b08ed1SBarry Smith   }
54519b08ed1SBarry Smith 
54619b08ed1SBarry Smith   /* allocate the matrix space */
5479f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i));
5489f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j));
5499f0612e4SBarry Smith   a->free_ij = PETSC_TRUE;
55019b08ed1SBarry Smith   if (A->structure_only) {
55119b08ed1SBarry Smith     a->free_a = PETSC_FALSE;
55219b08ed1SBarry Smith   } else {
5539f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a));
55419b08ed1SBarry Smith     a->free_a = PETSC_TRUE;
55519b08ed1SBarry Smith   }
5569f0612e4SBarry Smith   a->i[0]           = 0;
55719b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
55819b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
5593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
56019b08ed1SBarry Smith }
56119b08ed1SBarry Smith 
562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
563d71ae5a4SJacob Faibussowitsch {
564071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
565071fcb05SBarry Smith   PetscInt   *rp, k, row;
566071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
567071fcb05SBarry Smith   PetscInt   *aj = a->j;
568fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
569071fcb05SBarry Smith 
570071fcb05SBarry Smith   PetscFunctionBegin;
5719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
572071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
573071fcb05SBarry Smith     row = im[k];
5746bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
575071fcb05SBarry Smith     rp = aj + ai[row];
576071fcb05SBarry Smith     ap = aa + ai[row];
57748a46eb9SPierre Jolivet     if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
578071fcb05SBarry Smith     if (!A->structure_only) {
579071fcb05SBarry Smith       if (v) {
5809566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
581071fcb05SBarry Smith         v += n;
582071fcb05SBarry Smith       } else {
5839566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
584071fcb05SBarry Smith       }
585071fcb05SBarry Smith     }
586071fcb05SBarry Smith     ailen[row] = n;
587071fcb05SBarry Smith     a->nz += n;
588071fcb05SBarry Smith   }
5899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
591071fcb05SBarry Smith }
592071fcb05SBarry Smith 
593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
594d71ae5a4SJacob Faibussowitsch {
5957eb43aa7SLois Curfman McInnes   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
59697f1f81fSBarry Smith   PetscInt        *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
59797f1f81fSBarry Smith   PetscInt        *ai = a->i, *ailen = a->ilen;
5984e208921SJed Brown   const MatScalar *ap, *aa;
5997eb43aa7SLois Curfman McInnes 
6003a40ed3dSBarry Smith   PetscFunctionBegin;
6014e208921SJed Brown   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
6027eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6037eb43aa7SLois Curfman McInnes     row = im[k];
6049371c9d4SSatish Balay     if (row < 0) {
6059371c9d4SSatish Balay       v += n;
6069371c9d4SSatish Balay       continue;
6079371c9d4SSatish Balay     } /* negative row */
60854c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6098e3a54c0SPierre Jolivet     rp   = PetscSafePointerPlusOffset(aj, ai[row]);
6108e3a54c0SPierre Jolivet     ap   = PetscSafePointerPlusOffset(aa, ai[row]);
6117eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6127eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6139371c9d4SSatish Balay       if (in[l] < 0) {
6149371c9d4SSatish Balay         v++;
6159371c9d4SSatish Balay         continue;
6169371c9d4SSatish Balay       } /* negative column */
61754c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
618bfeeae90SHong Zhang       col  = in[l];
6199371c9d4SSatish Balay       high = nrow;
6209371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6217eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6227eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6237eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6247eb43aa7SLois Curfman McInnes         else low = t;
6257eb43aa7SLois Curfman McInnes       }
6267eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6277eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6287eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
629b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6307eb43aa7SLois Curfman McInnes           goto finished;
6317eb43aa7SLois Curfman McInnes         }
6327eb43aa7SLois Curfman McInnes       }
63397e567efSBarry Smith       *v++ = 0.0;
6347eb43aa7SLois Curfman McInnes     finished:;
6357eb43aa7SLois Curfman McInnes     }
6367eb43aa7SLois Curfman McInnes   }
6374e208921SJed Brown   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
6383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6397eb43aa7SLois Curfman McInnes }
6407eb43aa7SLois Curfman McInnes 
641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
642d71ae5a4SJacob Faibussowitsch {
6433ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
644c898d852SStefano Zampini   const PetscScalar *av;
6453ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6463ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
64717ab2063SBarry Smith 
6483a40ed3dSBarry Smith   PetscFunctionBegin;
6499566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6502205254eSKarl Rupp 
6513ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6523ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6533ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6543ea6fe3dSLisandro Dalcin   nz = A->nz;
655416022c9SBarry Smith 
6563ea6fe3dSLisandro Dalcin   /* write matrix header */
6573ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6589371c9d4SSatish Balay   header[1] = M;
6599371c9d4SSatish Balay   header[2] = N;
6609371c9d4SSatish Balay   header[3] = nz;
6619566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
662416022c9SBarry Smith 
6633ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6649566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6653ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
666e457bb90SBarry Smith   if (PetscDefined(USE_DEBUG)) {
667e457bb90SBarry Smith     PetscInt mnz = 0;
668e457bb90SBarry Smith 
669e457bb90SBarry Smith     for (i = 0; i < m; i++) mnz += rowlens[i];
670e457bb90SBarry Smith     PetscCheck(nz == mnz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row lens %" PetscInt_FMT " do not sum to nz %" PetscInt_FMT, mnz, nz);
671e457bb90SBarry Smith   }
6729566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6739566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6743ea6fe3dSLisandro Dalcin   /* store column indices */
6759566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
676416022c9SBarry Smith   /* store nonzero values */
6779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6789566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
680b37d52dbSMark F. Adams 
6813ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6829566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6833ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
68417ab2063SBarry Smith }
685416022c9SBarry Smith 
686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
687d71ae5a4SJacob Faibussowitsch {
6887dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6897dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6907dc0baabSHong Zhang 
6917dc0baabSHong Zhang   PetscFunctionBegin;
6929566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6937dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6949566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
69548a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6969566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6977dc0baabSHong Zhang   }
6989566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
6993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
7007dc0baabSHong Zhang }
7017dc0baabSHong Zhang 
70209573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer);
703cd155464SBarry Smith 
704ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
705d71ae5a4SJacob Faibussowitsch {
706416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
707c898d852SStefano Zampini   const PetscScalar *av;
70860e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
709e060cb09SBarry Smith   const char        *name;
710f3ef73ceSBarry Smith   PetscViewerFormat  format;
71117ab2063SBarry Smith 
7123a40ed3dSBarry Smith   PetscFunctionBegin;
7137dc0baabSHong Zhang   if (A->structure_only) {
7149566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7153ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
7167dc0baabSHong Zhang   }
71743e49210SHong Zhang 
7189566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
719bd6a2ce3SJunchao Zhang   // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries
7203ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
7212e5835c6SStefano Zampini 
722c898d852SStefano Zampini   /* trigger copy to CPU if needed */
7239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
72571c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
72697f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
72760e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
728c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
729d00d2cf4SBarry Smith       nofinalvalue = 1;
730d00d2cf4SBarry Smith     }
7319566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7329566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7339566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
734fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7359566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
736fbfe6fa7SJed Brown #else
7379566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
738fbfe6fa7SJed Brown #endif
7399566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
74017ab2063SBarry Smith 
74117ab2063SBarry Smith     for (i = 0; i < m; i++) {
74260e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
743aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7449566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
74517ab2063SBarry Smith #else
7469566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
74717ab2063SBarry Smith #endif
74817ab2063SBarry Smith       }
74917ab2063SBarry Smith     }
750d00d2cf4SBarry Smith     if (nofinalvalue) {
751c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7529566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
753c337ccceSJed Brown #else
7549566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
755c337ccceSJed Brown #endif
756d00d2cf4SBarry Smith     }
7579566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7589566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7599566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
760fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
7619566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
76244cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7639566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
76460e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
765aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
76636db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7679566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76836db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7699566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
77036db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7719566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7726831982aSBarry Smith         }
77344cd7ae7SLois Curfman McInnes #else
7749566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
77544cd7ae7SLois Curfman McInnes #endif
77644cd7ae7SLois Curfman McInnes       }
7779566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77844cd7ae7SLois Curfman McInnes     }
7799566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
780fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
78197f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7829566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7839566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
784496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
785496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
78660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
787496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
788aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78936db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
790496be53dSLois Curfman McInnes #else
791496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
792496be53dSLois Curfman McInnes #endif
793496be53dSLois Curfman McInnes         }
794496be53dSLois Curfman McInnes       }
795496be53dSLois Curfman McInnes     }
7962e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7979566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
7982e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7992205254eSKarl Rupp       if (i + 4 < m) {
8009566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
8012205254eSKarl Rupp       } else if (i + 3 < m) {
8029566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
8032205254eSKarl Rupp       } else if (i + 2 < m) {
8049566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
8052205254eSKarl Rupp       } else if (i + 1 < m) {
8069566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
8072205254eSKarl Rupp       } else if (i < m) {
8089566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8092205254eSKarl Rupp       } else {
8109566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8112205254eSKarl Rupp       }
812496be53dSLois Curfman McInnes     }
8139566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8149566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
815496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8179566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
818496be53dSLois Curfman McInnes       }
8199566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
820496be53dSLois Curfman McInnes     }
8219566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
822496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
82360e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
824496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
825aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
82648a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
827496be53dSLois Curfman McInnes #else
8289566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
829496be53dSLois Curfman McInnes #endif
830496be53dSLois Curfman McInnes         }
831496be53dSLois Curfman McInnes       }
8329566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
833496be53dSLois Curfman McInnes     }
8349566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
835fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
83697f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
83787828ca2SBarry Smith     PetscScalar value;
83868f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83968f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
84068f1ed48SBarry Smith 
84168f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
84268f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
84368f1ed48SBarry Smith         realonly = PETSC_FALSE;
84468f1ed48SBarry Smith         break;
84568f1ed48SBarry Smith       }
84668f1ed48SBarry Smith     }
84768f1ed48SBarry Smith #endif
84802594712SBarry Smith 
8499566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
85002594712SBarry Smith     for (i = 0; i < m; i++) {
85102594712SBarry Smith       jcnt = 0;
852d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
853e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
85402594712SBarry Smith           value = a->a[cnt++];
855e24b481bSBarry Smith           jcnt++;
85602594712SBarry Smith         } else {
85702594712SBarry Smith           value = 0.0;
85802594712SBarry Smith         }
859aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
86068f1ed48SBarry Smith         if (realonly) {
8619566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
86268f1ed48SBarry Smith         } else {
8639566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
86468f1ed48SBarry Smith         }
86502594712SBarry Smith #else
8669566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
86702594712SBarry Smith #endif
86802594712SBarry Smith       }
8699566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
87002594712SBarry Smith     }
8719566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8723c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
873150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8749566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8769566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8773c215bfdSMatthew Knepley #else
8789566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8793c215bfdSMatthew Knepley #endif
8809566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8813c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
88260e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8833c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8849566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8853c215bfdSMatthew Knepley #else
8869566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8873c215bfdSMatthew Knepley #endif
8883c215bfdSMatthew Knepley       }
8893c215bfdSMatthew Knepley     }
8909566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8913a40ed3dSBarry Smith   } else {
8929566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
893d5f3da31SBarry Smith     if (A->factortype) {
89416cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8959566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
89616cd7e1dSShri Abhyankar         /* L part */
89760e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
89916cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9009566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
90116cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9029566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
90316cd7e1dSShri Abhyankar           } else {
9049566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
90516cd7e1dSShri Abhyankar           }
90616cd7e1dSShri Abhyankar #else
9079566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90816cd7e1dSShri Abhyankar #endif
90916cd7e1dSShri Abhyankar         }
91016cd7e1dSShri Abhyankar         /* diagonal */
91116cd7e1dSShri Abhyankar         j = a->diag[i];
91216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
91316cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
914835f2295SStefano Zampini           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)PetscImaginaryPart(1 / a->a[j])));
91516cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
916835f2295SStefano Zampini           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)(-PetscImaginaryPart(1 / a->a[j]))));
91716cd7e1dSShri Abhyankar         } else {
918835f2295SStefano Zampini           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1 / a->a[j])));
91916cd7e1dSShri Abhyankar         }
92016cd7e1dSShri Abhyankar #else
921835f2295SStefano Zampini         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1 / a->a[j])));
92216cd7e1dSShri Abhyankar #endif
92316cd7e1dSShri Abhyankar 
92416cd7e1dSShri Abhyankar         /* U part */
92560e0710aSBarry Smith         for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
92616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
92716cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9289566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
92916cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9309566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
93116cd7e1dSShri Abhyankar           } else {
9329566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
93316cd7e1dSShri Abhyankar           }
93416cd7e1dSShri Abhyankar #else
9359566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
93616cd7e1dSShri Abhyankar #endif
93716cd7e1dSShri Abhyankar         }
9389566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
93916cd7e1dSShri Abhyankar       }
94016cd7e1dSShri Abhyankar     } else {
94117ab2063SBarry Smith       for (i = 0; i < m; i++) {
9429566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
94360e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
944aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
94536db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9469566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
94736db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9489566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9493a40ed3dSBarry Smith           } else {
9509566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
95117ab2063SBarry Smith           }
95217ab2063SBarry Smith #else
9539566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
95417ab2063SBarry Smith #endif
95517ab2063SBarry Smith         }
9569566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
95717ab2063SBarry Smith       }
95816cd7e1dSShri Abhyankar     }
9599566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
96017ab2063SBarry Smith   }
9619566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
963416022c9SBarry Smith }
964416022c9SBarry Smith 
9659804daf3SBarry Smith #include <petscdraw.h>
966ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
967d71ae5a4SJacob Faibussowitsch {
968480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
969416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
970383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
971383922c3SLisandro Dalcin   int                color;
972b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
973b0a32e0cSBarry Smith   PetscViewer        viewer;
974f3ef73ceSBarry Smith   PetscViewerFormat  format;
975fff043a9SJunchao Zhang   const PetscScalar *aa;
976cddf8d76SBarry Smith 
9773a40ed3dSBarry Smith   PetscFunctionBegin;
9789566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9799566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9809566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
981383922c3SLisandro Dalcin 
982416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
984fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
985d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9860513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
987b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
988416022c9SBarry Smith     for (i = 0; i < m; i++) {
9899371c9d4SSatish Balay       y_l = m - i - 1.0;
9909371c9d4SSatish Balay       y_r = y_l + 1.0;
991bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9929371c9d4SSatish Balay         x_l = a->j[j];
9939371c9d4SSatish Balay         x_r = x_l + 1.0;
994fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9959566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
996cddf8d76SBarry Smith       }
997cddf8d76SBarry Smith     }
998b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
999cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10009371c9d4SSatish Balay       y_l = m - i - 1.0;
10019371c9d4SSatish Balay       y_r = y_l + 1.0;
1002bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10039371c9d4SSatish Balay         x_l = a->j[j];
10049371c9d4SSatish Balay         x_r = x_l + 1.0;
1005fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
10069566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1007cddf8d76SBarry Smith       }
1008cddf8d76SBarry Smith     }
1009b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1010cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10119371c9d4SSatish Balay       y_l = m - i - 1.0;
10129371c9d4SSatish Balay       y_r = y_l + 1.0;
1013bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10149371c9d4SSatish Balay         x_l = a->j[j];
10159371c9d4SSatish Balay         x_r = x_l + 1.0;
1016fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10179566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1018416022c9SBarry Smith       }
1019416022c9SBarry Smith     }
1020d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10210513a670SBarry Smith   } else {
10220513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10230513a670SBarry Smith     /* first determine max of all nonzero values */
1024b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1025383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1026b0a32e0cSBarry Smith     PetscDraw popup;
10270513a670SBarry Smith 
10280513a670SBarry Smith     for (i = 0; i < nz; i++) {
1029fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10300513a670SBarry Smith     }
1031383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10329566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10339566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1034383922c3SLisandro Dalcin 
1035d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10360513a670SBarry Smith     for (i = 0; i < m; i++) {
1037383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1038383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1039bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1040383922c3SLisandro Dalcin         x_l   = a->j[j];
1041383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1042fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10439566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10440513a670SBarry Smith         count++;
10450513a670SBarry Smith       }
10460513a670SBarry Smith     }
1047d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10480513a670SBarry Smith   }
10499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
10503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1051480ef9eaSBarry Smith }
1052cddf8d76SBarry Smith 
10539804daf3SBarry Smith #include <petscdraw.h>
1054ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1055d71ae5a4SJacob Faibussowitsch {
1056b0a32e0cSBarry Smith   PetscDraw draw;
105736db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1058ace3abfcSBarry Smith   PetscBool isnull;
1059480ef9eaSBarry Smith 
1060480ef9eaSBarry Smith   PetscFunctionBegin;
10619566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10629566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
10633ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
1064480ef9eaSBarry Smith 
10659371c9d4SSatish Balay   xr = A->cmap->n;
10669371c9d4SSatish Balay   yr = A->rmap->n;
10679371c9d4SSatish Balay   h  = yr / 10.0;
10689371c9d4SSatish Balay   w  = xr / 10.0;
10699371c9d4SSatish Balay   xr += w;
10709371c9d4SSatish Balay   yr += h;
10719371c9d4SSatish Balay   xl = -w;
10729371c9d4SSatish Balay   yl = -h;
10739566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10749566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10759566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10769566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10779566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10783ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1079416022c9SBarry Smith }
1080416022c9SBarry Smith 
1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1082d71ae5a4SJacob Faibussowitsch {
1083ace3abfcSBarry Smith   PetscBool iascii, isbinary, isdraw;
1084416022c9SBarry Smith 
10853a40ed3dSBarry Smith   PetscFunctionBegin;
10869566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii));
10879566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10889566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10891baa6e33SBarry Smith   if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10901baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10911baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10929566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
109417ab2063SBarry Smith }
109519bcc07fSBarry Smith 
1096d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1097d71ae5a4SJacob Faibussowitsch {
1098416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1099580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
1100bc43efbbSJunchao Zhang   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n;
110154f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
11023447b6efSHong Zhang   PetscReal   ratio = 0.6;
110317ab2063SBarry Smith 
11043a40ed3dSBarry Smith   PetscFunctionBegin;
11053ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
11069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
1107b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
1108b215bc84SStefano Zampini     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */
11099566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11103ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1111b215bc84SStefano Zampini   }
111217ab2063SBarry Smith 
111343ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
111417ab2063SBarry Smith   for (i = 1; i < m; i++) {
1115416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
111617ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
111794a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111817ab2063SBarry Smith     if (fshift) {
1119bfeeae90SHong Zhang       ip = aj + ai[i];
1120bfeeae90SHong Zhang       ap = aa + ai[i];
112117ab2063SBarry Smith       N  = ailen[i];
11229566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
112348a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
112417ab2063SBarry Smith     }
112517ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
112617ab2063SBarry Smith   }
112717ab2063SBarry Smith   if (m) {
112817ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112917ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
113017ab2063SBarry Smith   }
113117ab2063SBarry Smith   /* reset ilen and imax for each row */
11327b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1133396832f4SHong Zhang   if (A->structure_only) {
11349566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11359566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1136396832f4SHong Zhang   } else { /* !A->structure_only */
113717ab2063SBarry Smith     for (i = 0; i < m; i++) {
113817ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11397b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
114017ab2063SBarry Smith     }
1141396832f4SHong Zhang   }
1142bfeeae90SHong Zhang   a->nz = ai[m];
1143aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
1144bc43efbbSJunchao Zhang   PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly
1145bc43efbbSJunchao Zhang   a->diagonaldense = PETSC_TRUE;
1146bc43efbbSJunchao Zhang   n                = PetscMin(A->rmap->n, A->cmap->n);
1147bc43efbbSJunchao Zhang   for (i = 0; i < n; i++) {
1148bc43efbbSJunchao Zhang     if (a->diag[i] >= ai[i + 1]) {
1149bc43efbbSJunchao Zhang       a->diagonaldense = PETSC_FALSE;
1150bc43efbbSJunchao Zhang       break;
1151bc43efbbSJunchao Zhang     }
1152bc43efbbSJunchao Zhang   }
11539566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11549566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11559566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11562205254eSKarl Rupp 
11578e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1158dd5f02e7SSatish Balay   a->reallocs         = 0;
11596712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
116036db0b34SBarry Smith   a->rmax             = rmax;
11614e220ebcSLois Curfman McInnes 
116248a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11639566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
116517ab2063SBarry Smith }
116617ab2063SBarry Smith 
1167ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1168d71ae5a4SJacob Faibussowitsch {
116999cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
117099cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11712e5835c6SStefano Zampini   MatScalar  *aa;
117299cafbc1SBarry Smith 
117399cafbc1SBarry Smith   PetscFunctionBegin;
11749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
117599cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11783ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
117999cafbc1SBarry Smith }
118099cafbc1SBarry Smith 
1181ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1182d71ae5a4SJacob Faibussowitsch {
118399cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
118499cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11852e5835c6SStefano Zampini   MatScalar  *aa;
118699cafbc1SBarry Smith 
118799cafbc1SBarry Smith   PetscFunctionBegin;
11889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
118999cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
119399cafbc1SBarry Smith }
119499cafbc1SBarry Smith 
1195d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1196d71ae5a4SJacob Faibussowitsch {
1197fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1198fff043a9SJunchao Zhang   MatScalar  *aa;
11993a40ed3dSBarry Smith 
12003a40ed3dSBarry Smith   PetscFunctionBegin;
12019566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
12029566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
12039566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
12049566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
12053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
120617ab2063SBarry Smith }
1207416022c9SBarry Smith 
1208674b392bSAlexander static PetscErrorCode MatReset_SeqAIJ(Mat A)
1209d71ae5a4SJacob Faibussowitsch {
1210416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1211d5d45c9bSBarry Smith 
12123a40ed3dSBarry Smith   PetscFunctionBegin;
1213b4e2f619SBarry Smith   if (A->hash_active) {
1214e3c72094SPierre Jolivet     A->ops[0] = a->cops;
1215b4e2f619SBarry Smith     PetscCall(PetscHMapIJVDestroy(&a->ht));
1216b4e2f619SBarry Smith     PetscCall(PetscFree(a->dnz));
1217b4e2f619SBarry Smith     A->hash_active = PETSC_FALSE;
1218b4e2f619SBarry Smith   }
1219b4e2f619SBarry Smith 
12203ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz));
12219566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12229566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12239566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12249566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12259566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12269566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12279566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12289566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12299566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12309566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12319566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12329566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
12339566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12349566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
1235674b392bSAlexander   PetscFunctionReturn(PETSC_SUCCESS);
1236674b392bSAlexander }
1237674b392bSAlexander 
1238674b392bSAlexander static PetscErrorCode MatResetHash_SeqAIJ(Mat A)
1239674b392bSAlexander {
1240674b392bSAlexander   PetscFunctionBegin;
1241674b392bSAlexander   PetscCall(MatReset_SeqAIJ(A));
1242674b392bSAlexander   PetscCall(MatCreate_SeqAIJ_Inode(A));
1243674b392bSAlexander   PetscCall(MatSetUp_Seq_Hash(A));
1244674b392bSAlexander   A->nonzerostate++;
1245674b392bSAlexander   PetscFunctionReturn(PETSC_SUCCESS);
1246674b392bSAlexander }
1247674b392bSAlexander 
1248674b392bSAlexander PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1249674b392bSAlexander {
1250674b392bSAlexander   PetscFunctionBegin;
1251674b392bSAlexander   PetscCall(MatReset_SeqAIJ(A));
12529566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1253901853e0SKris Buschelman 
12546718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12556718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12566718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12576718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12586718818eSStefano Zampini      due to different matrix sizes */
12599566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12606718818eSStefano Zampini 
12619566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12622e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12632e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12649566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12659566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12669566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12679566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12689566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12699566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12702e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12712e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12722e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12732e956fe4SStefano Zampini #endif
12744222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12784222ddf1SHong Zhang #endif
1279d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
1280d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL));
1281d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL));
1282d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL));
1283d5e393b6SSuyash Tandon #endif
12843d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12863d0639e7SStefano Zampini #endif
12879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1288af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12899566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1290af8000cdSHong Zhang #endif
1291d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
12929566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1293d24d4204SJose E. Roman #endif
129463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12959566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12969566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
129763c07aadSStefano Zampini #endif
12989566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12999566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
13009566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
13019566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
13022e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
13039566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
13049566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
1305674b392bSAlexander   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetHash_C", NULL));
13069566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
13079566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
13089566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
13099566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
13109566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
13119566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
13129566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
13139566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
13142e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
13152e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
13162e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
13172e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
13182e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
13192e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
13202e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
13213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
132217ab2063SBarry Smith }
132317ab2063SBarry Smith 
1324d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1325d71ae5a4SJacob Faibussowitsch {
1326416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
13273a40ed3dSBarry Smith 
13283a40ed3dSBarry Smith   PetscFunctionBegin;
1329a65d3064SKris Buschelman   switch (op) {
1330d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1331d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1332d71ae5a4SJacob Faibussowitsch     break;
1333d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1334d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1335d71ae5a4SJacob Faibussowitsch     break;
1336d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1337d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1338d71ae5a4SJacob Faibussowitsch     break;
1339d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1340d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1341d71ae5a4SJacob Faibussowitsch     break;
1342d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1343d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1344d71ae5a4SJacob Faibussowitsch     break;
1345d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1346d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1347d71ae5a4SJacob Faibussowitsch     break;
1348d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1349d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1350d71ae5a4SJacob Faibussowitsch     break;
1351d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1352d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1353d71ae5a4SJacob Faibussowitsch     break;
1354d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1355d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1356d71ae5a4SJacob Faibussowitsch     break;
1357071fcb05SBarry Smith   case MAT_SORTED_FULL:
1358071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1359071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1360071fcb05SBarry Smith     break;
1361d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1362d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1363d71ae5a4SJacob Faibussowitsch     break;
1364d71ae5a4SJacob Faibussowitsch   default:
1365888c827cSStefano Zampini     break;
1366a65d3064SKris Buschelman   }
13673ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
136817ab2063SBarry Smith }
136917ab2063SBarry Smith 
1370ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1371d71ae5a4SJacob Faibussowitsch {
1372416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1373fdc842d1SBarry Smith   PetscInt           i, j, n, *ai = a->i, *aj = a->j;
1374c898d852SStefano Zampini   PetscScalar       *x;
1375c898d852SStefano Zampini   const PetscScalar *aa;
137617ab2063SBarry Smith 
13773a40ed3dSBarry Smith   PetscFunctionBegin;
13789566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
137908401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1381d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1382d3e70bfaSHong Zhang     PetscInt *diag = a->diag;
13839566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
13842c990fa1SHong Zhang     for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13859566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13869566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13873ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
138835e7444dSHong Zhang   }
138935e7444dSHong Zhang 
13909566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
139135e7444dSHong Zhang   for (i = 0; i < n; i++) {
1392fdc842d1SBarry Smith     x[i] = 0.0;
139335e7444dSHong Zhang     for (j = ai[i]; j < ai[i + 1]; j++) {
139435e7444dSHong Zhang       if (aj[j] == i) {
139535e7444dSHong Zhang         x[i] = aa[j];
139617ab2063SBarry Smith         break;
139717ab2063SBarry Smith       }
139817ab2063SBarry Smith     }
139917ab2063SBarry Smith   }
14009566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
14019566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14023ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
140317ab2063SBarry Smith }
140417ab2063SBarry Smith 
1405c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1406d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1407d71ae5a4SJacob Faibussowitsch {
1408416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
14095f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1410d9ca1df4SBarry Smith   PetscScalar       *y;
1411d9ca1df4SBarry Smith   const PetscScalar *x;
1412d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
14135c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
14145f22a7b3SSebastian Grimberg   const MatScalar  *v;
1415a77337e4SBarry Smith   PetscScalar       alpha;
1416d9ca1df4SBarry Smith   PetscInt          n, i, j;
1417d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14183447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1419ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14205c897100SBarry Smith #endif
142117ab2063SBarry Smith 
14223a40ed3dSBarry Smith   PetscFunctionBegin;
14239566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14249566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14259566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14269566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14275c897100SBarry Smith 
14285c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1429fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14305c897100SBarry Smith #else
14313447b6efSHong Zhang   if (usecprow) {
14323447b6efSHong Zhang     m    = cprow.nrows;
14333447b6efSHong Zhang     ii   = cprow.i;
14347b2bb3b9SHong Zhang     ridx = cprow.rindex;
14353447b6efSHong Zhang   } else {
14363447b6efSHong Zhang     ii = a->i;
14373447b6efSHong Zhang   }
143817ab2063SBarry Smith   for (i = 0; i < m; i++) {
14393447b6efSHong Zhang     idx = a->j + ii[i];
1440fff043a9SJunchao Zhang     v   = aa + ii[i];
14413447b6efSHong Zhang     n   = ii[i + 1] - ii[i];
14423447b6efSHong Zhang     if (usecprow) {
14437b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14443447b6efSHong Zhang     } else {
144517ab2063SBarry Smith       alpha = x[i];
14463447b6efSHong Zhang     }
144704fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
144817ab2063SBarry Smith   }
14495c897100SBarry Smith #endif
14509566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14519566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14529566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14539566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14543ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
145517ab2063SBarry Smith }
145617ab2063SBarry Smith 
1457d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1458d71ae5a4SJacob Faibussowitsch {
14595c897100SBarry Smith   PetscFunctionBegin;
14609566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14619566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14635c897100SBarry Smith }
14645c897100SBarry Smith 
1465c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
146678b84d54SShri Abhyankar 
1467d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1468d71ae5a4SJacob Faibussowitsch {
1469416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1470d9fead3dSBarry Smith   PetscScalar       *y;
147154f21887SBarry Smith   const PetscScalar *x;
14725914357eSBarry Smith   const MatScalar   *a_a;
1473003131ecSBarry Smith   PetscInt           m = A->rmap->n;
14745914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
1475ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
147617ab2063SBarry Smith 
1477b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
147897952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1479fee21e36SBarry Smith #endif
1480fee21e36SBarry Smith 
14813a40ed3dSBarry Smith   PetscFunctionBegin;
1482b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14839566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
14843ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1485b215bc84SStefano Zampini   }
14869566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14879566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14889566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1489416022c9SBarry Smith   ii = a->i;
14904eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14919566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
149297952fefSHong Zhang     m    = a->compressedrow.nrows;
149397952fefSHong Zhang     ii   = a->compressedrow.i;
149497952fefSHong Zhang     ridx = a->compressedrow.rindex;
14955914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
14965914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
14975914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
14985914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
14995914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
15005914357eSBarry Smith       PetscScalar        sum = 0.0;
1501003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1502003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
150397952fefSHong Zhang       y[*ridx++] = sum;
150497952fefSHong Zhang     }
150597952fefSHong Zhang   } else { /* do not use compressed row format */
1506b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
15075914357eSBarry Smith     fortranmultaij_(&m, x, ii, a->j, a_a, y);
1508b05257ddSBarry Smith #else
15095914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
15105914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
15115914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
15125914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
15135914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
15145914357eSBarry Smith       PetscScalar        sum = 0.0;
1515003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
151617ab2063SBarry Smith       y[i] = sum;
151717ab2063SBarry Smith     }
15188d195f9aSBarry Smith #endif
1519b05257ddSBarry Smith   }
15209566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15219566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15229566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
152517ab2063SBarry Smith }
152617ab2063SBarry Smith 
1527ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1528ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1529d71ae5a4SJacob Faibussowitsch {
1530b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1531b434eb95SMatthew G. Knepley   PetscScalar       *y;
1532b434eb95SMatthew G. Knepley   const PetscScalar *x;
1533fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1534b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1535b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1536b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1537b434eb95SMatthew G. Knepley   PetscScalar        sum;
1538b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1539b434eb95SMatthew G. Knepley 
1540b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1541b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1542b434eb95SMatthew G. Knepley #endif
1543b434eb95SMatthew G. Knepley 
1544b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15459566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15469566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15479566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1548b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1549b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1550b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1551b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1552b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1553b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1554b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1555fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1556b434eb95SMatthew G. Knepley       sum = 0.0;
1557b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1558b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1559b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1560b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1561b434eb95SMatthew G. Knepley     }
1562b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15633d3eaba7SBarry Smith     ii = a->i;
1564b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1565b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1566b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1567fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1568b434eb95SMatthew G. Knepley       sum = 0.0;
1569b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1570b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1571b434eb95SMatthew G. Knepley       y[i] = sum;
1572b434eb95SMatthew G. Knepley     }
1573b434eb95SMatthew G. Knepley   }
15749566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15759566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15769566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15783ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1579b434eb95SMatthew G. Knepley }
1580b434eb95SMatthew G. Knepley 
1581ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1582ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1583d71ae5a4SJacob Faibussowitsch {
1584b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1585b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1586b434eb95SMatthew G. Knepley   const PetscScalar *x;
1587fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1588b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1589b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1590b434eb95SMatthew G. Knepley   PetscScalar        sum;
1591b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1592b434eb95SMatthew G. Knepley 
1593b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15959566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15969566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1597b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
159848a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1599b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1600b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1601b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1602b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1603b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1604b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1605fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1606b434eb95SMatthew G. Knepley       sum = y[*ridx];
1607b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1608b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1609b434eb95SMatthew G. Knepley     }
1610b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
16113d3eaba7SBarry Smith     ii = a->i;
1612b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1613b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1614b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1615fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1616b434eb95SMatthew G. Knepley       sum = y[i];
1617b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1618b434eb95SMatthew G. Knepley       z[i] = sum;
1619b434eb95SMatthew G. Knepley     }
1620b434eb95SMatthew G. Knepley   }
16219566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16229566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16239566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16253ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1626b434eb95SMatthew G. Knepley }
1627b434eb95SMatthew G. Knepley 
1628c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1629d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1630d71ae5a4SJacob Faibussowitsch {
1631416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1632f15663dcSBarry Smith   PetscScalar       *y, *z;
1633f15663dcSBarry Smith   const PetscScalar *x;
16345914357eSBarry Smith   const MatScalar   *a_a;
16355914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
16365914357eSBarry Smith   PetscInt           m        = A->rmap->n;
1637ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16389ea0dfa2SSatish Balay 
16393a40ed3dSBarry Smith   PetscFunctionBegin;
1640b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16419566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
16423ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1643b215bc84SStefano Zampini   }
16449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16459566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16469566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16474eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
164848a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
164997952fefSHong Zhang     m    = a->compressedrow.nrows;
165097952fefSHong Zhang     ii   = a->compressedrow.i;
165197952fefSHong Zhang     ridx = a->compressedrow.rindex;
16525914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16535914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16545914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16555914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16565914357eSBarry Smith       PetscScalar        sum = y[*ridx];
1657f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
165897952fefSHong Zhang       z[*ridx++] = sum;
165997952fefSHong Zhang     }
166097952fefSHong Zhang   } else { /* do not use compressed row format */
16613d3eaba7SBarry Smith     ii = a->i;
1662f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
16635914357eSBarry Smith     fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z);
1664f15663dcSBarry Smith #else
16655914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
16665914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16675914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16685914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16695914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16705914357eSBarry Smith       PetscScalar        sum = y[i];
1671f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
167217ab2063SBarry Smith       z[i] = sum;
167317ab2063SBarry Smith     }
167402ab625aSSatish Balay #endif
1675f15663dcSBarry Smith   }
16769566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16779566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16789566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
168117ab2063SBarry Smith }
168217ab2063SBarry Smith 
168317ab2063SBarry Smith /*
16840b4b7b1cSBarry Smith      Adds diagonal pointers to sparse matrix nonzero structure.
168517ab2063SBarry Smith */
1686d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
1687d71ae5a4SJacob Faibussowitsch {
1688416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1689d0f46423SBarry Smith   PetscInt    i, j, m = A->rmap->n;
1690c0c07093SJunchao Zhang   PetscBool   alreadySet = PETSC_TRUE;
169117ab2063SBarry Smith 
16923a40ed3dSBarry Smith   PetscFunctionBegin;
169309f38230SBarry Smith   if (!a->diag) {
16949566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &a->diag));
1695c0c07093SJunchao Zhang     alreadySet = PETSC_FALSE;
169609f38230SBarry Smith   }
1697d0f46423SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
1698c0c07093SJunchao Zhang     /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */
1699c0c07093SJunchao Zhang     if (alreadySet) {
1700c0c07093SJunchao Zhang       PetscInt pos = a->diag[i];
1701c0c07093SJunchao Zhang       if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue;
1702c0c07093SJunchao Zhang     }
1703c0c07093SJunchao Zhang 
170409f38230SBarry Smith     a->diag[i] = a->i[i + 1];
1705bfeeae90SHong Zhang     for (j = a->i[i]; j < a->i[i + 1]; j++) {
1706bfeeae90SHong Zhang       if (a->j[j] == i) {
170709f38230SBarry Smith         a->diag[i] = j;
170817ab2063SBarry Smith         break;
170917ab2063SBarry Smith       }
171017ab2063SBarry Smith     }
171117ab2063SBarry Smith   }
17123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
171317ab2063SBarry Smith }
171417ab2063SBarry Smith 
1715ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1716d71ae5a4SJacob Faibussowitsch {
171761ecd0c6SBarry Smith   Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
171861ecd0c6SBarry Smith   const PetscInt *diag = (const PetscInt *)a->diag;
171961ecd0c6SBarry Smith   const PetscInt *ii   = (const PetscInt *)a->i;
172061ecd0c6SBarry Smith   PetscInt        i, *mdiag = NULL;
172161ecd0c6SBarry Smith   PetscInt        cnt = 0; /* how many diagonals are missing */
172261ecd0c6SBarry Smith 
172361ecd0c6SBarry Smith   PetscFunctionBegin;
172461ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
17259566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
17269566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
17273ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
172861ecd0c6SBarry Smith   }
172961ecd0c6SBarry Smith 
173061ecd0c6SBarry Smith   if (a->diagonaldense) {
173161ecd0c6SBarry Smith     cnt = 0;
173261ecd0c6SBarry Smith   } else {
17339566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
173461ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
1735349d3b71SJunchao Zhang       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
173661ecd0c6SBarry Smith         cnt++;
173761ecd0c6SBarry Smith         mdiag[i] = 1;
173861ecd0c6SBarry Smith       }
173961ecd0c6SBarry Smith     }
174061ecd0c6SBarry Smith   }
174161ecd0c6SBarry Smith   if (!cnt) {
17429566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
174361ecd0c6SBarry Smith   } else {
1744b6f2aa54SBarry Smith     PetscScalar       *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1745b6f2aa54SBarry Smith     PetscInt          *oldj = a->j, *oldi = a->i;
17469f0612e4SBarry Smith     PetscBool          free_a = a->free_a, free_ij = a->free_ij;
17476ea2a7edSJunchao Zhang     const PetscScalar *Aa;
17486ea2a7edSJunchao Zhang 
17496ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host
17506ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa));
175161ecd0c6SBarry Smith 
175261ecd0c6SBarry Smith     a->a = NULL;
175361ecd0c6SBarry Smith     a->j = NULL;
175461ecd0c6SBarry Smith     a->i = NULL;
175561ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
1756ad540459SPierre Jolivet     for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17579566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
175861ecd0c6SBarry Smith 
175961ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
176061ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
17619566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
176248a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1763447d62f5SStefano Zampini     }
17649566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17659566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
17669f0612e4SBarry Smith     if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda));
17679f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj));
17689f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi));
176961ecd0c6SBarry Smith   }
17709566063dSJacob Faibussowitsch   PetscCall(PetscFree(mdiag));
177161ecd0c6SBarry Smith   a->diagonaldense = PETSC_TRUE;
17723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
177361ecd0c6SBarry Smith }
177461ecd0c6SBarry Smith 
1775be5855fcSBarry Smith /*
1776be5855fcSBarry Smith      Checks for missing diagonals
1777be5855fcSBarry Smith */
1778d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d)
1779d71ae5a4SJacob Faibussowitsch {
1780be5855fcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
17817734d3b5SMatthew G. Knepley   PetscInt   *diag, *ii = a->i, i;
1782be5855fcSBarry Smith 
1783be5855fcSBarry Smith   PetscFunctionBegin;
178409f38230SBarry Smith   *missing = PETSC_FALSE;
17857734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
178609f38230SBarry Smith     *missing = PETSC_TRUE;
178709f38230SBarry Smith     if (d) *d = 0;
17889566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
178909f38230SBarry Smith   } else {
179001445905SHong Zhang     PetscInt n;
179101445905SHong Zhang     n    = PetscMin(A->rmap->n, A->cmap->n);
1792f1e2ffcdSBarry Smith     diag = a->diag;
179301445905SHong Zhang     for (i = 0; i < n; i++) {
17947734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
179509f38230SBarry Smith         *missing = PETSC_TRUE;
179609f38230SBarry Smith         if (d) *d = i;
17979566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i));
1798358d2f5dSShri Abhyankar         break;
179909f38230SBarry Smith       }
1800be5855fcSBarry Smith     }
1801be5855fcSBarry Smith   }
18023ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1803be5855fcSBarry Smith }
1804be5855fcSBarry Smith 
18050da83c2eSBarry Smith #include <petscblaslapack.h>
18060da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
18070da83c2eSBarry Smith 
18080da83c2eSBarry Smith /*
18090da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
18100da83c2eSBarry Smith */
1811ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1812d71ae5a4SJacob Faibussowitsch {
18130da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
18140da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
18150da83c2eSBarry Smith   const PetscReal shift = 0.0;
18160da83c2eSBarry Smith   PetscInt        ipvt[5];
18174e208921SJed Brown   PetscCount      flops = 0;
18180da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
18190da83c2eSBarry Smith 
18200da83c2eSBarry Smith   PetscFunctionBegin;
18210da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
18220da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
182308401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1824ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
18259566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
182648a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
18270da83c2eSBarry Smith   ncnt = 0;
18280da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
18290da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
18309566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
18310da83c2eSBarry Smith     switch (bsizes[i]) {
1832d71ae5a4SJacob Faibussowitsch     case 1:
1833d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1834d71ae5a4SJacob Faibussowitsch       break;
18350da83c2eSBarry Smith     case 2:
18369566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
18370da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18389566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
18390da83c2eSBarry Smith       break;
18400da83c2eSBarry Smith     case 3:
18419566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
18420da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18439566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
18440da83c2eSBarry Smith       break;
18450da83c2eSBarry Smith     case 4:
18469566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
18470da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18489566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
18490da83c2eSBarry Smith       break;
18500da83c2eSBarry Smith     case 5:
18519566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
18520da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18539566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
18540da83c2eSBarry Smith       break;
18550da83c2eSBarry Smith     case 6:
18569566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
18570da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18589566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
18590da83c2eSBarry Smith       break;
18600da83c2eSBarry Smith     case 7:
18619566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
18620da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18639566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
18640da83c2eSBarry Smith       break;
18650da83c2eSBarry Smith     default:
18669566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
18670da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18689566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
18690da83c2eSBarry Smith     }
18700da83c2eSBarry Smith     ncnt += bsizes[i];
18710da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
1872baa50dc0SBrad Aagaard     flops += 2 * PetscPowInt64(bsizes[i], 3) / 3;
18730da83c2eSBarry Smith   }
18743ba16761SJacob Faibussowitsch   PetscCall(PetscLogFlops(flops));
187548a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18769566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18780da83c2eSBarry Smith }
18790da83c2eSBarry Smith 
1880422a814eSBarry Smith /*
1881422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1882422a814eSBarry Smith */
1883ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1884d71ae5a4SJacob Faibussowitsch {
188571f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1886d0f46423SBarry Smith   PetscInt         i, *diag, m = A->rmap->n;
18872e5835c6SStefano Zampini   const MatScalar *v;
188854f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
188971f1c65dSBarry Smith 
189071f1c65dSBarry Smith   PetscFunctionBegin;
18913ba16761SJacob Faibussowitsch   if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS);
18929566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
189371f1c65dSBarry Smith   diag = a->diag;
18944dfa11a4SJacob Faibussowitsch   if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); }
18952e5835c6SStefano Zampini 
189671f1c65dSBarry Smith   mdiag = a->mdiag;
189771f1c65dSBarry Smith   idiag = a->idiag;
18989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1899422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
190071f1c65dSBarry Smith     for (i = 0; i < m; i++) {
190171f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1902899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1903899639b0SHong Zhang         if (PetscRealPart(fshift)) {
19049566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
19057b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
19067b6c816cSBarry Smith           A->factorerror_zeropivot_value = 0.0;
19077b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
190898921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
1909899639b0SHong Zhang       }
191071f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
191171f1c65dSBarry Smith     }
19129566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
191371f1c65dSBarry Smith   } else {
191471f1c65dSBarry Smith     for (i = 0; i < m; i++) {
191571f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
191671f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
191771f1c65dSBarry Smith     }
19189566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
191971f1c65dSBarry Smith   }
192071f1c65dSBarry Smith   a->idiagvalid = PETSC_TRUE;
19219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
19223ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
192371f1c65dSBarry Smith }
192471f1c65dSBarry Smith 
1925d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1926d71ae5a4SJacob Faibussowitsch {
1927416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1928e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
19292e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
193054f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
19313d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
193297f1f81fSBarry Smith   const PetscInt    *idx, *diag;
193317ab2063SBarry Smith 
19343a40ed3dSBarry Smith   PetscFunctionBegin;
1935b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
19369566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
19373ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1938b215bc84SStefano Zampini   }
1939b965ef7fSBarry Smith   its = its * lits;
194091723122SBarry Smith 
194171f1c65dSBarry Smith   if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
19429566063dSJacob Faibussowitsch   if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift));
194371f1c65dSBarry Smith   a->fshift = fshift;
194471f1c65dSBarry Smith   a->omega  = omega;
1945ed480e8bSBarry Smith 
194671f1c65dSBarry Smith   diag  = a->diag;
194771f1c65dSBarry Smith   t     = a->ssor_work;
1948ed480e8bSBarry Smith   idiag = a->idiag;
194971f1c65dSBarry Smith   mdiag = a->mdiag;
1950ed480e8bSBarry Smith 
19519566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
19529566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
19539566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1954ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
195517ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
195617ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1957ed480e8bSBarry Smith     bs = b;
195817ab2063SBarry Smith     for (i = 0; i < m; i++) {
195971f1c65dSBarry Smith       d   = fshift + mdiag[i];
1960416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1961ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19622e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
196317ab2063SBarry Smith       sum = b[i] * d / omega;
1964003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
196517ab2063SBarry Smith       x[i] = sum;
196617ab2063SBarry Smith     }
19679566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19689566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19699566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
19709566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
19713ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
197217ab2063SBarry Smith   }
1973c783ea89SBarry Smith 
197408401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1975f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19764c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1977887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
197817ab2063SBarry Smith 
197917ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
198017ab2063SBarry Smith 
1981887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
198217ab2063SBarry Smith     */
198317ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
198417ab2063SBarry Smith 
198517ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
198617ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1987416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1988ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19892e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
199017ab2063SBarry Smith       sum = b[i];
1991e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1992ed480e8bSBarry Smith       x[i] = sum * idiag[i];
199317ab2063SBarry Smith     }
199417ab2063SBarry Smith 
199517ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19962e5835c6SStefano Zampini     v = aa;
19972205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
199817ab2063SBarry Smith 
199917ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
2000ed480e8bSBarry Smith     ts   = t;
2001416022c9SBarry Smith     diag = a->diag;
200217ab2063SBarry Smith     for (i = 0; i < m; i++) {
2003416022c9SBarry Smith       n   = diag[i] - a->i[i];
2004ed480e8bSBarry Smith       idx = a->j + a->i[i];
20052e5835c6SStefano Zampini       v   = aa + a->i[i];
200617ab2063SBarry Smith       sum = t[i];
2007003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
2008ed480e8bSBarry Smith       t[i] = sum * idiag[i];
2009733d66baSBarry Smith       /*  x = x + t */
2010733d66baSBarry Smith       x[i] += t[i];
201117ab2063SBarry Smith     }
201217ab2063SBarry Smith 
20139566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
20149566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
20159566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
20163ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
201717ab2063SBarry Smith   }
201817ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
201917ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
202017ab2063SBarry Smith       for (i = 0; i < m; i++) {
2021416022c9SBarry Smith         n   = diag[i] - a->i[i];
2022ed480e8bSBarry Smith         idx = a->j + a->i[i];
20232e5835c6SStefano Zampini         v   = aa + a->i[i];
202417ab2063SBarry Smith         sum = b[i];
2025e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20265c99c7daSBarry Smith         t[i] = sum;
2027ed480e8bSBarry Smith         x[i] = sum * idiag[i];
202817ab2063SBarry Smith       }
20295c99c7daSBarry Smith       xb = t;
20309566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
20313a40ed3dSBarry Smith     } else xb = b;
203217ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
203317ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2034416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
2035ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
20362e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
203717ab2063SBarry Smith         sum = xb[i];
2038e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20395c99c7daSBarry Smith         if (xb == b) {
2040ed480e8bSBarry Smith           x[i] = sum * idiag[i];
20415c99c7daSBarry Smith         } else {
2042b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
204317ab2063SBarry Smith         }
20445c99c7daSBarry Smith       }
20459566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
204617ab2063SBarry Smith     }
204717ab2063SBarry Smith     its--;
204817ab2063SBarry Smith   }
204917ab2063SBarry Smith   while (its--) {
205017ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
205117ab2063SBarry Smith       for (i = 0; i < m; i++) {
2052b19a5dc2SMark Adams         /* lower */
2053b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
2054ed480e8bSBarry Smith         idx = a->j + a->i[i];
20552e5835c6SStefano Zampini         v   = aa + a->i[i];
205617ab2063SBarry Smith         sum = b[i];
2057e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2058b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
2059b19a5dc2SMark Adams         /* upper */
2060b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
2061b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
20622e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
2063b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2064b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
206517ab2063SBarry Smith       }
2066b19a5dc2SMark Adams       xb = t;
20679566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
2068b19a5dc2SMark Adams     } else xb = b;
206917ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
207017ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2071b19a5dc2SMark Adams         sum = xb[i];
2072b19a5dc2SMark Adams         if (xb == b) {
2073b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
2074416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
2075ed480e8bSBarry Smith           idx = a->j + a->i[i];
20762e5835c6SStefano Zampini           v   = aa + a->i[i];
2077e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2078ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2079b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2080b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2081b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20822e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2083b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2084b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
208517ab2063SBarry Smith         }
2086b19a5dc2SMark Adams       }
2087b19a5dc2SMark Adams       if (xb == b) {
20889566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2089b19a5dc2SMark Adams       } else {
20909566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2091b19a5dc2SMark Adams       }
209217ab2063SBarry Smith     }
209317ab2063SBarry Smith   }
20949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20959566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20969566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
20973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
209817ab2063SBarry Smith }
209917ab2063SBarry Smith 
2100ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2101d71ae5a4SJacob Faibussowitsch {
2102416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
21034e220ebcSLois Curfman McInnes 
21043a40ed3dSBarry Smith   PetscFunctionBegin;
21054e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
21063966268fSBarry Smith   info->nz_allocated = a->maxnz;
21073966268fSBarry Smith   info->nz_used      = a->nz;
21083966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
21093966268fSBarry Smith   info->assemblies   = A->num_ass;
21103966268fSBarry Smith   info->mallocs      = A->info.mallocs;
21114dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2112d5f3da31SBarry Smith   if (A->factortype) {
21134e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
21144e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
21154e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
21164e220ebcSLois Curfman McInnes   } else {
21174e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
21184e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
21194e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
21204e220ebcSLois Curfman McInnes   }
21213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
212217ab2063SBarry Smith }
212317ab2063SBarry Smith 
2124ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2125d71ae5a4SJacob Faibussowitsch {
2126416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2127c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
212897b48c8fSBarry Smith   const PetscScalar *xx;
21292e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2130c7da8527SEric Chamberland   PetscInt           d = 0;
213117ab2063SBarry Smith 
21323a40ed3dSBarry Smith   PetscFunctionBegin;
213397b48c8fSBarry Smith   if (x && b) {
21349566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21359566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
213697b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2137aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2138447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
213997b48c8fSBarry Smith       bb[rows[i]] = diag * xx[rows[i]];
214097b48c8fSBarry Smith     }
21419566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21429566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
214397b48c8fSBarry Smith   }
214497b48c8fSBarry Smith 
21459566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2146a9817697SBarry Smith   if (a->keepnonzeropattern) {
2147f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2148aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21499566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2150f1e2ffcdSBarry Smith     }
2151f4df32b1SMatthew Knepley     if (diag != 0.0) {
2152c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2153c7da8527SEric Chamberland         d = rows[i];
2154447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
215508401ef6SPierre Jolivet         PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
2156c7da8527SEric Chamberland       }
2157f1e2ffcdSBarry Smith       for (i = 0; i < N; i++) {
2158447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
21592e5835c6SStefano Zampini         aa[a->diag[rows[i]]] = diag;
2160f1e2ffcdSBarry Smith       }
2161f1e2ffcdSBarry Smith     }
2162f1e2ffcdSBarry Smith   } else {
2163f4df32b1SMatthew Knepley     if (diag != 0.0) {
216417ab2063SBarry Smith       for (i = 0; i < N; i++) {
2165aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21667ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2167447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2168447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2169447d62f5SStefano Zampini           } else {
2170416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
21712e5835c6SStefano Zampini             aa[a->i[rows[i]]]   = diag;
2172bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2173447d62f5SStefano Zampini           }
2174447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
21759566063dSJacob Faibussowitsch           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
217617ab2063SBarry Smith         }
217717ab2063SBarry Smith       }
21783a40ed3dSBarry Smith     } else {
217917ab2063SBarry Smith       for (i = 0; i < N; i++) {
2180aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2181416022c9SBarry Smith         a->ilen[rows[i]] = 0;
218217ab2063SBarry Smith       }
218317ab2063SBarry Smith     }
2184e56f5c9eSBarry Smith     A->nonzerostate++;
2185f1e2ffcdSBarry Smith   }
21869566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2187dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
218917ab2063SBarry Smith }
219017ab2063SBarry Smith 
2191ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2192d71ae5a4SJacob Faibussowitsch {
21936e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21946e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
21952b40b63fSBarry Smith   PetscBool          missing, *zeroed, vecs = PETSC_FALSE;
21966e169961SBarry Smith   const PetscScalar *xx;
21972e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
21986e169961SBarry Smith 
21996e169961SBarry Smith   PetscFunctionBegin;
22003ba16761SJacob Faibussowitsch   if (!N) PetscFunctionReturn(PETSC_SUCCESS);
22019566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
22026e169961SBarry Smith   if (x && b) {
22039566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
22049566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
22052b40b63fSBarry Smith     vecs = PETSC_TRUE;
22066e169961SBarry Smith   }
22079566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
22086e169961SBarry Smith   for (i = 0; i < N; i++) {
2209aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
22108e3a54c0SPierre Jolivet     PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]]));
22112205254eSKarl Rupp 
22126e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
22136e169961SBarry Smith   }
22146e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
22156e169961SBarry Smith     if (!zeroed[i]) {
22166e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
22174cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
22182e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
22192e5835c6SStefano Zampini           aa[j] = 0.0;
22206e169961SBarry Smith         }
22216e169961SBarry Smith       }
22224cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i];
22236e169961SBarry Smith   }
22246e169961SBarry Smith   if (x && b) {
22259566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
22269566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
22276e169961SBarry Smith   }
22289566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
22296e169961SBarry Smith   if (diag != 0.0) {
22309566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d));
22311d5a398dSstefano_zampini     if (missing) {
22321d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
22334cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2234aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
22359566063dSJacob Faibussowitsch         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
22361d5a398dSstefano_zampini       }
22371d5a398dSstefano_zampini     } else {
2238ad540459SPierre Jolivet       for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag;
22396e169961SBarry Smith     }
22401d5a398dSstefano_zampini   }
22419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2242dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
22433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22446e169961SBarry Smith }
22456e169961SBarry Smith 
2246d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2247d71ae5a4SJacob Faibussowitsch {
2248fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2249fff043a9SJunchao Zhang   const PetscScalar *aa;
225017ab2063SBarry Smith 
22513a40ed3dSBarry Smith   PetscFunctionBegin;
22529566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2253416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
22548e3a54c0SPierre Jolivet   if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]);
225517ab2063SBarry Smith   if (idx) {
22565c0db29aSPierre Jolivet     if (*nz && a->j) *idx = a->j + a->i[row];
2257f4259b30SLisandro Dalcin     else *idx = NULL;
225817ab2063SBarry Smith   }
22599566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
22603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
226117ab2063SBarry Smith }
226217ab2063SBarry Smith 
2263d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2264d71ae5a4SJacob Faibussowitsch {
22653a40ed3dSBarry Smith   PetscFunctionBegin;
22663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
226717ab2063SBarry Smith }
226817ab2063SBarry Smith 
2269ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2270d71ae5a4SJacob Faibussowitsch {
2271416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
22722e5835c6SStefano Zampini   const MatScalar *v;
227336db0b34SBarry Smith   PetscReal        sum = 0.0;
227497f1f81fSBarry Smith   PetscInt         i, j;
227517ab2063SBarry Smith 
22763a40ed3dSBarry Smith   PetscFunctionBegin;
22779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
227817ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2279570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2280570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2281792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2282570b7f6dSBarry Smith #else
2283416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22849371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22859371c9d4SSatish Balay       v++;
228617ab2063SBarry Smith     }
22878f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2288570b7f6dSBarry Smith #endif
22899566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22903a40ed3dSBarry Smith   } else if (type == NORM_1) {
229136db0b34SBarry Smith     PetscReal *tmp;
229297f1f81fSBarry Smith     PetscInt  *jj = a->j;
22939566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp));
2294064f8208SBarry Smith     *nrm = 0.0;
2295416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22969371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22979371c9d4SSatish Balay       v++;
229817ab2063SBarry Smith     }
2299d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2300064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
230117ab2063SBarry Smith     }
23029566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
23039566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
23043a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2305064f8208SBarry Smith     *nrm = 0.0;
2306d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
23078e3a54c0SPierre Jolivet       const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]);
230817ab2063SBarry Smith       sum                   = 0.0;
2309416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
23109371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
23119371c9d4SSatish Balay         v2++;
231217ab2063SBarry Smith       }
2313064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
231417ab2063SBarry Smith     }
23159566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
2316f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
23179566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
23183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
231917ab2063SBarry Smith }
232017ab2063SBarry Smith 
2321ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2322d71ae5a4SJacob Faibussowitsch {
23233d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
232454f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
23252e5835c6SStefano Zampini   const MatScalar *va, *vb;
232697f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2327cd0d46ebSvictorle 
2328cd0d46ebSvictorle   PetscFunctionBegin;
23299566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23309566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23315485867bSBarry Smith   if (ma != nb || na != mb) {
23325485867bSBarry Smith     *f = PETSC_FALSE;
23333ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23345485867bSBarry Smith   }
23359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
23369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
23379371c9d4SSatish Balay   aii = aij->i;
23389371c9d4SSatish Balay   bii = bij->i;
23399371c9d4SSatish Balay   adx = aij->j;
23409371c9d4SSatish Balay   bdx = bij->j;
23419566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23429566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2343cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2344cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2345cd0d46ebSvictorle 
2346cd0d46ebSvictorle   *f = PETSC_TRUE;
2347cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2348cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
234997f1f81fSBarry Smith       PetscInt    idc, idr;
23505485867bSBarry Smith       PetscScalar vc, vr;
2351cd0d46ebSvictorle       /* column/row index/value */
23525485867bSBarry Smith       idc = adx[aptr[i]];
23535485867bSBarry Smith       idr = bdx[bptr[idc]];
23545485867bSBarry Smith       vc  = va[aptr[i]];
23555485867bSBarry Smith       vr  = vb[bptr[idc]];
23565485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
23575485867bSBarry Smith         *f = PETSC_FALSE;
23585485867bSBarry Smith         goto done;
2359cd0d46ebSvictorle       } else {
23605485867bSBarry Smith         aptr[i]++;
23615485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2362cd0d46ebSvictorle       }
2363cd0d46ebSvictorle     }
2364cd0d46ebSvictorle   }
2365cd0d46ebSvictorle done:
23669566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23679566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
23699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
23703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2371cd0d46ebSvictorle }
2372cd0d46ebSvictorle 
2373ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2374d71ae5a4SJacob Faibussowitsch {
23753d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
237654f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
237754f21887SBarry Smith   MatScalar  *va, *vb;
23781cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23791cbb95d3SBarry Smith 
23801cbb95d3SBarry Smith   PetscFunctionBegin;
23819566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23829566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23831cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23841cbb95d3SBarry Smith     *f = PETSC_FALSE;
23853ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23861cbb95d3SBarry Smith   }
23879371c9d4SSatish Balay   aii = aij->i;
23889371c9d4SSatish Balay   bii = bij->i;
23899371c9d4SSatish Balay   adx = aij->j;
23909371c9d4SSatish Balay   bdx = bij->j;
23919371c9d4SSatish Balay   va  = aij->a;
23929371c9d4SSatish Balay   vb  = bij->a;
23939566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23949566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23951cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23961cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23971cbb95d3SBarry Smith 
23981cbb95d3SBarry Smith   *f = PETSC_TRUE;
23991cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
24001cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
24011cbb95d3SBarry Smith       PetscInt    idc, idr;
24021cbb95d3SBarry Smith       PetscScalar vc, vr;
24031cbb95d3SBarry Smith       /* column/row index/value */
24041cbb95d3SBarry Smith       idc = adx[aptr[i]];
24051cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
24061cbb95d3SBarry Smith       vc  = va[aptr[i]];
24071cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
24081cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
24091cbb95d3SBarry Smith         *f = PETSC_FALSE;
24101cbb95d3SBarry Smith         goto done;
24111cbb95d3SBarry Smith       } else {
24121cbb95d3SBarry Smith         aptr[i]++;
24131cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
24141cbb95d3SBarry Smith       }
24151cbb95d3SBarry Smith     }
24161cbb95d3SBarry Smith   }
24171cbb95d3SBarry Smith done:
24189566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
24199566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
24203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24211cbb95d3SBarry Smith }
24221cbb95d3SBarry Smith 
2423d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2424d71ae5a4SJacob Faibussowitsch {
2425416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2426fff8e43fSBarry Smith   const PetscScalar *l, *r;
2427fff8e43fSBarry Smith   PetscScalar        x;
242854f21887SBarry Smith   MatScalar         *v;
2429fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2430fff8e43fSBarry Smith   const PetscInt    *jj;
243117ab2063SBarry Smith 
24323a40ed3dSBarry Smith   PetscFunctionBegin;
243317ab2063SBarry Smith   if (ll) {
24343ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
24353ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
24369566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
243708401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
24389566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
24399566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
244017ab2063SBarry Smith     for (i = 0; i < m; i++) {
244117ab2063SBarry Smith       x = l[i];
2442416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
24432205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
244417ab2063SBarry Smith     }
24459566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
24469566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
24479566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
244817ab2063SBarry Smith   }
244917ab2063SBarry Smith   if (rr) {
24509566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
245108401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
24529566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
24539566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
24542e5835c6SStefano Zampini     jj = a->j;
24552205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
24569566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
24579566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
24589566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
245917ab2063SBarry Smith   }
24609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
24613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
246217ab2063SBarry Smith }
246317ab2063SBarry Smith 
/*
   MatCreateSubMatrix_SeqAIJ - Extracts from A the submatrix made of the rows listed in isrow and the
   columns listed in iscol.

   Input Parameters:
+  A     - the source matrix
.  isrow - rows to extract
.  iscol - columns to extract
.  csize - not referenced in this routine
-  scall - MAT_REUSE_MATRIX refills the matrix already stored in *B, any other value creates a new matrix of A's type

   Output Parameter:
.  B - the submatrix

   Two code paths are used:
   - iscol is an ISSTRIDE with step 1: the requested columns are the range [first, first + ncols), and every row
     is copied as one contiguous run of entries. NOTE(review): the scan stops at the first column index outside
     the range, so this presumably relies on the column indices of each row of A being sorted - confirm.
   - otherwise: smap[] maps an old column to (new column + 1); the entries of each row are gathered through smap
     and every new row is sorted by column index afterwards.
*/
2464d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2465d71ae5a4SJacob Faibussowitsch {
2466db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2467d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
246897f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
24695d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
24702e5835c6SStefano Zampini   const PetscScalar *aa;
24715d0c19d7SBarry Smith   PetscInt           nrows, ncols;
247297f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
2473fb3c7e2dSJunchao Zhang   MatScalar         *a_new, *mat_a, *c_a;
2474416022c9SBarry Smith   Mat                C;
2475cdc6f3adSToby Isaac   PetscBool          stride;
247617ab2063SBarry Smith 
24773a40ed3dSBarry Smith   PetscFunctionBegin;
24789566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24799566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24809566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
248117ab2063SBarry Smith 
24829566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2483ff718158SBarry Smith   if (stride) {
24849566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2485ff718158SBarry Smith   } else {
2486ff718158SBarry Smith     first = 0;
2487ff718158SBarry Smith     step  = 0;
2488ff718158SBarry Smith   }
2489fee21e36SBarry Smith   if (stride && step == 1) {
249002834360SBarry Smith     /* special case of contiguous columns: iscol is a stride with step 1, i.e. the range [first, first + ncols) */
24919566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
249202834360SBarry Smith     /* loop over new rows determining lens and starting points */
249302834360SBarry Smith     for (i = 0; i < nrows; i++) {
2494bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2495a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2496a91a9bebSLisandro Dalcin       starts[i] = kstart;
      /* find the first entry of the row whose column is >= first; k == kend if there is none */
249702834360SBarry Smith       for (k = kstart; k < kend; k++) {
2498bfeeae90SHong Zhang         if (aj[k] >= first) {
249902834360SBarry Smith           starts[i] = k;
250002834360SBarry Smith           break;
250102834360SBarry Smith         }
250202834360SBarry Smith       }
      /* count the entries from there on, up to the first column that is >= first + ncols */
2503a2744918SBarry Smith       sum = 0;
250402834360SBarry Smith       while (k < kend) {
2505bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2506a2744918SBarry Smith         sum++;
250702834360SBarry Smith       }
2508a2744918SBarry Smith       lens[i] = sum;
250902834360SBarry Smith     }
251002834360SBarry Smith     /* create submatrix */
2511cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
251297f1f81fSBarry Smith       PetscInt n_cols, n_rows;
      /* NOTE(review): only the sizes of *B are checked on this path; the row lengths are not compared with lens[] */
25139566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2514aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
25159566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
251608480c60SBarry Smith       C = *B;
25173a40ed3dSBarry Smith     } else {
25183bef6203SJed Brown       PetscInt rbs, cbs;
25199566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25209566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25219566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25229566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25239566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25249566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25259566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
252608480c60SBarry Smith     }
2527db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2528db02288aSLois Curfman McInnes 
252902834360SBarry Smith     /* loop over rows inserting into submatrix */
2530fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a', since that raw usage ignores offload state of C
2531db02288aSLois Curfman McInnes     j_new = c->j;
2532db02288aSLois Curfman McInnes     i_new = c->i;
25339566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
253402834360SBarry Smith     for (i = 0; i < nrows; i++) {
2535a2744918SBarry Smith       ii    = starts[i];
2536a2744918SBarry Smith       lensi = lens[i];
2537810441c8SPierre Jolivet       if (lensi) {
        /* column indices are shifted so that column 'first' of A becomes column 0 of the submatrix */
2538ad540459SPierre Jolivet         for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
25399566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2540a2744918SBarry Smith         a_new += lensi;
2541810441c8SPierre Jolivet       }
2542a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2543a2744918SBarry Smith       c->ilen[i]   = lensi;
254402834360SBarry Smith     }
2545fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly
25469566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
25479566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
25483a40ed3dSBarry Smith   } else {
    /* general case: arbitrary list of columns */
25499566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
25509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
25519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
    /* smap[old column] = new column + 1; an entry never set here is tested as "column not selected" below */
25524dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
25536bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
25544dcab191SBarry Smith       smap[icol[i]] = i + 1;
25554dcab191SBarry Smith     }
25564dcab191SBarry Smith 
255702834360SBarry Smith     /* determine lens of each row */
255802834360SBarry Smith     for (i = 0; i < nrows; i++) {
2559bfeeae90SHong Zhang       kstart  = ai[irow[i]];
256002834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
256102834360SBarry Smith       lens[i] = 0;
256202834360SBarry Smith       for (k = kstart; k < kend; k++) {
2563ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
256402834360SBarry Smith       }
256502834360SBarry Smith     }
256617ab2063SBarry Smith     /* Create and fill new matrix */
2567a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2568ace3abfcSBarry Smith       PetscBool equal;
25690f5bd95cSBarry Smith 
      /* reuse requires matching sizes and matching per-row lengths; ilen is then reset and rebuilt by the fill loop */
257099141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2571aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
25729566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
2573fdfbdca6SPierre Jolivet       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros");
25749566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
257508480c60SBarry Smith       C = *B;
25763a40ed3dSBarry Smith     } else {
25773bef6203SJed Brown       PetscInt rbs, cbs;
25789566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25799566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25809566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25819566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
258237a5e0faSPierre Jolivet       if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs));
25839566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25849566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
258508480c60SBarry Smith     }
25869566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2587fb3c7e2dSJunchao Zhang 
2588f4f49eeaSPierre Jolivet     c = (Mat_SeqAIJ *)C->data;
2589fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C
259017ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
259199141d43SSatish Balay       row      = irow[i];
2592bfeeae90SHong Zhang       kstart   = ai[row];
259399141d43SSatish Balay       kend     = kstart + a->ilen[row];
2594bfeeae90SHong Zhang       mat_i    = c->i[i];
25958e3a54c0SPierre Jolivet       mat_j    = PetscSafePointerPlusOffset(c->j, mat_i);
25968e3a54c0SPierre Jolivet       mat_a    = PetscSafePointerPlusOffset(c_a, mat_i);
259799141d43SSatish Balay       mat_ilen = c->ilen + i;
      /* append every selected entry of the old row, in the order it is stored in A */
259817ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2599bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2600ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
26012e5835c6SStefano Zampini           *mat_a++ = aa[k];
260299141d43SSatish Balay           (*mat_ilen)++;
260317ab2063SBarry Smith         }
260417ab2063SBarry Smith       }
260517ab2063SBarry Smith     }
26069566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
260702834360SBarry Smith     /* Free work space */
26089566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
26099566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
26109566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2611cdc6f3adSToby Isaac     /* sort each new row by column index; the new column order follows iscol, which need not be increasing */
2612cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2613cdc6f3adSToby Isaac       PetscInt ilen;
2614cdc6f3adSToby Isaac 
2615cdc6f3adSToby Isaac       mat_i = c->i[i];
26168e3a54c0SPierre Jolivet       mat_j = PetscSafePointerPlusOffset(c->j, mat_i);
26178e3a54c0SPierre Jolivet       mat_a = PetscSafePointerPlusOffset(c_a, mat_i);
2618cdc6f3adSToby Isaac       ilen  = c->ilen[i];
26199566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2620cdc6f3adSToby Isaac     }
2621fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a));
262202834360SBarry Smith   }
26238c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
26249566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2625305c6ccfSStefano Zampini #endif
26269566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
26279566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
262817ab2063SBarry Smith 
26299566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2630416022c9SBarry Smith   *B = C;
26313ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
263217ab2063SBarry Smith }
263317ab2063SBarry Smith 
2634ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2635d71ae5a4SJacob Faibussowitsch {
263682d44351SHong Zhang   Mat B;
263782d44351SHong Zhang 
263882d44351SHong Zhang   PetscFunctionBegin;
2639c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
26409566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
26419566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
26429566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
26439566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
26449566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
264582d44351SHong Zhang     *subMat = B;
2646c2d650bdSHong Zhang   } else {
26479566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2648c2d650bdSHong Zhang   }
26493ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
265082d44351SHong Zhang }
265182d44351SHong Zhang 
2652ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2653d71ae5a4SJacob Faibussowitsch {
265463b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
265563b91edcSBarry Smith   Mat         outA;
2656ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
265763b91edcSBarry Smith 
26583a40ed3dSBarry Smith   PetscFunctionBegin;
265908401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
26601df811f5SHong Zhang 
26619566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
26629566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2663a871dcd8SBarry Smith 
266463b91edcSBarry Smith   outA             = inA;
2665d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26669566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
26679566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
26682205254eSKarl Rupp 
26699566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
26709566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
26712205254eSKarl Rupp 
2672c3122656SLisandro Dalcin   a->row = row;
26732205254eSKarl Rupp 
26749566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
26759566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
26762205254eSKarl Rupp 
2677c3122656SLisandro Dalcin   a->col = col;
267863b91edcSBarry Smith 
267936db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26809566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26819566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2682f0ec6fceSSatish Balay 
268394a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
26849566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work));
268594a9d846SBarry Smith   }
268663b91edcSBarry Smith 
26879566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(inA));
2688137fb511SHong Zhang   if (row_identity && col_identity) {
26899566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2690137fb511SHong Zhang   } else {
26919566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2692137fb511SHong Zhang   }
26933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2694a871dcd8SBarry Smith }
2695a871dcd8SBarry Smith 
2696d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2697d71ae5a4SJacob Faibussowitsch {
2698f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2699dfa0f9e5SStefano Zampini   PetscScalar *v;
2700c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
27013a40ed3dSBarry Smith 
27023a40ed3dSBarry Smith   PetscFunctionBegin;
27039566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
27049566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2705792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
27069566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
27079566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
27089566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(inA));
27093ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2710f0b747eeSBarry Smith }
2711f0b747eeSBarry Smith 
2712d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2713d71ae5a4SJacob Faibussowitsch {
271416b64355SHong Zhang   PetscInt i;
271516b64355SHong Zhang 
271616b64355SHong Zhang   PetscFunctionBegin;
271716b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
27189566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
271916b64355SHong Zhang 
272048a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
27219566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
272216b64355SHong Zhang 
272316b64355SHong Zhang     if (submatj->rbuf1) {
27249566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
27259566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
272616b64355SHong Zhang     }
272716b64355SHong Zhang 
272848a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
27299566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
27309566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
273116b64355SHong Zhang   }
273216b64355SHong Zhang 
273316b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2734eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&submatj->rmap));
27359566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
27369566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
273716b64355SHong Zhang #else
27389566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
273916b64355SHong Zhang #endif
274016b64355SHong Zhang 
274116b64355SHong Zhang   if (!submatj->allcolumns) {
274216b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2743835f2295SStefano Zampini     PetscCall(PetscHMapIDestroy(&submatj->cmap));
274416b64355SHong Zhang #else
27459566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
274616b64355SHong Zhang #endif
274716b64355SHong Zhang   }
27489566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
274916b64355SHong Zhang 
27509566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
27513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
275216b64355SHong Zhang }
275316b64355SHong Zhang 
2754d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2755d71ae5a4SJacob Faibussowitsch {
275616b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
27575c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
275816b64355SHong Zhang 
275916b64355SHong Zhang   PetscFunctionBegin;
27609566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
27619566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
27623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
276316b64355SHong Zhang }
276416b64355SHong Zhang 
276589a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
2766ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2767d71ae5a4SJacob Faibussowitsch {
27682d033e1fSHong Zhang   PetscInt     i;
27690fb991dcSHong Zhang   Mat          C;
27700fb991dcSHong Zhang   Mat_SeqAIJ  *c;
27710fb991dcSHong Zhang   Mat_SubSppt *submatj;
27722d033e1fSHong Zhang 
27732d033e1fSHong Zhang   PetscFunctionBegin;
27742d033e1fSHong Zhang   for (i = 0; i < n; i++) {
27750fb991dcSHong Zhang     C       = (*mat)[i];
27760fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
27770fb991dcSHong Zhang     submatj = c->submatis1;
27782d033e1fSHong Zhang     if (submatj) {
2779682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
278026cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27819566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27829566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27839566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27843faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27859566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27869566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27879566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2788682e4c99SStefano Zampini       }
27892d033e1fSHong Zhang     } else {
27909566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
27912d033e1fSHong Zhang     }
27922d033e1fSHong Zhang   }
279386e85357SHong Zhang 
279463a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
27959566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
279663a75b2aSHong Zhang 
27979566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
27983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
27992d033e1fSHong Zhang }
28002d033e1fSHong Zhang 
2801ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2802d71ae5a4SJacob Faibussowitsch {
280397f1f81fSBarry Smith   PetscInt i;
2804cddf8d76SBarry Smith 
28053a40ed3dSBarry Smith   PetscFunctionBegin;
280648a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2807cddf8d76SBarry Smith 
280848a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
28093ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2810cddf8d76SBarry Smith }
2811cddf8d76SBarry Smith 
2812ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2813d71ae5a4SJacob Faibussowitsch {
2814e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28159a88ca10SBarry Smith   PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
28165d0c19d7SBarry Smith   const PetscInt *idx;
281758b7e2c1SStefano Zampini   PetscInt        start, end, *ai, *aj, bs = A->rmap->bs == A->cmap->bs ? A->rmap->bs : 1;
2818f1af5d2fSBarry Smith   PetscBT         table;
2819bbd702dbSSatish Balay 
28203a40ed3dSBarry Smith   PetscFunctionBegin;
28219a88ca10SBarry Smith   m  = A->rmap->n / bs;
2822e4d965acSSatish Balay   ai = a->i;
2823bfeeae90SHong Zhang   aj = a->j;
28248a047759SSatish Balay 
282508401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
282606763907SSatish Balay 
28279566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
28289566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
282906763907SSatish Balay 
2830e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2831b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2832e4d965acSSatish Balay     isz = 0;
28339566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2834e4d965acSSatish Balay 
2835e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28369566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
28379566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2838e4d965acSSatish Balay 
28399a88ca10SBarry Smith     if (bs > 1) {
28409a88ca10SBarry Smith       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
28419a88ca10SBarry Smith       for (j = 0; j < n; ++j) {
28429a88ca10SBarry Smith         if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
28439a88ca10SBarry Smith       }
28449a88ca10SBarry Smith       PetscCall(ISRestoreIndices(is[i], &idx));
28459a88ca10SBarry Smith       PetscCall(ISDestroy(&is[i]));
28469a88ca10SBarry Smith 
28479a88ca10SBarry Smith       k = 0;
28489a88ca10SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
28499a88ca10SBarry Smith         n = isz;
28509a88ca10SBarry Smith         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
28519a88ca10SBarry Smith           for (ll = 0; ll < bs; ll++) {
28529a88ca10SBarry Smith             row   = bs * nidx[k] + ll;
28539a88ca10SBarry Smith             start = ai[row];
28549a88ca10SBarry Smith             end   = ai[row + 1];
28559a88ca10SBarry Smith             for (l = start; l < end; l++) {
28569a88ca10SBarry Smith               val = aj[l] / bs;
28579a88ca10SBarry Smith               if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
28589a88ca10SBarry Smith             }
28599a88ca10SBarry Smith           }
28609a88ca10SBarry Smith         }
28619a88ca10SBarry Smith       }
286257508eceSPierre Jolivet       PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i));
28639a88ca10SBarry Smith     } else {
2864dd097bc3SLois Curfman McInnes       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2865e4d965acSSatish Balay       for (j = 0; j < n; ++j) {
28662205254eSKarl Rupp         if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
28674dcbc457SBarry Smith       }
28689566063dSJacob Faibussowitsch       PetscCall(ISRestoreIndices(is[i], &idx));
28699566063dSJacob Faibussowitsch       PetscCall(ISDestroy(&is[i]));
2870e4d965acSSatish Balay 
287104a348a9SBarry Smith       k = 0;
287204a348a9SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
287304a348a9SBarry Smith         n = isz;
287406763907SSatish Balay         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2875e4d965acSSatish Balay           row   = nidx[k];
2876e4d965acSSatish Balay           start = ai[row];
2877e4d965acSSatish Balay           end   = ai[row + 1];
287804a348a9SBarry Smith           for (l = start; l < end; l++) {
2879efb16452SHong Zhang             val = aj[l];
28802205254eSKarl Rupp             if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2881e4d965acSSatish Balay           }
2882e4d965acSSatish Balay         }
2883e4d965acSSatish Balay       }
288457508eceSPierre Jolivet       PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i));
2885e4d965acSSatish Balay     }
28869a88ca10SBarry Smith   }
28879566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
28889566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
28893ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28904dcbc457SBarry Smith }
289117ab2063SBarry Smith 
2892ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2893d71ae5a4SJacob Faibussowitsch {
28940513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28953b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
28965d0c19d7SBarry Smith   const PetscInt *row, *col;
28975d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
289856cd22aeSBarry Smith   IS              icolp, irowp;
28990298fd71SBarry Smith   PetscInt       *cwork = NULL;
29000298fd71SBarry Smith   PetscScalar    *vwork = NULL;
29010513a670SBarry Smith 
29023a40ed3dSBarry Smith   PetscFunctionBegin;
29039566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
29049566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
29059566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
29069566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
29070513a670SBarry Smith 
29080513a670SBarry Smith   /* determine lengths of permuted rows */
29099566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
29102205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
29119566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
29129566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
29139566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
29149566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
29159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
29169566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
29170513a670SBarry Smith 
29189566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
29190513a670SBarry Smith   for (i = 0; i < m; i++) {
29209566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29212205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
29229566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
29239566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29240513a670SBarry Smith   }
29259566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
29262205254eSKarl Rupp 
29273c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
29282205254eSKarl Rupp 
29298c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
29309566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
29319fe5e383SStefano Zampini #endif
29329566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
29339566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
29349566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
29359566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
29369566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
29379566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
293848a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
29393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29400513a670SBarry Smith }
29410513a670SBarry Smith 
2942d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2943d71ae5a4SJacob Faibussowitsch {
2944cb5b572fSBarry Smith   PetscFunctionBegin;
294533f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
294633f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2947be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2948be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
29492e5835c6SStefano Zampini     const PetscScalar *aa;
29503ac85a22SJunchao Zhang     PetscScalar       *bb;
2951be6bf707SBarry Smith 
29529566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
29533ac85a22SJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(B, &bb));
29543ac85a22SJunchao Zhang 
295508401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
29563ac85a22SJunchao Zhang     PetscCall(PetscArraycpy(bb, aa, a->i[A->rmap->n]));
29579566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
29589566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
29593ac85a22SJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(B, &bb));
2960cb5b572fSBarry Smith   } else {
29619566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2962cb5b572fSBarry Smith   }
29633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2964cb5b572fSBarry Smith }
2965cb5b572fSBarry Smith 
2966d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2967d71ae5a4SJacob Faibussowitsch {
29686c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
29696e111a19SKarl Rupp 
29706c0721eeSBarry Smith   PetscFunctionBegin;
29716c0721eeSBarry Smith   *array = a->a;
29723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29736c0721eeSBarry Smith }
29746c0721eeSBarry Smith 
2975d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2976d71ae5a4SJacob Faibussowitsch {
29776c0721eeSBarry Smith   PetscFunctionBegin;
2978f38c1e66SStefano Zampini   *array = NULL;
29793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29806c0721eeSBarry Smith }
2981273d9f13SBarry Smith 
29828229c054SShri Abhyankar /*
29838229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29848229c054SShri Abhyankar    have different nonzero structure.
29858229c054SShri Abhyankar */
2986d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2987d71ae5a4SJacob Faibussowitsch {
2988b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2989ec7775f6SShri Abhyankar 
2990ec7775f6SShri Abhyankar   PetscFunctionBegin;
2991ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2992ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
29938e3a54c0SPierre Jolivet     const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]);
2994b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
2995b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
29968af7cee1SJed Brown     nnz[i] = 0;
29978af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
2998b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
2999b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
30008af7cee1SJed Brown       nnz[i]++;
30018af7cee1SJed Brown     }
30028af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
3003ec7775f6SShri Abhyankar   }
30043ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3005ec7775f6SShri Abhyankar }
3006ec7775f6SShri Abhyankar 
3007d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
3008d71ae5a4SJacob Faibussowitsch {
3009b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
3010b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
3011b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
3012b264fe52SHong Zhang 
3013b264fe52SHong Zhang   PetscFunctionBegin;
3014b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
30159566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
30163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3017b264fe52SHong Zhang }
3018b264fe52SHong Zhang 
3019d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
3020d71ae5a4SJacob Faibussowitsch {
3021ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
3022ac90fabeSBarry Smith 
3023ac90fabeSBarry Smith   PetscFunctionBegin;
3024134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
3025134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
3026134adf20SPierre Jolivet     if (e) {
30279566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
302881fa06acSBarry Smith       if (e) {
30299566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
3030134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
303181fa06acSBarry Smith       }
303281fa06acSBarry Smith     }
303354c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
303481fa06acSBarry Smith   }
3035ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
30362e5835c6SStefano Zampini     const PetscScalar *xa;
30372e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
303881fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
303981fa06acSBarry Smith 
30409566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
30419566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
30429566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
3043792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
30449566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
30459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
30469566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
30479566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
30489566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
3049ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
30509566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
3051ac90fabeSBarry Smith   } else {
30528229c054SShri Abhyankar     Mat       B;
30538229c054SShri Abhyankar     PetscInt *nnz;
30549566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
30559566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
30569566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
30579566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
30589566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
30599566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
30609566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
30619566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
30629566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
30639bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
30649566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
3065ac90fabeSBarry Smith   }
30663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3067ac90fabeSBarry Smith }
3068ac90fabeSBarry Smith 
3069d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
3070d71ae5a4SJacob Faibussowitsch {
3071354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3072354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
3073354c94deSBarry Smith   PetscInt     i, nz;
3074354c94deSBarry Smith   PetscScalar *a;
3075354c94deSBarry Smith 
3076354c94deSBarry Smith   PetscFunctionBegin;
3077354c94deSBarry Smith   nz = aij->nz;
30789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
30792205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
30809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
3081354c94deSBarry Smith #else
3082354c94deSBarry Smith   PetscFunctionBegin;
3083354c94deSBarry Smith #endif
30843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3085354c94deSBarry Smith }
3086354c94deSBarry Smith 
3087ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3088d71ae5a4SJacob Faibussowitsch {
3089e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3090d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3091e34fafa9SBarry Smith   PetscReal        atmp;
3092985db425SBarry Smith   PetscScalar     *x;
3093ce496241SStefano Zampini   const MatScalar *aa, *av;
3094e34fafa9SBarry Smith 
3095e34fafa9SBarry Smith   PetscFunctionBegin;
309628b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
30979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3098ce496241SStefano Zampini   aa = av;
3099e34fafa9SBarry Smith   ai = a->i;
3100e34fafa9SBarry Smith   aj = a->j;
3101e34fafa9SBarry Smith 
31029566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31039566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
310408401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3105e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
31069371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31079371c9d4SSatish Balay     ai++;
310862e5df07SMark Adams     x[i] = 0;
3109e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3110985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
31119371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
31129371c9d4SSatish Balay         x[i] = atmp;
31139371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31149371c9d4SSatish Balay       }
31159371c9d4SSatish Balay       aa++;
31169371c9d4SSatish Balay       aj++;
3117985db425SBarry Smith     }
3118985db425SBarry Smith   }
31199566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3122985db425SBarry Smith }
3123985db425SBarry Smith 
3124eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v)
3125eede4a3fSMark Adams {
3126eede4a3fSMark Adams   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3127eede4a3fSMark Adams   PetscInt         i, j, m = A->rmap->n, *ai, ncols, n;
3128eede4a3fSMark Adams   PetscScalar     *x;
3129eede4a3fSMark Adams   const MatScalar *aa, *av;
3130eede4a3fSMark Adams 
3131eede4a3fSMark Adams   PetscFunctionBegin;
3132eede4a3fSMark Adams   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3133eede4a3fSMark Adams   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3134eede4a3fSMark Adams   aa = av;
3135eede4a3fSMark Adams   ai = a->i;
3136eede4a3fSMark Adams 
3137eede4a3fSMark Adams   PetscCall(VecGetArrayWrite(v, &x));
3138eede4a3fSMark Adams   PetscCall(VecGetLocalSize(v, &n));
3139eede4a3fSMark Adams   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3140eede4a3fSMark Adams   for (i = 0; i < m; i++) {
3141eede4a3fSMark Adams     ncols = ai[1] - ai[0];
3142eede4a3fSMark Adams     ai++;
314362e5df07SMark Adams     x[i] = 0;
3144eede4a3fSMark Adams     for (j = 0; j < ncols; j++) {
3145eede4a3fSMark Adams       x[i] += PetscAbsScalar(*aa);
3146eede4a3fSMark Adams       aa++;
3147eede4a3fSMark Adams     }
3148eede4a3fSMark Adams   }
3149eede4a3fSMark Adams   PetscCall(VecRestoreArrayWrite(v, &x));
3150eede4a3fSMark Adams   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3151eede4a3fSMark Adams   PetscFunctionReturn(PETSC_SUCCESS);
3152eede4a3fSMark Adams }
3153eede4a3fSMark Adams 
3154ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3155d71ae5a4SJacob Faibussowitsch {
3156985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3157d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3158985db425SBarry Smith   PetscScalar     *x;
3159ce496241SStefano Zampini   const MatScalar *aa, *av;
3160985db425SBarry Smith 
3161985db425SBarry Smith   PetscFunctionBegin;
316228b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3164ce496241SStefano Zampini   aa = av;
3165985db425SBarry Smith   ai = a->i;
3166985db425SBarry Smith   aj = a->j;
3167985db425SBarry Smith 
31689566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31699566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
317008401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3171985db425SBarry Smith   for (i = 0; i < m; i++) {
31729371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31739371c9d4SSatish Balay     ai++;
3174d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31759371c9d4SSatish Balay       x[i] = *aa;
31769371c9d4SSatish Balay       if (idx) idx[i] = 0;
3177985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3178985db425SBarry Smith       x[i] = 0.0;
3179985db425SBarry Smith       if (idx) {
3180985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3181985db425SBarry Smith           if (aj[j] > j) {
3182985db425SBarry Smith             idx[i] = j;
3183985db425SBarry Smith             break;
3184985db425SBarry Smith           }
3185985db425SBarry Smith         }
31861a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31871a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3188985db425SBarry Smith       }
3189985db425SBarry Smith     }
3190985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31919371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31929371c9d4SSatish Balay         x[i] = *aa;
31939371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31949371c9d4SSatish Balay       }
31959371c9d4SSatish Balay       aa++;
31969371c9d4SSatish Balay       aj++;
3197985db425SBarry Smith     }
3198985db425SBarry Smith   }
31999566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3202985db425SBarry Smith }
3203985db425SBarry Smith 
3204ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3205d71ae5a4SJacob Faibussowitsch {
3206c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3207c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3208ce496241SStefano Zampini   PetscScalar     *x;
3209ce496241SStefano Zampini   const MatScalar *aa, *av;
3210c87e5d42SMatthew Knepley 
3211c87e5d42SMatthew Knepley   PetscFunctionBegin;
32129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3213ce496241SStefano Zampini   aa = av;
3214c87e5d42SMatthew Knepley   ai = a->i;
3215c87e5d42SMatthew Knepley   aj = a->j;
3216c87e5d42SMatthew Knepley 
32179566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32189566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
321908401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3220c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
32219371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32229371c9d4SSatish Balay     ai++;
3223f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
32249371c9d4SSatish Balay       x[i] = *aa;
32259371c9d4SSatish Balay       if (idx) idx[i] = 0;
3226f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3227f07e67edSHong Zhang       x[i] = 0.0;
3228f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3229289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3230f07e67edSHong Zhang           if (aj[j] > j) {
3231f07e67edSHong Zhang             idx[i] = j;
32322205254eSKarl Rupp             break;
32332205254eSKarl Rupp           }
3234289a08f5SMatthew Knepley         }
3235f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3236f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3237f07e67edSHong Zhang       }
3238289a08f5SMatthew Knepley     }
3239c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
32409371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
32419371c9d4SSatish Balay         x[i] = *aa;
32429371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32439371c9d4SSatish Balay       }
32449371c9d4SSatish Balay       aa++;
32459371c9d4SSatish Balay       aj++;
3246c87e5d42SMatthew Knepley     }
3247c87e5d42SMatthew Knepley   }
32489566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3251c87e5d42SMatthew Knepley }
3252c87e5d42SMatthew Knepley 
3253ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3254d71ae5a4SJacob Faibussowitsch {
3255985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3256d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3257d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3258985db425SBarry Smith   PetscScalar     *x;
3259ce496241SStefano Zampini   const MatScalar *aa, *av;
3260985db425SBarry Smith 
3261985db425SBarry Smith   PetscFunctionBegin;
326228b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
32639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3264ce496241SStefano Zampini   aa = av;
3265985db425SBarry Smith   ai = a->i;
3266985db425SBarry Smith   aj = a->j;
3267985db425SBarry Smith 
32689566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32699566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
327008401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3271985db425SBarry Smith   for (i = 0; i < m; i++) {
32729371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32739371c9d4SSatish Balay     ai++;
3274d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
32759371c9d4SSatish Balay       x[i] = *aa;
32769371c9d4SSatish Balay       if (idx) idx[i] = 0;
3277985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3278985db425SBarry Smith       x[i] = 0.0;
3279985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3280985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3281985db425SBarry Smith           if (aj[j] > j) {
3282985db425SBarry Smith             idx[i] = j;
3283985db425SBarry Smith             break;
3284985db425SBarry Smith           }
3285985db425SBarry Smith         }
3286fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3287fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3288985db425SBarry Smith       }
3289985db425SBarry Smith     }
3290985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32919371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32929371c9d4SSatish Balay         x[i] = *aa;
32939371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32949371c9d4SSatish Balay       }
32959371c9d4SSatish Balay       aa++;
32969371c9d4SSatish Balay       aj++;
3297e34fafa9SBarry Smith     }
3298e34fafa9SBarry Smith   }
32999566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
33009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
33013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3302e34fafa9SBarry Smith }
3303bbead8a2SBarry Smith 
3304ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3305d71ae5a4SJacob Faibussowitsch {
3306bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
330758b7e2c1SStefano Zampini   PetscInt        i, bs = A->rmap->bs, mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3308bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
33090da83c2eSBarry Smith   const PetscReal shift = 0.0;
33101a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3311bbead8a2SBarry Smith 
3312bbead8a2SBarry Smith   PetscFunctionBegin;
3313a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
33144a0d0026SBarry Smith   if (a->ibdiagvalid) {
33154a0d0026SBarry Smith     if (values) *values = a->ibdiag;
33163ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
33174a0d0026SBarry Smith   }
33189566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
33194dfa11a4SJacob Faibussowitsch   if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); }
3320bbead8a2SBarry Smith   diag = a->ibdiag;
3321bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3322bbead8a2SBarry Smith   /* factor and invert each block */
3323bbead8a2SBarry Smith   switch (bs) {
3324bbead8a2SBarry Smith   case 1:
3325bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33269566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3327ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3328ec1892c8SHong Zhang         if (allowzeropivot) {
33297b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33307b6c816cSBarry Smith           A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
33317b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
33329566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
333398921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
3334ec1892c8SHong Zhang       }
3335bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3336bbead8a2SBarry Smith     }
3337bbead8a2SBarry Smith     break;
3338bbead8a2SBarry Smith   case 2:
3339bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33409371c9d4SSatish Balay       ij[0] = 2 * i;
33419371c9d4SSatish Balay       ij[1] = 2 * i + 1;
33429566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
33439566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
33447b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33459566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3346bbead8a2SBarry Smith       diag += 4;
3347bbead8a2SBarry Smith     }
3348bbead8a2SBarry Smith     break;
3349bbead8a2SBarry Smith   case 3:
3350bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33519371c9d4SSatish Balay       ij[0] = 3 * i;
33529371c9d4SSatish Balay       ij[1] = 3 * i + 1;
33539371c9d4SSatish Balay       ij[2] = 3 * i + 2;
33549566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
33559566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
33567b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33579566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3358bbead8a2SBarry Smith       diag += 9;
3359bbead8a2SBarry Smith     }
3360bbead8a2SBarry Smith     break;
3361bbead8a2SBarry Smith   case 4:
3362bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33639371c9d4SSatish Balay       ij[0] = 4 * i;
33649371c9d4SSatish Balay       ij[1] = 4 * i + 1;
33659371c9d4SSatish Balay       ij[2] = 4 * i + 2;
33669371c9d4SSatish Balay       ij[3] = 4 * i + 3;
33679566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
33689566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
33697b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33709566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3371bbead8a2SBarry Smith       diag += 16;
3372bbead8a2SBarry Smith     }
3373bbead8a2SBarry Smith     break;
3374bbead8a2SBarry Smith   case 5:
3375bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33769371c9d4SSatish Balay       ij[0] = 5 * i;
33779371c9d4SSatish Balay       ij[1] = 5 * i + 1;
33789371c9d4SSatish Balay       ij[2] = 5 * i + 2;
33799371c9d4SSatish Balay       ij[3] = 5 * i + 3;
33809371c9d4SSatish Balay       ij[4] = 5 * i + 4;
33819566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
33829566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
33837b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33849566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3385bbead8a2SBarry Smith       diag += 25;
3386bbead8a2SBarry Smith     }
3387bbead8a2SBarry Smith     break;
3388bbead8a2SBarry Smith   case 6:
3389bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33909371c9d4SSatish Balay       ij[0] = 6 * i;
33919371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33929371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33939371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33949371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33959371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33969566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33979566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33987b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33999566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3400bbead8a2SBarry Smith       diag += 36;
3401bbead8a2SBarry Smith     }
3402bbead8a2SBarry Smith     break;
3403bbead8a2SBarry Smith   case 7:
3404bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
34059371c9d4SSatish Balay       ij[0] = 7 * i;
34069371c9d4SSatish Balay       ij[1] = 7 * i + 1;
34079371c9d4SSatish Balay       ij[2] = 7 * i + 2;
34089371c9d4SSatish Balay       ij[3] = 7 * i + 3;
34099371c9d4SSatish Balay       ij[4] = 7 * i + 4;
34109371c9d4SSatish Balay       ij[5] = 7 * i + 5;
3411cdd8bf47SJunchao Zhang       ij[6] = 7 * i + 6;
34129566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
34139566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
34147b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34159566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3416bbead8a2SBarry Smith       diag += 49;
3417bbead8a2SBarry Smith     }
3418bbead8a2SBarry Smith     break;
3419bbead8a2SBarry Smith   default:
34209566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3421bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3422ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
34239566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
34249566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
34257b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34269566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3427bbead8a2SBarry Smith       diag += bs2;
3428bbead8a2SBarry Smith     }
34299566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3430bbead8a2SBarry Smith   }
3431bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
34323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3433bbead8a2SBarry Smith }
3434bbead8a2SBarry Smith 
3435d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3436d71ae5a4SJacob Faibussowitsch {
343773a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3438fff043a9SJunchao Zhang   PetscScalar a, *aa;
343973a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
344073a71a0fSBarry Smith 
344173a71a0fSBarry Smith   PetscFunctionBegin;
344273a71a0fSBarry Smith   if (!x->assembled) {
34439566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
344473a71a0fSBarry Smith     for (i = 0; i < m; i++) {
344573a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
34469566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
344773a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
34489566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
344973a71a0fSBarry Smith       }
345073a71a0fSBarry Smith     }
3451e2ce353bSJunchao Zhang   } else {
34529566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
34539566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
34549566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3455e2ce353bSJunchao Zhang   }
34569566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34579566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34583ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
345973a71a0fSBarry Smith }
346073a71a0fSBarry Smith 
3461679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3462d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3463d71ae5a4SJacob Faibussowitsch {
3464679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3465679944adSJunchao Zhang   PetscScalar a;
3466679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3467679944adSJunchao Zhang 
3468679944adSJunchao Zhang   PetscFunctionBegin;
3469679944adSJunchao Zhang   nskip = high - low;
34709566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3471679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3472679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3473679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
34749566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3475679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3476679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
34779566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3478679944adSJunchao Zhang     }
3479e2ce353bSJunchao Zhang   }
34809566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34819566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3483679944adSJunchao Zhang }
3484679944adSJunchao Zhang 
34850a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3486cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3487cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3488cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
348997304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34907c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34917c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3492f4259b30SLisandro Dalcin                                        NULL,
3493f4259b30SLisandro Dalcin                                        NULL,
3494f4259b30SLisandro Dalcin                                        NULL,
3495f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3496cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3497f4259b30SLisandro Dalcin                                        NULL,
349841f059aeSBarry Smith                                        MatSOR_SeqAIJ,
349991e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
350097304618SKris Buschelman                                        /*1 5*/ MatGetInfo_SeqAIJ,
3501cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3502cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3503cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3504cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3505f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3506cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3507cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3508cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3509d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3510f4259b30SLisandro Dalcin                                        NULL,
3511f4259b30SLisandro Dalcin                                        NULL,
3512f4259b30SLisandro Dalcin                                        NULL,
3513f4259b30SLisandro Dalcin                                        NULL,
351426cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
3515f4259b30SLisandro Dalcin                                        NULL,
3516f4259b30SLisandro Dalcin                                        NULL,
3517f4259b30SLisandro Dalcin                                        NULL,
3518f4259b30SLisandro Dalcin                                        NULL,
3519d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3520f4259b30SLisandro Dalcin                                        NULL,
3521f4259b30SLisandro Dalcin                                        NULL,
3522cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3523f4259b30SLisandro Dalcin                                        NULL,
3524d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
35257dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3526cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3527cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3528cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3529d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3530cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
35317d68702bSBarry Smith                                        MatShift_SeqAIJ,
353279299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
35336e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
353473a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
35353b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
35363b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
35373b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3538a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
353993dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3540f4259b30SLisandro Dalcin                                        NULL,
3541f4259b30SLisandro Dalcin                                        NULL,
3542cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3543f4259b30SLisandro Dalcin                                        NULL,
3544f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3545b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3546b9b97703SBarry Smith                                        MatView_SeqAIJ,
3547f4259b30SLisandro Dalcin                                        NULL,
3548f4259b30SLisandro Dalcin                                        NULL,
3549f4259b30SLisandro Dalcin                                        /* 64*/ NULL,
3550321b30b9SSatish Balay                                        MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3551f4259b30SLisandro Dalcin                                        NULL,
3552f4259b30SLisandro Dalcin                                        NULL,
3553f4259b30SLisandro Dalcin                                        NULL,
3554d519adbfSMatthew Knepley                                        /* 69*/ MatGetRowMaxAbs_SeqAIJ,
3555c87e5d42SMatthew Knepley                                        MatGetRowMinAbs_SeqAIJ,
3556f4259b30SLisandro Dalcin                                        NULL,
3557f4259b30SLisandro Dalcin                                        NULL,
3558f4259b30SLisandro Dalcin                                        NULL,
3559f4259b30SLisandro Dalcin                                        /* 74*/ NULL,
35603acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3561f4259b30SLisandro Dalcin                                        NULL,
3562f4259b30SLisandro Dalcin                                        NULL,
3563f4259b30SLisandro Dalcin                                        NULL,
35646ce1633cSBarry Smith                                        /* 79*/ MatFindZeroDiagonals_SeqAIJ,
3565f4259b30SLisandro Dalcin                                        NULL,
3566f4259b30SLisandro Dalcin                                        NULL,
3567f4259b30SLisandro Dalcin                                        NULL,
3568bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
35696cff0a6bSPierre Jolivet                                        /* 84*/ NULL,
35706cff0a6bSPierre Jolivet                                        NULL,
3571f4259b30SLisandro Dalcin                                        NULL,
3572f4259b30SLisandro Dalcin                                        NULL,
3573f4259b30SLisandro Dalcin                                        NULL,
3574f4259b30SLisandro Dalcin                                        /* 89*/ NULL,
3575f4259b30SLisandro Dalcin                                        NULL,
357626be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
3577f4259b30SLisandro Dalcin                                        NULL,
3578f4259b30SLisandro Dalcin                                        NULL,
35798fa4b5a6SHong Zhang                                        /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3580f4259b30SLisandro Dalcin                                        NULL,
3581f4259b30SLisandro Dalcin                                        NULL,
35826fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
3583f4259b30SLisandro Dalcin                                        NULL,
35844222ddf1SHong Zhang                                        /* 99*/ MatProductSetFromOptions_SeqAIJ,
3585f4259b30SLisandro Dalcin                                        NULL,
3586f4259b30SLisandro Dalcin                                        NULL,
358787d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
3588f4259b30SLisandro Dalcin                                        NULL,
3589d519adbfSMatthew Knepley                                        /*104*/ MatSetValuesRow_SeqAIJ,
359099cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3591f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3592f4259b30SLisandro Dalcin                                        NULL,
3593f4259b30SLisandro Dalcin                                        NULL,
3594cbd44569SHong Zhang                                        /*109*/ MatMatSolve_SeqAIJ,
3595f4259b30SLisandro Dalcin                                        NULL,
35962af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3597f4259b30SLisandro Dalcin                                        NULL,
3598599ef60dSHong Zhang                                        MatMissingDiagonal_SeqAIJ,
3599f4259b30SLisandro Dalcin                                        /*114*/ NULL,
3600f4259b30SLisandro Dalcin                                        NULL,
3601f4259b30SLisandro Dalcin                                        NULL,
3602f4259b30SLisandro Dalcin                                        NULL,
3603f4259b30SLisandro Dalcin                                        NULL,
3604f4259b30SLisandro Dalcin                                        /*119*/ NULL,
3605f4259b30SLisandro Dalcin                                        NULL,
3606f4259b30SLisandro Dalcin                                        NULL,
3607f4259b30SLisandro Dalcin                                        NULL,
3608b3a44c85SBarry Smith                                        MatGetMultiProcBlock_SeqAIJ,
36090716a85fSBarry Smith                                        /*124*/ MatFindNonzeroRows_SeqAIJ,
3610a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
361137868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
36120da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
3613f4259b30SLisandro Dalcin                                        NULL,
3614f4259b30SLisandro Dalcin                                        /*129*/ NULL,
3615f4259b30SLisandro Dalcin                                        NULL,
3616f4259b30SLisandro Dalcin                                        NULL,
361775648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3618b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
3619b9af6bddSHong Zhang                                        /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
36202b8ad9a3SHong Zhang                                        MatTransColoringApplyDenToSp_SeqAIJ,
3621f4259b30SLisandro Dalcin                                        NULL,
3622f4259b30SLisandro Dalcin                                        NULL,
36233964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
3624f4259b30SLisandro Dalcin                                        /*139*/ NULL,
3625f4259b30SLisandro Dalcin                                        NULL,
3626f4259b30SLisandro Dalcin                                        NULL,
36273a062f41SBarry Smith                                        MatFDColoringSetUp_SeqXAIJ,
36289c8f2541SHong Zhang                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
36294222ddf1SHong Zhang                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
36304222ddf1SHong Zhang                                        /*145*/ MatDestroySubMatrices_SeqAIJ,
3631f4259b30SLisandro Dalcin                                        NULL,
363272833a62Smarkadams4                                        NULL,
363372833a62Smarkadams4                                        MatCreateGraph_Simple_AIJ,
36342d776b49SBarry Smith                                        NULL,
3635dec0b466SHong Zhang                                        /*150*/ MatTransposeSymbolic_SeqAIJ,
3636eede4a3fSMark Adams                                        MatEliminateZeros_SeqAIJ,
36374cc2b5b5SPierre Jolivet                                        MatGetRowSumAbs_SeqAIJ,
363842ce410bSJunchao Zhang                                        NULL,
363942ce410bSJunchao Zhang                                        NULL,
3640fe1fc275SAlexander                                        /*155*/ NULL,
3641fe1fc275SAlexander                                        MatCopyHashToXAIJ_Seq_Hash};
364217ab2063SBarry Smith 
3643ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3644d71ae5a4SJacob Faibussowitsch {
3645bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
364697f1f81fSBarry Smith   PetscInt    i, nz, n;
3647bef8e0ddSBarry Smith 
3648bef8e0ddSBarry Smith   PetscFunctionBegin;
3649bef8e0ddSBarry Smith   nz = aij->maxnz;
3650d0f46423SBarry Smith   n  = mat->rmap->n;
3651ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3652bef8e0ddSBarry Smith   aij->nz = nz;
3653ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
36543ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3655bef8e0ddSBarry Smith }
3656bef8e0ddSBarry Smith 
3657a3bb6f32SFande Kong /*
3658ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3659ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3660ddea5d60SJunchao Zhang  */
3661d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3662d71ae5a4SJacob Faibussowitsch {
3663a3bb6f32SFande Kong   Mat_SeqAIJ   *aij = (Mat_SeqAIJ *)mat->data;
3664eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1;
3665eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
366625b670f0SStefano Zampini   PetscInt      gid, lid, i, ec, nz = aij->nz;
366725b670f0SStefano Zampini   PetscInt     *garray, *jj = aij->j;
3668a3bb6f32SFande Kong 
3669a3bb6f32SFande Kong   PetscFunctionBegin;
3670a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
36714f572ea9SToby Isaac   PetscAssertPointer(mapping, 2);
3672a3bb6f32SFande Kong   /* use a table */
3673eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1));
3674a3bb6f32SFande Kong   ec = 0;
367525b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
367625b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
3677eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
3678a3bb6f32SFande Kong     if (!data) {
3679a3bb6f32SFande Kong       /* one based table */
3680c76ffc5fSJacob Faibussowitsch       PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec));
3681a3bb6f32SFande Kong     }
3682a3bb6f32SFande Kong   }
3683a3bb6f32SFande Kong   /* form array of columns we need */
36849566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
3685eec179cfSJacob Faibussowitsch   PetscHashIterBegin(gid1_lid1, tpos);
3686eec179cfSJacob Faibussowitsch   while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
3687eec179cfSJacob Faibussowitsch     PetscHashIterGetKey(gid1_lid1, tpos, gid);
3688eec179cfSJacob Faibussowitsch     PetscHashIterGetVal(gid1_lid1, tpos, lid);
3689eec179cfSJacob Faibussowitsch     PetscHashIterNext(gid1_lid1, tpos);
3690a3bb6f32SFande Kong     gid--;
3691a3bb6f32SFande Kong     lid--;
3692a3bb6f32SFande Kong     garray[lid] = gid;
3693a3bb6f32SFande Kong   }
36949566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
3695eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIClear(gid1_lid1));
3696c76ffc5fSJacob Faibussowitsch   for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1));
3697a3bb6f32SFande Kong   /* compact out the extra columns in B */
369825b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
369925b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
3700eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
3701a3bb6f32SFande Kong     lid--;
370225b670f0SStefano Zampini     jj[i] = lid;
3703a3bb6f32SFande Kong   }
37049566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
3705eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&gid1_lid1));
37069566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
37079566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
37089566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
37093ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3710a3bb6f32SFande Kong }
3711a3bb6f32SFande Kong 
3712bef8e0ddSBarry Smith /*@
3713bef8e0ddSBarry Smith   MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3714bef8e0ddSBarry Smith   in the matrix.
3715bef8e0ddSBarry Smith 
3716bef8e0ddSBarry Smith   Input Parameters:
371711a5261eSBarry Smith + mat     - the `MATSEQAIJ` matrix
3718bef8e0ddSBarry Smith - indices - the column indices
3719bef8e0ddSBarry Smith 
372015091d37SBarry Smith   Level: advanced
372115091d37SBarry Smith 
3722bef8e0ddSBarry Smith   Notes:
3723bef8e0ddSBarry Smith   This can be called if you have precomputed the nonzero structure of the
3724bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
372511a5261eSBarry Smith   of the `MatSetValues()` operation.
3726bef8e0ddSBarry Smith 
3727bef8e0ddSBarry Smith   You MUST have set the correct numbers of nonzeros per row in the call to
372811a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the columns indices MUST be sorted.
3729bef8e0ddSBarry Smith 
373011a5261eSBarry Smith   MUST be called before any calls to `MatSetValues()`
3731bef8e0ddSBarry Smith 
3732b9617806SBarry Smith   The indices should start with zero, not one.
3733b9617806SBarry Smith 
37341cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
3735bef8e0ddSBarry Smith @*/
3736d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3737d71ae5a4SJacob Faibussowitsch {
3738bef8e0ddSBarry Smith   PetscFunctionBegin;
37390700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
37404f572ea9SToby Isaac   PetscAssertPointer(indices, 2);
3741cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
37423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3743bef8e0ddSBarry Smith }
3744bef8e0ddSBarry Smith 
3745ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3746d71ae5a4SJacob Faibussowitsch {
3747be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3748d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3749be6bf707SBarry Smith 
3750be6bf707SBarry Smith   PetscFunctionBegin;
375128b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3752be6bf707SBarry Smith 
3753be6bf707SBarry Smith   /* allocate space for values if not already there */
37544dfa11a4SJacob Faibussowitsch   if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }
3755be6bf707SBarry Smith 
3756be6bf707SBarry Smith   /* copy values over */
37579566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
37583ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3759be6bf707SBarry Smith }
3760be6bf707SBarry Smith 
3761be6bf707SBarry Smith /*@
376220f4b53cSBarry Smith   MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
3763be6bf707SBarry Smith   nonlinear portion.
3764be6bf707SBarry Smith 
3765c3339decSBarry Smith   Logically Collect
3766be6bf707SBarry Smith 
376727430b45SBarry Smith   Input Parameter:
376811a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3769be6bf707SBarry Smith 
377015091d37SBarry Smith   Level: advanced
377115091d37SBarry Smith 
37722920cce0SJacob Faibussowitsch   Example Usage:
377327430b45SBarry Smith .vb
37742ef1f0ffSBarry Smith     Using SNES
377527430b45SBarry Smith     Create Jacobian matrix
377627430b45SBarry Smith     Set linear terms into matrix
377727430b45SBarry Smith     Apply boundary conditions to matrix, at this time matrix must have
377827430b45SBarry Smith       final nonzero structure (i.e. setting the nonlinear terms and applying
377927430b45SBarry Smith       boundary conditions again will not change the nonzero structure
378027430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
378127430b45SBarry Smith     MatStoreValues(mat);
378227430b45SBarry Smith     Call SNESSetJacobian() with matrix
378327430b45SBarry Smith     In your Jacobian routine
378427430b45SBarry Smith       MatRetrieveValues(mat);
378527430b45SBarry Smith       Set nonlinear terms in matrix
3786be6bf707SBarry Smith 
378727430b45SBarry Smith     Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
378827430b45SBarry Smith     // build linear portion of Jacobian
378927430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
379027430b45SBarry Smith     MatStoreValues(mat);
379127430b45SBarry Smith     loop over nonlinear iterations
379227430b45SBarry Smith        MatRetrieveValues(mat);
379327430b45SBarry Smith        // call MatSetValues(mat,...) to set nonliner portion of Jacobian
379427430b45SBarry Smith        // call MatAssemblyBegin/End() on matrix
379527430b45SBarry Smith        Solve linear system with Jacobian
379627430b45SBarry Smith     endloop
379727430b45SBarry Smith .ve
3798be6bf707SBarry Smith 
3799be6bf707SBarry Smith   Notes:
3800da81f932SPierre Jolivet   Matrix must already be assembled before calling this routine
380111a5261eSBarry Smith   Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3802be6bf707SBarry Smith   calling this routine.
3803be6bf707SBarry Smith 
38040c468ba9SBarry Smith   When this is called multiple times it overwrites the previous set of stored values
38050c468ba9SBarry Smith   and does not allocated additional space.
38060c468ba9SBarry Smith 
3807fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
3808be6bf707SBarry Smith @*/
3809d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3810d71ae5a4SJacob Faibussowitsch {
3811be6bf707SBarry Smith   PetscFunctionBegin;
38120700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
381328b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
381428b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3815cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
38163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3817be6bf707SBarry Smith }
3818be6bf707SBarry Smith 
3819ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3820d71ae5a4SJacob Faibussowitsch {
3821be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3822d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3823be6bf707SBarry Smith 
3824be6bf707SBarry Smith   PetscFunctionBegin;
382528b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
382628b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3827be6bf707SBarry Smith   /* copy values over */
38289566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
38293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3830be6bf707SBarry Smith }
3831be6bf707SBarry Smith 
3832be6bf707SBarry Smith /*@
383320f4b53cSBarry Smith   MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`
3834be6bf707SBarry Smith 
3835c3339decSBarry Smith   Logically Collect
3836be6bf707SBarry Smith 
38372fe279fdSBarry Smith   Input Parameter:
383811a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3839be6bf707SBarry Smith 
384015091d37SBarry Smith   Level: advanced
384115091d37SBarry Smith 
38421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
3843be6bf707SBarry Smith @*/
3844d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3845d71ae5a4SJacob Faibussowitsch {
3846be6bf707SBarry Smith   PetscFunctionBegin;
38470700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
384828b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
384928b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3850cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
38513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3852be6bf707SBarry Smith }
3853be6bf707SBarry Smith 
38545d83a8b1SBarry Smith /*@
385511a5261eSBarry Smith   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
38560d15e28bSLois Curfman McInnes   (the default parallel PETSc format).  For good matrix assembly performance
385720f4b53cSBarry Smith   the user should preallocate the matrix storage by setting the parameter `nz`
385820f4b53cSBarry Smith   (or the array `nnz`).
385917ab2063SBarry Smith 
3860d083f849SBarry Smith   Collective
3861db81eaa0SLois Curfman McInnes 
386217ab2063SBarry Smith   Input Parameters:
386311a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF`
386417ab2063SBarry Smith . m    - number of rows
386517ab2063SBarry Smith . n    - number of columns
386617ab2063SBarry Smith . nz   - number of nonzeros per row (same for all rows)
386751c19458SBarry Smith - nnz  - array containing the number of nonzeros in the various rows
38680298fd71SBarry Smith          (possibly different for each row) or NULL
386917ab2063SBarry Smith 
387017ab2063SBarry Smith   Output Parameter:
3871416022c9SBarry Smith . A - the matrix
387217ab2063SBarry Smith 
38732ef1f0ffSBarry Smith   Options Database Keys:
38742ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
38752ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38762ef1f0ffSBarry Smith 
38772ef1f0ffSBarry Smith   Level: intermediate
3878175b88e8SBarry Smith 
3879b259b22eSLois Curfman McInnes   Notes:
388077433607SBarry Smith   It is recommend to use `MatCreateFromOptions()` instead of this routine
388177433607SBarry Smith 
38822ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
388349a6f317SBarry Smith 
38842ef1f0ffSBarry Smith   The `MATSEQAIJ` format, also called
38852ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
38860002213bSLois Curfman McInnes   storage.  That is, the stored row and column indices can begin at
38872ef1f0ffSBarry Smith   either one (as in Fortran) or zero.
388817ab2063SBarry Smith 
388920f4b53cSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
38902ef1f0ffSBarry Smith   Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
389120f4b53cSBarry Smith   allocation.
389217ab2063SBarry Smith 
3893682d7d0cSBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
38944fca80b9SLois Curfman McInnes   improve numerical efficiency of matrix-vector products and solves. We
3895682d7d0cSBarry Smith   search for consecutive rows with the same nonzero structure, thereby
38966c7ebb05SLois Curfman McInnes   reusing matrix information to achieve increased efficiency.
38976c7ebb05SLois Curfman McInnes 
38981cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
389917ab2063SBarry Smith @*/
3900d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3901d71ae5a4SJacob Faibussowitsch {
39023a40ed3dSBarry Smith   PetscFunctionBegin;
39039566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
39049566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
39059566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
39069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
39073ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3908273d9f13SBarry Smith }
3909273d9f13SBarry Smith 
39105d83a8b1SBarry Smith /*@
3911273d9f13SBarry Smith   MatSeqAIJSetPreallocation - For good matrix assembly performance
3912273d9f13SBarry Smith   the user should preallocate the matrix storage by setting the parameter nz
3913273d9f13SBarry Smith   (or the array nnz).  By setting these parameters accurately, performance
3914273d9f13SBarry Smith   during matrix assembly can be increased by more than a factor of 50.
3915273d9f13SBarry Smith 
3916d083f849SBarry Smith   Collective
3917273d9f13SBarry Smith 
3918273d9f13SBarry Smith   Input Parameters:
39191c4f3114SJed Brown + B   - The matrix
3920273d9f13SBarry Smith . nz  - number of nonzeros per row (same for all rows)
3921273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows
39220298fd71SBarry Smith          (possibly different for each row) or NULL
3923273d9f13SBarry Smith 
39242ef1f0ffSBarry Smith   Options Database Keys:
39252ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
39262ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
39272ef1f0ffSBarry Smith 
39282ef1f0ffSBarry Smith   Level: intermediate
39292ef1f0ffSBarry Smith 
3930273d9f13SBarry Smith   Notes:
39312ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
393249a6f317SBarry Smith 
393311a5261eSBarry Smith   The `MATSEQAIJ` format also called
39342ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
3935273d9f13SBarry Smith   storage.  That is, the stored row and column indices can begin at
3936273d9f13SBarry Smith   either one (as in Fortran) or zero.  See the users' manual for details.
3937273d9f13SBarry Smith 
39382ef1f0ffSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
39392ef1f0ffSBarry Smith   Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
39402ef1f0ffSBarry Smith   allocation.
3941273d9f13SBarry Smith 
394211a5261eSBarry Smith   You can call `MatGetInfo()` to get information on how effective the preallocation was;
3943aa95bbe8SBarry Smith   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3944aa95bbe8SBarry Smith   You can also run with the option -info and look for messages with the string
3945aa95bbe8SBarry Smith   malloc in them to see if additional memory allocation was needed.
3946aa95bbe8SBarry Smith 
394711a5261eSBarry Smith   Developer Notes:
394811a5261eSBarry Smith   Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3949a96a251dSBarry Smith   entries or columns indices
3950a96a251dSBarry Smith 
3951273d9f13SBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
3952273d9f13SBarry Smith   improve numerical efficiency of matrix-vector products and solves. We
3953273d9f13SBarry Smith   search for consecutive rows with the same nonzero structure, thereby
3954273d9f13SBarry Smith   reusing matrix information to achieve increased efficiency.
3955273d9f13SBarry Smith 
39561cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3957db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3958273d9f13SBarry Smith @*/
3959d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3960d71ae5a4SJacob Faibussowitsch {
3961a23d5eceSKris Buschelman   PetscFunctionBegin;
39626ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
39636ba663aaSJed Brown   PetscValidType(B, 1);
3964cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
39653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3966a23d5eceSKris Buschelman }
3967a23d5eceSKris Buschelman 
3968d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3969d71ae5a4SJacob Faibussowitsch {
3970ad79cf63SBarry Smith   Mat_SeqAIJ *b              = (Mat_SeqAIJ *)B->data;
39712576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
397297f1f81fSBarry Smith   PetscInt    i;
3973273d9f13SBarry Smith 
3974273d9f13SBarry Smith   PetscFunctionBegin;
3975ad79cf63SBarry Smith   if (B->hash_active) {
3976aea10558SJacob Faibussowitsch     B->ops[0] = b->cops;
3977ad79cf63SBarry Smith     PetscCall(PetscHMapIJVDestroy(&b->ht));
3978ad79cf63SBarry Smith     PetscCall(PetscFree(b->dnz));
3979ad79cf63SBarry Smith     B->hash_active = PETSC_FALSE;
3980ad79cf63SBarry Smith   }
39812576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3982a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3983c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3984c461c341SBarry Smith     nz             = 0;
3985c461c341SBarry Smith   }
39869566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
39879566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3988899cda47SBarry Smith 
3989435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
399008401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
39919f0612e4SBarry Smith   if (nnz) {
3992d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
399308401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
399408401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3995b73539f3SBarry Smith     }
3996b73539f3SBarry Smith   }
3997b73539f3SBarry Smith 
3998273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
3999ab93d7beSBarry Smith   if (!skipallocation) {
40004dfa11a4SJacob Faibussowitsch     if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); }
4001071fcb05SBarry Smith     if (!b->ilen) {
4002071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
40039566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
4004071fcb05SBarry Smith     } else {
40059566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
40062ee49352SLisandro Dalcin     }
4007aa624791SPierre Jolivet     if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre));
4008273d9f13SBarry Smith     if (!nnz) {
4009435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
4010c62bd62aSJed Brown       else if (nz < 0) nz = 1;
40115d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
4012d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
4013c43c4a61SBarry Smith       PetscCall(PetscIntMultError(nz, B->rmap->n, &nz));
4014273d9f13SBarry Smith     } else {
4015c73702f5SBarry Smith       PetscInt64 nz64 = 0;
40169371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
40179371c9d4SSatish Balay         b->imax[i] = nnz[i];
40189371c9d4SSatish Balay         nz64 += nnz[i];
40199371c9d4SSatish Balay       }
40209566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
4021273d9f13SBarry Smith     }
4022ab93d7beSBarry Smith 
4023273d9f13SBarry Smith     /* allocate the matrix space */
40249566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
40259f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j));
40269f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i));
40279f0612e4SBarry Smith     b->free_ij = PETSC_TRUE;
4028396832f4SHong Zhang     if (B->structure_only) {
40299f0612e4SBarry Smith       b->free_a = PETSC_FALSE;
4030396832f4SHong Zhang     } else {
40319f0612e4SBarry Smith       PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a));
40329f0612e4SBarry Smith       b->free_a = PETSC_TRUE;
4033396832f4SHong Zhang     }
4034bfeeae90SHong Zhang     b->i[0] = 0;
4035ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
4036c461c341SBarry Smith   } else {
4037e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
4038e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
4039c461c341SBarry Smith   }
4040273d9f13SBarry Smith 
4041846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
4042846b4da1SFande Kong     /* reserve user-requested sparsity */
40439566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
4044846b4da1SFande Kong   }
4045846b4da1SFande Kong 
4046273d9f13SBarry Smith   b->nz               = 0;
4047273d9f13SBarry Smith   b->maxnz            = nz;
4048273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
40491baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
4050cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
4051cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
40525519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
40535519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
40545519a089SJose E. Roman   */
40555519a089SJose E. Roman   B->nonzerostate++;
40563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4057273d9f13SBarry Smith }
4058273d9f13SBarry Smith 
40594c51d546SAlexander PetscErrorCode MatResetPreallocation_SeqAIJ_Private(Mat A, PetscBool *memoryreset)
4060d71ae5a4SJacob Faibussowitsch {
4061846b4da1SFande Kong   Mat_SeqAIJ *a;
4062a5bbaf83SFande Kong   PetscInt    i;
40631f14be2bSBarry Smith   PetscBool   skipreset;
4064846b4da1SFande Kong 
4065846b4da1SFande Kong   PetscFunctionBegin;
4066846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
406714d0e64fSAlex Lindsay 
40684c51d546SAlexander   PetscCheck(A->insertmode == NOT_SET_VALUES, PETSC_COMM_SELF, PETSC_ERR_SUP, "Cannot reset preallocation after setting some values but not yet calling MatAssemblyBegin()/MatAssemblyEnd()");
40694c51d546SAlexander   if (A->num_ass == 0) PetscFunctionReturn(PETSC_SUCCESS);
40704c51d546SAlexander 
407114d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
40723ba16761SJacob Faibussowitsch   if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS);
407314d0e64fSAlex Lindsay 
4074846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
40752c814fdeSFande Kong   /* if no saved info, we error out */
407628b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
40772c814fdeSFande Kong 
40781f14be2bSBarry Smith   PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and cannot reset preallocation ");
40792c814fdeSFande Kong 
40801f14be2bSBarry Smith   PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset));
40814c51d546SAlexander   if (skipreset) PetscCall(MatZeroEntries(A));
40824c51d546SAlexander   else {
40839566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
40849566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
4085846b4da1SFande Kong     a->i[0] = 0;
4086ad540459SPierre Jolivet     for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
4087846b4da1SFande Kong     A->preallocated     = PETSC_TRUE;
4088846b4da1SFande Kong     a->nz               = 0;
4089846b4da1SFande Kong     a->maxnz            = a->i[A->rmap->n];
4090846b4da1SFande Kong     A->info.nz_unneeded = (double)a->maxnz;
4091846b4da1SFande Kong     A->was_assembled    = PETSC_FALSE;
4092846b4da1SFande Kong     A->assembled        = PETSC_FALSE;
4093b3a35320SAlex Lindsay     A->nonzerostate++;
4094b3a35320SAlex Lindsay     /* Log that the state of this object has changed; this will help guarantee that preconditioners get re-setup */
4095b3a35320SAlex Lindsay     PetscCall(PetscObjectStateIncrease((PetscObject)A));
40961f14be2bSBarry Smith   }
40974c51d546SAlexander   if (memoryreset) *memoryreset = (PetscBool)!skipreset;
40984c51d546SAlexander   PetscFunctionReturn(PETSC_SUCCESS);
40994c51d546SAlexander }
41004c51d546SAlexander 
41014c51d546SAlexander static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
41024c51d546SAlexander {
41034c51d546SAlexander   PetscFunctionBegin;
41044c51d546SAlexander   PetscCall(MatResetPreallocation_SeqAIJ_Private(A, NULL));
41053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4106846b4da1SFande Kong }
4107846b4da1SFande Kong 
410858d36128SBarry Smith /*@
410911a5261eSBarry Smith   MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4110a1661176SMatthew Knepley 
4111a1661176SMatthew Knepley   Input Parameters:
4112a1661176SMatthew Knepley + B - the matrix
4113d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero)
4114d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row
4115d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided
4116a1661176SMatthew Knepley 
4117a1661176SMatthew Knepley   Level: developer
4118a1661176SMatthew Knepley 
41196a9b8d82SBarry Smith   Notes:
41202ef1f0ffSBarry Smith   The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
412158d36128SBarry Smith 
41226a9b8d82SBarry Smith   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
41236a9b8d82SBarry Smith   structure will be the union of all the previous nonzero structures.
41246a9b8d82SBarry Smith 
41256a9b8d82SBarry Smith   Developer Notes:
41262ef1f0ffSBarry Smith   An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and
41272ef1f0ffSBarry Smith   then just copies the `v` values directly with `PetscMemcpy()`.
41286a9b8d82SBarry Smith 
412911a5261eSBarry Smith   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
41306a9b8d82SBarry Smith 
4131fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()`
4132a1661176SMatthew Knepley @*/
4133d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4134d71ae5a4SJacob Faibussowitsch {
4135a1661176SMatthew Knepley   PetscFunctionBegin;
41360700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
41376ba663aaSJed Brown   PetscValidType(B, 1);
4138cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
41393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4140a1661176SMatthew Knepley }
4141a1661176SMatthew Knepley 
4142ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4143d71ae5a4SJacob Faibussowitsch {
4144a1661176SMatthew Knepley   PetscInt  i;
4145a1661176SMatthew Knepley   PetscInt  m, n;
4146a1661176SMatthew Knepley   PetscInt  nz;
41476a9b8d82SBarry Smith   PetscInt *nnz;
4148a1661176SMatthew Knepley 
4149a1661176SMatthew Knepley   PetscFunctionBegin;
4150aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4151779a8d59SSatish Balay 
41529566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
41539566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4154779a8d59SSatish Balay 
41559566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
41569566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4157a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4158b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
415908401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4160a1661176SMatthew Knepley     nnz[i] = nz;
4161a1661176SMatthew Knepley   }
41629566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
41639566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4164a1661176SMatthew Knepley 
41658e3a54c0SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES));
4166a1661176SMatthew Knepley 
41679566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
41689566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4169a1661176SMatthew Knepley 
41709566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
41713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4172a1661176SMatthew Knepley }
4173a1661176SMatthew Knepley 
4174ad7e164aSPierre Jolivet /*@
41752ef1f0ffSBarry Smith   MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`.
4176ad7e164aSPierre Jolivet 
4177ad7e164aSPierre Jolivet   Input Parameters:
4178ad7e164aSPierre Jolivet + A     - left-hand side matrix
4179ad7e164aSPierre Jolivet . B     - right-hand side matrix
418011a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4181ad7e164aSPierre Jolivet 
4182ad7e164aSPierre Jolivet   Output Parameter:
41832ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B`
4184ad7e164aSPierre Jolivet 
4185ad7e164aSPierre Jolivet   Level: intermediate
4186ad7e164aSPierre Jolivet 
418711a5261eSBarry Smith   Note:
418811a5261eSBarry Smith   `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`.
4189ad7e164aSPierre Jolivet 
41901cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4191ad7e164aSPierre Jolivet @*/
4192d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4193d71ae5a4SJacob Faibussowitsch {
4194ad7e164aSPierre Jolivet   PetscFunctionBegin;
4195ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4196ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4197ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4198ad7e164aSPierre Jolivet   PetscValidType(B, 2);
41994f572ea9SToby Isaac   PetscAssertPointer(C, 4);
4200ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4201ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4202ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4203ad7e164aSPierre Jolivet   }
4204cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
42053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4206ad7e164aSPierre Jolivet }
4207ad7e164aSPierre Jolivet 
4208ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4209d71ae5a4SJacob Faibussowitsch {
4210ad7e164aSPierre Jolivet   Mat                newmat;
4211ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4212ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4213ad7e164aSPierre Jolivet   PetscScalar       *v;
4214fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4215ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4216ad7e164aSPierre Jolivet   PetscBool          flg;
4217ad7e164aSPierre Jolivet 
4218ad7e164aSPierre Jolivet   PetscFunctionBegin;
421928b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
422028b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
422128b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
422228b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
42239566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
422428b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4225aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4226ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
42279566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
42289566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
42299566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
42309566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4231ad7e164aSPierre Jolivet     i[0] = 0;
4232ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4233ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4234ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4235ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4236ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4237ad7e164aSPierre Jolivet         }
4238ad7e164aSPierre Jolivet       }
4239ad7e164aSPierre Jolivet     }
42409566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4241ad7e164aSPierre Jolivet     *C = newmat;
42429566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4243ad7e164aSPierre Jolivet     nnz = 0;
4244ad7e164aSPierre Jolivet   }
42459566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
42469566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
42479566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4248ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4249ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4250ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4251ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4252ad7e164aSPierre Jolivet       }
4253ad7e164aSPierre Jolivet     }
4254ad7e164aSPierre Jolivet   }
42559566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
42569566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
42579566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
42583ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4259ad7e164aSPierre Jolivet }
4260ad7e164aSPierre Jolivet 
4261c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4262af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4263170fe5c8SBarry Smith 
4264170fe5c8SBarry Smith /*
4265170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4266170fe5c8SBarry Smith 
4267170fe5c8SBarry Smith                n                       p                          p
42682da392ccSBarry Smith         [             ]       [             ]         [                 ]
42692da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
42702da392ccSBarry Smith         [             ]       [             ]         [                 ]
4271170fe5c8SBarry Smith 
4272170fe5c8SBarry Smith */
4273d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4274d71ae5a4SJacob Faibussowitsch {
4275170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4276170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4277170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
427886214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4279170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4280170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4281170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
428286214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
428386214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4284170fe5c8SBarry Smith 
4285170fe5c8SBarry Smith   PetscFunctionBegin;
4286d0f46423SBarry Smith   m = A->rmap->n;
4287d0f46423SBarry Smith   n = A->cmap->n;
4288d0f46423SBarry Smith   p = B->cmap->n;
4289170fe5c8SBarry Smith   a = sub_a->v;
4290170fe5c8SBarry Smith   b = sub_b->a;
4291170fe5c8SBarry Smith   c = sub_c->v;
429286214ceeSStefano Zampini   if (clda == m) {
42939566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
429486214ceeSStefano Zampini   } else {
429586214ceeSStefano Zampini     for (j = 0; j < p; j++)
42969371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
429786214ceeSStefano Zampini   }
4298170fe5c8SBarry Smith   ii  = sub_b->i;
4299170fe5c8SBarry Smith   idx = sub_b->j;
4300170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4301170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4302170fe5c8SBarry Smith     while (q-- > 0) {
430386214ceeSStefano Zampini       c_q = c + clda * (*idx);
430486214ceeSStefano Zampini       a_q = a + alda * i;
4305854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4306170fe5c8SBarry Smith       idx++;
4307170fe5c8SBarry Smith       b++;
4308170fe5c8SBarry Smith     }
4309170fe5c8SBarry Smith   }
43103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4311170fe5c8SBarry Smith }
4312170fe5c8SBarry Smith 
4313d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4314d71ae5a4SJacob Faibussowitsch {
4315d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
431686214ceeSStefano Zampini   PetscBool cisdense;
4317170fe5c8SBarry Smith 
4318170fe5c8SBarry Smith   PetscFunctionBegin;
431908401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
43209566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
43219566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
4322d5e393b6SSuyash Tandon   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, ""));
432348a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
43249566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4325d73949e8SHong Zhang 
43264222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
43273ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4328170fe5c8SBarry Smith }
4329170fe5c8SBarry Smith 
43300bad9183SKris Buschelman /*MC
4331fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
43320bad9183SKris Buschelman    based on compressed sparse row format.
43330bad9183SKris Buschelman 
43342ef1f0ffSBarry Smith    Options Database Key:
43350bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
43360bad9183SKris Buschelman 
43370bad9183SKris Buschelman    Level: beginner
43380bad9183SKris Buschelman 
43390cd7f59aSBarry Smith    Notes:
43402ef1f0ffSBarry Smith     `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values,
43410cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
43420cd7f59aSBarry Smith     in the matrix
43430cd7f59aSBarry Smith 
    `MatSetOption`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored
43460cd7f59aSBarry Smith 
434711a5261eSBarry Smith   Developer Note:
43482ef1f0ffSBarry Smith     It would be nice if all matrix formats supported passing `NULL` in for the numerical values
43490cd7f59aSBarry Smith 
43501cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
43510bad9183SKris Buschelman M*/
43520bad9183SKris Buschelman 
4353ccd284c7SBarry Smith /*MC
4354ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4355ccd284c7SBarry Smith 
435611a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
435711a5261eSBarry Smith    and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
435811a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4359ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4360ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4361ccd284c7SBarry Smith 
43622ef1f0ffSBarry Smith    Options Database Key:
436311a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`
4364ccd284c7SBarry Smith 
43652ef1f0ffSBarry Smith   Level: beginner
43662ef1f0ffSBarry Smith 
436711a5261eSBarry Smith    Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`. This matrix type also automatically
   switches over to use inodes when enough exist.
4370ccd284c7SBarry Smith 
43711cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
4372ccd284c7SBarry Smith M*/
4373ccd284c7SBarry Smith 
4374ccd284c7SBarry Smith /*MC
4375ccd284c7SBarry Smith    MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.
4376ccd284c7SBarry Smith 
43772ef1f0ffSBarry Smith    Options Database Key:
43782ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`
43792ef1f0ffSBarry Smith 
43802ef1f0ffSBarry Smith   Level: beginner
43812ef1f0ffSBarry Smith 
43822ef1f0ffSBarry Smith    Note:
438311a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
438411a5261eSBarry Smith    and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
438511a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4386ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4387ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4388ccd284c7SBarry Smith 
.seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
4390ccd284c7SBarry Smith M*/
4391ccd284c7SBarry Smith 
43927906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
43937906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
43947906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
43957906f579SHong Zhang #endif
4396d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
4397d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4398d24d4204SJose E. Roman #endif
43997906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
44007906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
44017906f579SHong Zhang #endif
44027906f579SHong Zhang 
4403d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4404c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
44054222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
44067906f579SHong Zhang 
44078c778c55SBarry Smith /*@C
440811a5261eSBarry Smith   MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
44098c778c55SBarry Smith 
44108c778c55SBarry Smith   Not Collective
44118c778c55SBarry Smith 
44128c778c55SBarry Smith   Input Parameter:
4413fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44148c778c55SBarry Smith 
44158c778c55SBarry Smith   Output Parameter:
44168c778c55SBarry Smith . array - pointer to the data
44178c778c55SBarry Smith 
44188c778c55SBarry Smith   Level: intermediate
44198c778c55SBarry Smith 
4420ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`
44218c778c55SBarry Smith @*/
44225d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[])
4423d71ae5a4SJacob Faibussowitsch {
4424d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44258c778c55SBarry Smith 
44268c778c55SBarry Smith   PetscFunctionBegin;
4427d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
44289566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4429d67d9f35SJunchao Zhang   } else {
4430d67d9f35SJunchao Zhang     *array = aij->a;
4431d67d9f35SJunchao Zhang   }
44323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4433d67d9f35SJunchao Zhang }
4434d67d9f35SJunchao Zhang 
4435d67d9f35SJunchao Zhang /*@C
443611a5261eSBarry Smith   MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4437d67d9f35SJunchao Zhang 
4438d67d9f35SJunchao Zhang   Not Collective
4439d67d9f35SJunchao Zhang 
4440d67d9f35SJunchao Zhang   Input Parameters:
4441fe59aa6dSJacob Faibussowitsch + A     - a `MATSEQAIJ` matrix
4442d67d9f35SJunchao Zhang - array - pointer to the data
4443d67d9f35SJunchao Zhang 
4444d67d9f35SJunchao Zhang   Level: intermediate
4445d67d9f35SJunchao Zhang 
4446ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`
4447d67d9f35SJunchao Zhang @*/
44485d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[])
4449d71ae5a4SJacob Faibussowitsch {
4450d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4451d67d9f35SJunchao Zhang 
4452d67d9f35SJunchao Zhang   PetscFunctionBegin;
4453d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
44549566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4455d67d9f35SJunchao Zhang   } else {
4456d67d9f35SJunchao Zhang     *array = NULL;
4457d67d9f35SJunchao Zhang   }
44589566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
44599566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
44603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44618c778c55SBarry Smith }
44628c778c55SBarry Smith 
446321e72a00SBarry Smith /*@C
446411a5261eSBarry Smith   MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
44658f1ea47aSStefano Zampini 
44660ab4885dSBarry Smith   Not Collective; No Fortran Support
44678f1ea47aSStefano Zampini 
44688f1ea47aSStefano Zampini   Input Parameter:
4469fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44708f1ea47aSStefano Zampini 
44718f1ea47aSStefano Zampini   Output Parameter:
44728f1ea47aSStefano Zampini . array - pointer to the data
44738f1ea47aSStefano Zampini 
44748f1ea47aSStefano Zampini   Level: intermediate
44758f1ea47aSStefano Zampini 
44761cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
44778f1ea47aSStefano Zampini @*/
44785d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[])
4479d71ae5a4SJacob Faibussowitsch {
4480d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44818f1ea47aSStefano Zampini 
44828f1ea47aSStefano Zampini   PetscFunctionBegin;
4483d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
44849566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4485d67d9f35SJunchao Zhang   } else {
4486d67d9f35SJunchao Zhang     *array = aij->a;
4487d67d9f35SJunchao Zhang   }
44883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44898f1ea47aSStefano Zampini }
44908f1ea47aSStefano Zampini 
44918f1ea47aSStefano Zampini /*@C
449211a5261eSBarry Smith   MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
44938f1ea47aSStefano Zampini 
44940ab4885dSBarry Smith   Not Collective; No Fortran Support
44958f1ea47aSStefano Zampini 
44968f1ea47aSStefano Zampini   Input Parameter:
4497fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44988f1ea47aSStefano Zampini 
44998f1ea47aSStefano Zampini   Output Parameter:
45008f1ea47aSStefano Zampini . array - pointer to the data
45018f1ea47aSStefano Zampini 
45028f1ea47aSStefano Zampini   Level: intermediate
45038f1ea47aSStefano Zampini 
45041cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45058f1ea47aSStefano Zampini @*/
45065d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[])
4507d71ae5a4SJacob Faibussowitsch {
4508d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
45098f1ea47aSStefano Zampini 
45108f1ea47aSStefano Zampini   PetscFunctionBegin;
4511d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
45129566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4513d67d9f35SJunchao Zhang   } else {
4514d67d9f35SJunchao Zhang     *array = NULL;
4515d67d9f35SJunchao Zhang   }
45163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4517d67d9f35SJunchao Zhang }
4518d67d9f35SJunchao Zhang 
4519d67d9f35SJunchao Zhang /*@C
452011a5261eSBarry Smith   MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4521d67d9f35SJunchao Zhang 
45220ab4885dSBarry Smith   Not Collective; No Fortran Support
4523d67d9f35SJunchao Zhang 
4524d67d9f35SJunchao Zhang   Input Parameter:
4525fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
4526d67d9f35SJunchao Zhang 
4527d67d9f35SJunchao Zhang   Output Parameter:
4528d67d9f35SJunchao Zhang . array - pointer to the data
4529d67d9f35SJunchao Zhang 
4530d67d9f35SJunchao Zhang   Level: intermediate
4531d67d9f35SJunchao Zhang 
45321cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
4533d67d9f35SJunchao Zhang @*/
45345d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[])
4535d71ae5a4SJacob Faibussowitsch {
4536d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4537d67d9f35SJunchao Zhang 
4538d67d9f35SJunchao Zhang   PetscFunctionBegin;
4539d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
45409566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4541d67d9f35SJunchao Zhang   } else {
4542d67d9f35SJunchao Zhang     *array = aij->a;
4543d67d9f35SJunchao Zhang   }
45449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
45459566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
45463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4547d67d9f35SJunchao Zhang }
4548d67d9f35SJunchao Zhang 
4549d67d9f35SJunchao Zhang /*@C
4550d67d9f35SJunchao Zhang   MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead
4551d67d9f35SJunchao Zhang 
45520ab4885dSBarry Smith   Not Collective; No Fortran Support
4553d67d9f35SJunchao Zhang 
4554d67d9f35SJunchao Zhang   Input Parameter:
4555fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix
4556d67d9f35SJunchao Zhang 
4557d67d9f35SJunchao Zhang   Output Parameter:
4558d67d9f35SJunchao Zhang . array - pointer to the data
4559d67d9f35SJunchao Zhang 
4560d67d9f35SJunchao Zhang   Level: intermediate
4561d67d9f35SJunchao Zhang 
45621cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
4563d67d9f35SJunchao Zhang @*/
45645d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[])
4565d71ae5a4SJacob Faibussowitsch {
4566d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4567d67d9f35SJunchao Zhang 
4568d67d9f35SJunchao Zhang   PetscFunctionBegin;
4569d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
45709566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4571d67d9f35SJunchao Zhang   } else {
4572d67d9f35SJunchao Zhang     *array = NULL;
4573d67d9f35SJunchao Zhang   }
45743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45758f1ea47aSStefano Zampini }
45768f1ea47aSStefano Zampini 
45778f1ea47aSStefano Zampini /*@C
457811a5261eSBarry Smith   MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
45797ee59b9bSJunchao Zhang 
45800ab4885dSBarry Smith   Not Collective; No Fortran Support
45817ee59b9bSJunchao Zhang 
45827ee59b9bSJunchao Zhang   Input Parameter:
458311a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses
45847ee59b9bSJunchao Zhang 
45857ee59b9bSJunchao Zhang   Output Parameters:
45867ee59b9bSJunchao Zhang + i     - row map array of the matrix
45877ee59b9bSJunchao Zhang . j     - column index array of the matrix
45887ee59b9bSJunchao Zhang . a     - data array of the matrix
4589fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays
45907ee59b9bSJunchao Zhang 
4591fe59aa6dSJacob Faibussowitsch   Level: developer
45922ef1f0ffSBarry Smith 
45937ee59b9bSJunchao Zhang   Notes:
45942ef1f0ffSBarry Smith   Any of the output parameters can be `NULL`, in which case the corresponding value is not returned.
45957ee59b9bSJunchao Zhang   If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
45967ee59b9bSJunchao Zhang 
45977ee59b9bSJunchao Zhang   One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
45982ef1f0ffSBarry Smith   If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix.
45997ee59b9bSJunchao Zhang 
46001cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
46017ee59b9bSJunchao Zhang @*/
46025d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype)
4603d71ae5a4SJacob Faibussowitsch {
46047ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
46057ee59b9bSJunchao Zhang 
46067ee59b9bSJunchao Zhang   PetscFunctionBegin;
46077ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
46087ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
46097ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
46107ee59b9bSJunchao Zhang   } else {
46117ee59b9bSJunchao Zhang     if (i) *i = aij->i;
46127ee59b9bSJunchao Zhang     if (j) *j = aij->j;
46137ee59b9bSJunchao Zhang     if (a) *a = aij->a;
46147ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
46157ee59b9bSJunchao Zhang   }
46163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
46177ee59b9bSJunchao Zhang }
46187ee59b9bSJunchao Zhang 
4619cc4c1da9SBarry Smith /*@
462021e72a00SBarry Smith   MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
462121e72a00SBarry Smith 
462221e72a00SBarry Smith   Not Collective
462321e72a00SBarry Smith 
462421e72a00SBarry Smith   Input Parameter:
4625fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
462621e72a00SBarry Smith 
462721e72a00SBarry Smith   Output Parameter:
462821e72a00SBarry Smith . nz - the maximum number of nonzeros in any row
462921e72a00SBarry Smith 
463021e72a00SBarry Smith   Level: intermediate
463121e72a00SBarry Smith 
4632ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`
463321e72a00SBarry Smith @*/
4634d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4635d71ae5a4SJacob Faibussowitsch {
463621e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
463721e72a00SBarry Smith 
463821e72a00SBarry Smith   PetscFunctionBegin;
463921e72a00SBarry Smith   *nz = aij->rmax;
46403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
464121e72a00SBarry Smith }
464221e72a00SBarry Smith 
464349abdd8aSBarry Smith static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void **data)
46442c4ab24aSJunchao Zhang {
464549abdd8aSBarry Smith   MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)*data;
46464d86920dSPierre Jolivet 
46472c4ab24aSJunchao Zhang   PetscFunctionBegin;
46482c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->perm));
46492c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->jmap));
46502c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo));
46512c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
46522c4ab24aSJunchao Zhang }
46532c4ab24aSJunchao Zhang 
4654d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4655d71ae5a4SJacob Faibussowitsch {
4656394ed5ebSJunchao Zhang   MPI_Comm             comm;
4657394ed5ebSJunchao Zhang   PetscInt            *i, *j;
46580d88f7f4SJunchao Zhang   PetscInt             M, N, row, iprev;
4659394ed5ebSJunchao Zhang   PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4660394ed5ebSJunchao Zhang   PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
4661394ed5ebSJunchao Zhang   PetscInt            *Aj;
4662394ed5ebSJunchao Zhang   PetscScalar         *Aa;
4663f4f49eeaSPierre Jolivet   Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)mat->data;
4664cbc6b225SStefano Zampini   MatType              rtype;
4665394ed5ebSJunchao Zhang   PetscCount          *perm, *jmap;
46662c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
46670d88f7f4SJunchao Zhang   PetscBool            isorted;
46689f0612e4SBarry Smith   PetscBool            hypre;
46699f0612e4SBarry Smith   const char          *name;
4670394ed5ebSJunchao Zhang 
4671394ed5ebSJunchao Zhang   PetscFunctionBegin;
46729566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
46739566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4674e8729f6fSJunchao Zhang   i = coo_i;
4675e8729f6fSJunchao Zhang   j = coo_j;
46769566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
46770d88f7f4SJunchao Zhang 
46780d88f7f4SJunchao Zhang   /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */
46790d88f7f4SJunchao Zhang   isorted = PETSC_TRUE;
46800d88f7f4SJunchao Zhang   iprev   = PETSC_INT_MIN;
46810d88f7f4SJunchao Zhang   for (k = 0; k < coo_n; k++) {
4682394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
46830d88f7f4SJunchao Zhang     if (isorted) {
46840d88f7f4SJunchao Zhang       if (i[k] < iprev) isorted = PETSC_FALSE;
46850d88f7f4SJunchao Zhang       else iprev = i[k];
46860d88f7f4SJunchao Zhang     }
4687394ed5ebSJunchao Zhang     perm[k] = k;
4688394ed5ebSJunchao Zhang   }
4689394ed5ebSJunchao Zhang 
46900d88f7f4SJunchao Zhang   /* Sort by row if not already */
46910d88f7f4SJunchao Zhang   if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
4692651b1cf9SStefano Zampini 
4693651b1cf9SStefano Zampini   /* Advance k to the first row with a non-negative index */
4694651b1cf9SStefano Zampini   for (k = 0; k < coo_n; k++)
46959371c9d4SSatish Balay     if (i[k] >= 0) break;
4696394ed5ebSJunchao Zhang   nneg = k;
46979566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4698394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
469935cb6cd3SPierre Jolivet   jmap++;                                           /* Inc jmap by 1 for convenience */
4700394ed5ebSJunchao Zhang 
47019f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */
47029f0612e4SBarry Smith   PetscCall(PetscArrayzero(Ai, M + 1));
47039f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */
4704394ed5ebSJunchao Zhang 
4705651b1cf9SStefano Zampini   PetscCall(PetscObjectGetName((PetscObject)mat, &name));
4706651b1cf9SStefano Zampini   PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre));
4707651b1cf9SStefano Zampini 
4708394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
470935cb6cd3SPierre Jolivet   Ai++;  /* Inc by 1 for convenience */
4710394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4711394ed5ebSJunchao Zhang   while (k < coo_n) {
47120d88f7f4SJunchao Zhang     PetscBool strictly_sorted; // this row is strictly sorted?
47130d88f7f4SJunchao Zhang     PetscInt  jprev;
47140d88f7f4SJunchao Zhang 
47150d88f7f4SJunchao Zhang     /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */
4716394ed5ebSJunchao Zhang     row             = i[k];
47170d88f7f4SJunchao Zhang     start           = k;
47180d88f7f4SJunchao Zhang     jprev           = PETSC_INT_MIN;
47190d88f7f4SJunchao Zhang     strictly_sorted = PETSC_TRUE;
47200d88f7f4SJunchao Zhang     while (k < coo_n && i[k] == row) {
47210d88f7f4SJunchao Zhang       if (strictly_sorted) {
47220d88f7f4SJunchao Zhang         if (j[k] <= jprev) strictly_sorted = PETSC_FALSE;
47230d88f7f4SJunchao Zhang         else jprev = j[k];
47240d88f7f4SJunchao Zhang       }
47250d88f7f4SJunchao Zhang       k++;
47260d88f7f4SJunchao Zhang     }
4727394ed5ebSJunchao Zhang     end = k;
47280d88f7f4SJunchao Zhang 
4729651b1cf9SStefano Zampini     /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
4730651b1cf9SStefano Zampini     if (hypre) {
47311690c2aeSBarry Smith       PetscInt  minj    = PETSC_INT_MAX;
4732651b1cf9SStefano Zampini       PetscBool hasdiag = PETSC_FALSE;
47330d88f7f4SJunchao Zhang 
47340d88f7f4SJunchao Zhang       if (strictly_sorted) { // fast path to swap the first and the diag
47350d88f7f4SJunchao Zhang         PetscCount tmp;
47360d88f7f4SJunchao Zhang         for (p = start; p < end; p++) {
47370d88f7f4SJunchao Zhang           if (j[p] == row && p != start) {
47381c265611SJunchao Zhang             j[p]        = j[start]; // swap j[], so that the diagonal value will go first (manipulated by perm[])
47390d88f7f4SJunchao Zhang             j[start]    = row;
47400d88f7f4SJunchao Zhang             tmp         = perm[start];
47411c265611SJunchao Zhang             perm[start] = perm[p]; // also swap perm[] so we can save the call to PetscSortIntWithCountArray() below
47420d88f7f4SJunchao Zhang             perm[p]     = tmp;
47430d88f7f4SJunchao Zhang             break;
47440d88f7f4SJunchao Zhang           }
47450d88f7f4SJunchao Zhang         }
47460d88f7f4SJunchao Zhang       } else {
4747651b1cf9SStefano Zampini         for (p = start; p < end; p++) {
4748651b1cf9SStefano Zampini           hasdiag = (PetscBool)(hasdiag || (j[p] == row));
4749651b1cf9SStefano Zampini           minj    = PetscMin(minj, j[p]);
4750651b1cf9SStefano Zampini         }
47510d88f7f4SJunchao Zhang 
4752651b1cf9SStefano Zampini         if (hasdiag) {
4753651b1cf9SStefano Zampini           for (p = start; p < end; p++) {
4754651b1cf9SStefano Zampini             if (j[p] == minj) j[p] = row;
4755651b1cf9SStefano Zampini             else if (j[p] == row) j[p] = minj;
4756651b1cf9SStefano Zampini           }
4757651b1cf9SStefano Zampini         }
4758651b1cf9SStefano Zampini       }
47590d88f7f4SJunchao Zhang     }
47601c265611SJunchao Zhang     // sort by columns in a row. perm[] indicates their original order
47610d88f7f4SJunchao Zhang     if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
4762651b1cf9SStefano Zampini 
47630d88f7f4SJunchao Zhang     if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q
47640d88f7f4SJunchao Zhang       for (p = start; p < end; p++, q++) {
47650d88f7f4SJunchao Zhang         Aj[q]   = j[p];
47660d88f7f4SJunchao Zhang         jmap[q] = 1;
47670d88f7f4SJunchao Zhang       }
47686497c311SBarry Smith       PetscCall(PetscIntCast(end - start, Ai + row));
47690d88f7f4SJunchao Zhang       nnz += Ai[row]; // q is already advanced
47700d88f7f4SJunchao Zhang     } else {
4771394ed5ebSJunchao Zhang       /* Find number of unique col entries in this row */
4772394ed5ebSJunchao Zhang       Aj[q]   = j[start]; /* Log the first nonzero in this row */
4773651b1cf9SStefano Zampini       jmap[q] = 1;        /* Number of repeats of this nonzero entry */
4774394ed5ebSJunchao Zhang       Ai[row] = 1;
4775394ed5ebSJunchao Zhang       nnz++;
4776394ed5ebSJunchao Zhang 
4777394ed5ebSJunchao Zhang       for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4778394ed5ebSJunchao Zhang         if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4779394ed5ebSJunchao Zhang           q++;
4780394ed5ebSJunchao Zhang           jmap[q] = 1;
4781394ed5ebSJunchao Zhang           Aj[q]   = j[p];
4782394ed5ebSJunchao Zhang           Ai[row]++;
4783394ed5ebSJunchao Zhang           nnz++;
4784394ed5ebSJunchao Zhang         } else {
4785394ed5ebSJunchao Zhang           jmap[q]++;
4786394ed5ebSJunchao Zhang         }
4787394ed5ebSJunchao Zhang       }
4788394ed5ebSJunchao Zhang       q++; /* Move to next row and thus next unique nonzero */
4789394ed5ebSJunchao Zhang     }
47900d88f7f4SJunchao Zhang   }
47910d88f7f4SJunchao Zhang 
4792394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4793394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
47940d88f7f4SJunchao Zhang   jmap--; // Back to the beginning of jmap[]
4795394ed5ebSJunchao Zhang   jmap[0] = 0;
4796394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
47970d88f7f4SJunchao Zhang 
47989f0612e4SBarry Smith   if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */
4799394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4800394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4801394ed5ebSJunchao Zhang 
48029566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
48039566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
48049566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4805394ed5ebSJunchao Zhang     jmap = jmap_new;
4806394ed5ebSJunchao Zhang 
48079f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new));
48089566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
48099f0612e4SBarry Smith     PetscCall(PetscShmgetDeallocateArray((void **)&Aj));
4810394ed5ebSJunchao Zhang     Aj = Aj_new;
4811394ed5ebSJunchao Zhang   }
4812394ed5ebSJunchao Zhang 
4813394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4814394ed5ebSJunchao Zhang     PetscCount *perm_new;
4815cbc6b225SStefano Zampini 
48169566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
48179566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
48189566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4819394ed5ebSJunchao Zhang     perm = perm_new;
4820394ed5ebSJunchao Zhang   }
4821394ed5ebSJunchao Zhang 
48229566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
48239f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa));
48249f0612e4SBarry Smith   PetscCall(PetscArrayzero(Aa, nnz));
48259566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4826394ed5ebSJunchao Zhang 
4827394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
48282c4ab24aSJunchao Zhang 
48292c4ab24aSJunchao Zhang   // Put the COO struct in a container and then attach that to the matrix
48302c4ab24aSJunchao Zhang   PetscCall(PetscMalloc1(1, &coo));
48316497c311SBarry Smith   PetscCall(PetscIntCast(nnz, &coo->nz));
48322c4ab24aSJunchao Zhang   coo->n    = coo_n;
48332c4ab24aSJunchao Zhang   coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
48342c4ab24aSJunchao Zhang   coo->jmap = jmap;         // of length nnz+1
48352c4ab24aSJunchao Zhang   coo->perm = perm;
483603e76207SPierre Jolivet   PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ));
48373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4838394ed5ebSJunchao Zhang }
4839394ed5ebSJunchao Zhang 
4840d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4841d71ae5a4SJacob Faibussowitsch {
4842394ed5ebSJunchao Zhang   Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
4843394ed5ebSJunchao Zhang   PetscCount           i, j, Annz = aseq->nz;
48442c4ab24aSJunchao Zhang   PetscCount          *perm, *jmap;
4845394ed5ebSJunchao Zhang   PetscScalar         *Aa;
48462c4ab24aSJunchao Zhang   PetscContainer       container;
48472c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4848394ed5ebSJunchao Zhang 
4849394ed5ebSJunchao Zhang   PetscFunctionBegin;
48502c4ab24aSJunchao Zhang   PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
48512c4ab24aSJunchao Zhang   PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
48522c4ab24aSJunchao Zhang   PetscCall(PetscContainerGetPointer(container, (void **)&coo));
48532c4ab24aSJunchao Zhang   perm = coo->perm;
48542c4ab24aSJunchao Zhang   jmap = coo->jmap;
48559566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4856394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4857b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4858b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4859b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4860394ed5ebSJunchao Zhang   }
48619566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
48623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4863394ed5ebSJunchao Zhang }
4864394ed5ebSJunchao Zhang 
/* Prototypes of the optional conversion routines composed in MatCreate_SeqAIJ(); each exists only when its PETSC_HAVE_* macro is defined */
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat A, MatType type, MatReuse reuse, Mat *newmat);
#endif
#if defined(PETSC_HAVE_HIP)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat A, MatType type, MatReuse reuse, Mat *newmat);
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat A, MatType type, MatReuse reuse, Mat *newmat);
#endif
487402fe1965SBarry Smith 
4875d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4876d71ae5a4SJacob Faibussowitsch {
4877273d9f13SBarry Smith   Mat_SeqAIJ *b;
487838baddfdSBarry Smith   PetscMPIInt size;
4879273d9f13SBarry Smith 
4880273d9f13SBarry Smith   PetscFunctionBegin;
48819566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
488208401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4883273d9f13SBarry Smith 
48844dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
48852205254eSKarl Rupp 
4886b0a32e0cSBarry Smith   B->data   = (void *)b;
4887aea10558SJacob Faibussowitsch   B->ops[0] = MatOps_Values;
4888071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
48892205254eSKarl Rupp 
4890f4259b30SLisandro Dalcin   b->row                = NULL;
4891f4259b30SLisandro Dalcin   b->col                = NULL;
4892f4259b30SLisandro Dalcin   b->icol               = NULL;
4893b810aeb4SBarry Smith   b->reallocs           = 0;
489436db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4895f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4896416022c9SBarry Smith   b->nonew              = 0;
4897f4259b30SLisandro Dalcin   b->diag               = NULL;
4898f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4899f4259b30SLisandro Dalcin   B->spptr              = NULL;
4900f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4901f4259b30SLisandro Dalcin   b->idiag              = NULL;
4902f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4903f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
490471f1c65dSBarry Smith   b->omega              = 1.0;
490571f1c65dSBarry Smith   b->fshift             = 0.0;
490671f1c65dSBarry Smith   b->idiagvalid         = PETSC_FALSE;
4907bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4908a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
490917ab2063SBarry Smith 
49109566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4911d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
49129566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
49139566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4914b3866ffcSBarry Smith #endif
49159566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
49169566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
49179566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
49189566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
49199566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
49209566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
49219566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
49229779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
49239566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4924191b95cbSRichard Tran Mills #endif
492534b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
49269566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
49279566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49289566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
492902fe1965SBarry Smith #endif
4930d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4931d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
4932d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
4933d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
4934d5e393b6SSuyash Tandon #endif
49353d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
49369566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
49373d0639e7SStefano Zampini #endif
49389566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4939af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
49409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4941af8000cdSHong Zhang #endif
4942d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
49439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4944d24d4204SJose E. Roman #endif
494563c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
49469566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
49479566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
494863c07aadSStefano Zampini #endif
49499566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
49509566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
49519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
49529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
495314e4dea2SJose E. Roman   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ));
49549566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
49559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
4956674b392bSAlexander   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetHash_C", MatResetHash_SeqAIJ));
49579566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
49589566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
49599566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
49609566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
49619566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49629566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
49639566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
49649566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
49659566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
49669566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
49679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
49683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
496917ab2063SBarry Smith }
497017ab2063SBarry Smith 
4971b24902e0SBarry Smith /*
49723893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4973b24902e0SBarry Smith */
4974d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4975d71ae5a4SJacob Faibussowitsch {
49762a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4977071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
497817ab2063SBarry Smith 
49793a40ed3dSBarry Smith   PetscFunctionBegin;
4980aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4981273d9f13SBarry Smith 
4982d5f3da31SBarry Smith   C->factortype    = A->factortype;
4983f4259b30SLisandro Dalcin   c->row           = NULL;
4984f4259b30SLisandro Dalcin   c->col           = NULL;
4985f4259b30SLisandro Dalcin   c->icol          = NULL;
49866ad4291fSHong Zhang   c->reallocs      = 0;
4987bc43efbbSJunchao Zhang   c->diagonaldense = a->diagonaldense;
498817ab2063SBarry Smith 
498969272f91SPierre Jolivet   C->assembled = A->assembled;
499017ab2063SBarry Smith 
499169272f91SPierre Jolivet   if (A->preallocated) {
49929566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
49939566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4994eec197d1SBarry Smith 
499531fe6a7dSBarry Smith     if (!A->hash_active) {
49969566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->imax));
49979566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
49989566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->ilen));
49999566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));
500017ab2063SBarry Smith 
500117ab2063SBarry Smith       /* allocate the matrix space */
5002f77e22a1SHong Zhang       if (mallocmatspace) {
50039f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a));
50049f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j));
50059f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i));
50069566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->i, a->i, m + 1));
50079f0612e4SBarry Smith         c->free_a  = PETSC_TRUE;
50089f0612e4SBarry Smith         c->free_ij = PETSC_TRUE;
500917ab2063SBarry Smith         if (m > 0) {
50109566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
5011be6bf707SBarry Smith           if (cpvalues == MAT_COPY_VALUES) {
50122e5835c6SStefano Zampini             const PetscScalar *aa;
50132e5835c6SStefano Zampini 
50149566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
50159566063dSJacob Faibussowitsch             PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
50169566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
5017be6bf707SBarry Smith           } else {
50189566063dSJacob Faibussowitsch             PetscCall(PetscArrayzero(c->a, a->i[m]));
501917ab2063SBarry Smith           }
502008480c60SBarry Smith         }
5021f77e22a1SHong Zhang       }
502231fe6a7dSBarry Smith       C->preallocated = PETSC_TRUE;
502331fe6a7dSBarry Smith     } else {
502431fe6a7dSBarry Smith       PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix");
502531fe6a7dSBarry Smith       PetscCall(MatSetUp(C));
502631fe6a7dSBarry Smith     }
502717ab2063SBarry Smith 
50286ad4291fSHong Zhang     c->ignorezeroentries = a->ignorezeroentries;
5029416022c9SBarry Smith     c->roworiented       = a->roworiented;
5030416022c9SBarry Smith     c->nonew             = a->nonew;
5031416022c9SBarry Smith     if (a->diag) {
50329566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &c->diag));
50339566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt)));
5034071fcb05SBarry Smith     } else c->diag = NULL;
50352205254eSKarl Rupp 
5036f4259b30SLisandro Dalcin     c->solve_work         = NULL;
5037f4259b30SLisandro Dalcin     c->saved_values       = NULL;
5038f4259b30SLisandro Dalcin     c->idiag              = NULL;
5039f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
5040a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
50416ad4291fSHong Zhang 
5042893ad86cSHong Zhang     c->rmax  = a->rmax;
5043416022c9SBarry Smith     c->nz    = a->nz;
50448ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
5045754ec7b1SSatish Balay 
50466ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
50476ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
5048cd6b891eSBarry Smith     if (a->compressedrow.use) {
50496ad4291fSHong Zhang       i = a->compressedrow.nrows;
50509566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
50519566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
50529566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
505327ea64f8SHong Zhang     } else {
505427ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
50550298fd71SBarry Smith       c->compressedrow.i      = NULL;
50560298fd71SBarry Smith       c->compressedrow.rindex = NULL;
50576ad4291fSHong Zhang     }
5058ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
5059e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
50604846f1f5SKris Buschelman 
50619566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
506269272f91SPierre Jolivet   }
50639566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
50643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
506517ab2063SBarry Smith }
506617ab2063SBarry Smith 
5067d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
5068d71ae5a4SJacob Faibussowitsch {
5069b24902e0SBarry Smith   PetscFunctionBegin;
50709566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
50719566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
507248a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
50739566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
50749566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
50753ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5076b24902e0SBarry Smith }
5077b24902e0SBarry Smith 
5078d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
5079d71ae5a4SJacob Faibussowitsch {
508052f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
508152f91c60SVaclav Hapla 
508252f91c60SVaclav Hapla   PetscFunctionBegin;
508352f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
508452f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
5085c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
50869566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
50879566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
50889566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
508952f91c60SVaclav Hapla   if (isbinary) {
50909566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
509152f91c60SVaclav Hapla   } else if (ishdf5) {
509252f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
50939566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
509452f91c60SVaclav Hapla #else
509552f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
509652f91c60SVaclav Hapla #endif
509752f91c60SVaclav Hapla   } else {
509898921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
509952f91c60SVaclav Hapla   }
51003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
510152f91c60SVaclav Hapla }
510252f91c60SVaclav Hapla 
5103d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
5104d71ae5a4SJacob Faibussowitsch {
51053ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
51063ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
5107fbdbba38SShri Abhyankar 
5108fbdbba38SShri Abhyankar   PetscFunctionBegin;
51099566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
5110bbead8a2SBarry Smith 
51113ea6fe3dSLisandro Dalcin   /* read in matrix header */
51129566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
511308401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
51149371c9d4SSatish Balay   M  = header[1];
51159371c9d4SSatish Balay   N  = header[2];
51169371c9d4SSatish Balay   nz = header[3];
511708401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
511808401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
511908401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
5120fbdbba38SShri Abhyankar 
51213ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
51229566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
51233ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
51243ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
51253ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
51263ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
51273ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
51289566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
51299566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
51303ea6fe3dSLisandro Dalcin 
51313ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
51329566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5133aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51343ea6fe3dSLisandro Dalcin 
5135fbdbba38SShri Abhyankar   /* read in row lengths */
51369566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
51379566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
51383ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
51399371c9d4SSatish Balay   sum = 0;
51409371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
514108401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
51423ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
51439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
51449566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5145aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51463ea6fe3dSLisandro Dalcin   /* store row lengths */
51479566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
51489566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
5149fbdbba38SShri Abhyankar 
51503ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
51519371c9d4SSatish Balay   a->i[0] = 0;
51529371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
51533ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
51549566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
51553ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
51569566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
5157fbdbba38SShri Abhyankar 
51589566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
51599566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
51603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5161fbdbba38SShri Abhyankar }
5162fbdbba38SShri Abhyankar 
5163d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
5164d71ae5a4SJacob Faibussowitsch {
51657264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
5166fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
5167eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5168eeffb40dSHong Zhang   PetscInt k;
5169eeffb40dSHong Zhang #endif
51707264ac53SSatish Balay 
51713a40ed3dSBarry Smith   PetscFunctionBegin;
5172bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
5173d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
5174ca44d042SBarry Smith     *flg = PETSC_FALSE;
51753ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
5176bcd2baecSBarry Smith   }
51777264ac53SSatish Balay 
51787264ac53SSatish Balay   /* if the a->i are the same */
51799566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
51803ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
51817264ac53SSatish Balay 
51827264ac53SSatish Balay   /* if a->j are the same */
51839566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
51843ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
5185bcd2baecSBarry Smith 
51869566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
51879566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5188bcd2baecSBarry Smith   /* if a->a are the same */
5189eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5190eeffb40dSHong Zhang   for (k = 0; k < a->nz; k++) {
5191fff043a9SJunchao Zhang     if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) {
5192eeffb40dSHong Zhang       *flg = PETSC_FALSE;
51933ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
5194eeffb40dSHong Zhang     }
5195eeffb40dSHong Zhang   }
5196eeffb40dSHong Zhang #else
51979566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
5198eeffb40dSHong Zhang #endif
51999566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
52009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
52013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
52027264ac53SSatish Balay }
520336db0b34SBarry Smith 
520405869f15SSatish Balay /*@
520511a5261eSBarry Smith   MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
520636db0b34SBarry Smith   provided by the user.
520736db0b34SBarry Smith 
5208d083f849SBarry Smith   Collective
520936db0b34SBarry Smith 
521036db0b34SBarry Smith   Input Parameters:
521136db0b34SBarry Smith + comm - must be an MPI communicator of size 1
521236db0b34SBarry Smith . m    - number of rows
521336db0b34SBarry Smith . n    - number of columns
5214483a2f95SBarry Smith . i    - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
521536db0b34SBarry Smith . j    - column indices
521636db0b34SBarry Smith - a    - matrix values
521736db0b34SBarry Smith 
521836db0b34SBarry Smith   Output Parameter:
521936db0b34SBarry Smith . mat - the matrix
522036db0b34SBarry Smith 
522136db0b34SBarry Smith   Level: intermediate
522236db0b34SBarry Smith 
522336db0b34SBarry Smith   Notes:
52242ef1f0ffSBarry Smith   The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
5225292fb18eSBarry Smith   once the matrix is destroyed and not before
522636db0b34SBarry Smith 
522736db0b34SBarry Smith   You cannot set new nonzero locations into this matrix, that will generate an error.
522836db0b34SBarry Smith 
52292ef1f0ffSBarry Smith   The `i` and `j` indices are 0 based
523036db0b34SBarry Smith 
5231a4552177SSatish Balay   The format which is used for the sparse matrix input, is equivalent to a
5232a4552177SSatish Balay   row-major ordering.. i.e for the following matrix, the input data expected is
52338eef79e4SBarry Smith   as shown
52342ef1f0ffSBarry Smith .vb
52352ef1f0ffSBarry Smith         1 0 0
52362ef1f0ffSBarry Smith         2 0 3
52372ef1f0ffSBarry Smith         4 5 6
5238a4552177SSatish Balay 
52392ef1f0ffSBarry Smith         i =  {0,1,3,6}  [size = nrow+1  = 3+1]
52402ef1f0ffSBarry Smith         j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
52412ef1f0ffSBarry Smith         v =  {1,2,3,4,5,6}  [size = 6]
52422ef1f0ffSBarry Smith .ve
5243a4552177SSatish Balay 
52441cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
524536db0b34SBarry Smith @*/
5246d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5247d71ae5a4SJacob Faibussowitsch {
5248cbcfb4deSHong Zhang   PetscInt    ii;
524936db0b34SBarry Smith   Mat_SeqAIJ *aij;
5250cbcfb4deSHong Zhang   PetscInt    jj;
525136db0b34SBarry Smith 
525236db0b34SBarry Smith   PetscFunctionBegin;
5253aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
52549566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52559566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52569566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
52579566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52589566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5259ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
52609566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
52619566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5262ab93d7beSBarry Smith 
526336db0b34SBarry Smith   aij->i       = i;
526436db0b34SBarry Smith   aij->j       = j;
526536db0b34SBarry Smith   aij->a       = a;
526636db0b34SBarry Smith   aij->nonew   = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5267e6b907acSBarry Smith   aij->free_a  = PETSC_FALSE;
5268e6b907acSBarry Smith   aij->free_ij = PETSC_FALSE;
526936db0b34SBarry Smith 
5270cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
527136db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
527276bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5273aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
52749985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
527508401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
527608401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
52779985e31cSBarry Smith       }
527836db0b34SBarry Smith     }
527976bd3646SJed Brown   }
528076bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
528136db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
528208401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5283da0802e2SStefano Zampini       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1);
528436db0b34SBarry Smith     }
528576bd3646SJed Brown   }
528636db0b34SBarry Smith 
52879566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52889566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52893ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
529036db0b34SBarry Smith }
5291cbc6b225SStefano Zampini 
5292f62e3866SBarry Smith /*@
529311a5261eSBarry Smith   MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
52948a0b0e6bSVictor Minden   provided by the user.
52958a0b0e6bSVictor Minden 
5296d083f849SBarry Smith   Collective
52978a0b0e6bSVictor Minden 
52988a0b0e6bSVictor Minden   Input Parameters:
52998a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1
53008a0b0e6bSVictor Minden . m    - number of rows
53018a0b0e6bSVictor Minden . n    - number of columns
53028a0b0e6bSVictor Minden . i    - row indices
53038a0b0e6bSVictor Minden . j    - column indices
53041230e6d1SVictor Minden . a    - matrix values
53051230e6d1SVictor Minden . nz   - number of nonzeros
53062ef1f0ffSBarry Smith - idx  - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
53078a0b0e6bSVictor Minden 
53088a0b0e6bSVictor Minden   Output Parameter:
53098a0b0e6bSVictor Minden . mat - the matrix
53108a0b0e6bSVictor Minden 
53118a0b0e6bSVictor Minden   Level: intermediate
53128a0b0e6bSVictor Minden 
5313f62e3866SBarry Smith   Example:
5314f62e3866SBarry Smith   For the following matrix, the input data expected is as shown (using 0 based indexing)
53159e99939fSJunchao Zhang .vb
53168a0b0e6bSVictor Minden         1 0 0
53178a0b0e6bSVictor Minden         2 0 3
53188a0b0e6bSVictor Minden         4 5 6
53198a0b0e6bSVictor Minden 
53208a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
53218a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
53228a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
53239e99939fSJunchao Zhang .ve
5324fe59aa6dSJacob Faibussowitsch 
53252ef1f0ffSBarry Smith   Note:
5326d7547e51SJunchao Zhang   Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5327d7547e51SJunchao Zhang   and are particularly useful in iterative applications.
53288a0b0e6bSVictor Minden 
53291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
53308a0b0e6bSVictor Minden @*/
5331ce78bad3SBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscCount nz, PetscBool idx)
5332d71ae5a4SJacob Faibussowitsch {
5333d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
53348a0b0e6bSVictor Minden 
53358a0b0e6bSVictor Minden   PetscFunctionBegin;
53369566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5337ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
53389566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
53399566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
53409566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
53419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
53421230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
53431230e6d1SVictor Minden     if (idx) {
53441230e6d1SVictor Minden       row = i[ii] - 1;
53451230e6d1SVictor Minden       col = j[ii] - 1;
53461230e6d1SVictor Minden     } else {
53471230e6d1SVictor Minden       row = i[ii];
53481230e6d1SVictor Minden       col = j[ii];
53498a0b0e6bSVictor Minden     }
53509566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
53518a0b0e6bSVictor Minden   }
53529566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
53539566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
53549566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
53553ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53568a0b0e6bSVictor Minden }
535736db0b34SBarry Smith 
5358d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A)
5359d71ae5a4SJacob Faibussowitsch {
5360acf2f550SJed Brown   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
5361acf2f550SJed Brown 
5362acf2f550SJed Brown   PetscFunctionBegin;
5363acf2f550SJed Brown   a->idiagvalid  = PETSC_FALSE;
5364acf2f550SJed Brown   a->ibdiagvalid = PETSC_FALSE;
53652205254eSKarl Rupp 
53669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A));
53673ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5368acf2f550SJed Brown }
5369acf2f550SJed Brown 
5370d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
5371d71ae5a4SJacob Faibussowitsch {
53729c8f2541SHong Zhang   PetscFunctionBegin;
53739566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
53743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53759c8f2541SHong Zhang }
53769c8f2541SHong Zhang 
537781824310SBarry Smith /*
537853dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
537953dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
538053dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
538153dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
538253dd7562SDmitry Karpeev  */
5383d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5384d71ae5a4SJacob Faibussowitsch {
538553dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
538653dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
538753dd7562SDmitry Karpeev   PetscBool       seqaij;
538853dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
538953dd7562SDmitry Karpeev   PetscScalar     v;
539053dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
539153dd7562SDmitry Karpeev 
539253dd7562SDmitry Karpeev   PetscFunctionBegin;
53933ba16761SJacob Faibussowitsch   if (!B) PetscFunctionReturn(PETSC_SUCCESS);
539453dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
53959566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
539628b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
539753dd7562SDmitry Karpeev   if (rowemb) {
53989566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
539908401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
540053dd7562SDmitry Karpeev   } else {
540108401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
540253dd7562SDmitry Karpeev   }
540353dd7562SDmitry Karpeev   if (colemb) {
54049566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
540508401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
540653dd7562SDmitry Karpeev   } else {
540708401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
540853dd7562SDmitry Karpeev   }
540953dd7562SDmitry Karpeev 
5410f4f49eeaSPierre Jolivet   Baij = (Mat_SeqAIJ *)B->data;
541153dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
54129566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5413ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
54149566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
54159566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
541653dd7562SDmitry Karpeev   }
541748a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
541853dd7562SDmitry Karpeev   count      = 0;
541953dd7562SDmitry Karpeev   rowindices = NULL;
542053dd7562SDmitry Karpeev   colindices = NULL;
542148a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
542248a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
542353dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
542453dd7562SDmitry Karpeev     PetscInt row;
542553dd7562SDmitry Karpeev     row = i;
542653dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
542753dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
542853dd7562SDmitry Karpeev       PetscInt col;
542953dd7562SDmitry Karpeev       col = Baij->j[count];
543053dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
543153dd7562SDmitry Karpeev       v = Baij->a[count];
54329566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
543353dd7562SDmitry Karpeev       ++count;
543453dd7562SDmitry Karpeev     }
543553dd7562SDmitry Karpeev   }
543653dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
543753dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
543853dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
543953dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
544053dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
54413ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
544253dd7562SDmitry Karpeev }
544353dd7562SDmitry Karpeev 
544458c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep)
5445dec0b466SHong Zhang {
5446dec0b466SHong Zhang   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
5447dec0b466SHong Zhang   MatScalar  *aa = a->a;
5448dec0b466SHong Zhang   PetscInt    m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k;
5449dec0b466SHong Zhang   PetscInt   *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0;
5450dec0b466SHong Zhang 
5451dec0b466SHong Zhang   PetscFunctionBegin;
5452dec0b466SHong Zhang   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix");
5453dec0b466SHong Zhang   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
5454dec0b466SHong Zhang   for (i = 1; i <= m; i++) {
5455dec0b466SHong Zhang     /* move each nonzero entry back by the amount of zero slots (fshift) before it*/
5456dec0b466SHong Zhang     for (k = ai[i - 1]; k < ai[i]; k++) {
545758c11ad4SPierre Jolivet       if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++;
5458dec0b466SHong Zhang       else {
5459dec0b466SHong Zhang         if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1));
5460dec0b466SHong Zhang         aa[k - fshift] = aa[k];
5461dec0b466SHong Zhang         aj[k - fshift] = aj[k];
5462dec0b466SHong Zhang       }
5463dec0b466SHong Zhang     }
5464dec0b466SHong Zhang     ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration
5465dec0b466SHong Zhang     fshift_prev = fshift;
5466dec0b466SHong Zhang     /* reset ilen and imax for each row */
5467dec0b466SHong Zhang     ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1];
5468dec0b466SHong Zhang     a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0);
5469dec0b466SHong Zhang     rmax = PetscMax(rmax, ailen[i - 1]);
5470dec0b466SHong Zhang   }
5471312eded4SPierre Jolivet   if (fshift) {
5472dec0b466SHong Zhang     if (m) {
5473dec0b466SHong Zhang       ai[m] -= fshift;
5474dec0b466SHong Zhang       a->nz = ai[m];
5475dec0b466SHong Zhang     }
5476dec0b466SHong Zhang     PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz));
5477312eded4SPierre Jolivet     A->nonzerostate++;
5478dec0b466SHong Zhang     A->info.nz_unneeded += (PetscReal)fshift;
5479dec0b466SHong Zhang     a->rmax = rmax;
5480dec0b466SHong Zhang     if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A));
5481dec0b466SHong Zhang     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
5482dec0b466SHong Zhang     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
5483312eded4SPierre Jolivet   }
54843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5485dec0b466SHong Zhang }
5486dec0b466SHong Zhang 
54874099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
54884099cc6bSBarry Smith 
5489cc4c1da9SBarry Smith /*@
549011a5261eSBarry Smith   MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
54914099cc6bSBarry Smith 
5492c3339decSBarry Smith   Collective
54934099cc6bSBarry Smith 
54944099cc6bSBarry Smith   Input Parameters:
54954099cc6bSBarry Smith + mat    - the matrix object
54964099cc6bSBarry Smith - matype - matrix type
54974099cc6bSBarry Smith 
54984099cc6bSBarry Smith   Options Database Key:
54994e187271SRichard Tran Mills . -mat_seqaij_type  <method> - for example seqaijcrl
55004099cc6bSBarry Smith 
55014099cc6bSBarry Smith   Level: intermediate
55024099cc6bSBarry Smith 
5503fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`
55044099cc6bSBarry Smith @*/
5505d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5506d71ae5a4SJacob Faibussowitsch {
55074099cc6bSBarry Smith   PetscBool sametype;
55085f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
55094099cc6bSBarry Smith 
55104099cc6bSBarry Smith   PetscFunctionBegin;
55114099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
55129566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
55133ba16761SJacob Faibussowitsch   if (sametype) PetscFunctionReturn(PETSC_SUCCESS);
55144099cc6bSBarry Smith 
55159566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
55166adde796SStefano Zampini   PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
55179566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
55183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55194099cc6bSBarry Smith }
55204099cc6bSBarry Smith 
55214099cc6bSBarry Smith /*@C
552211a5261eSBarry Smith   MatSeqAIJRegister -  - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices
55234099cc6bSBarry Smith 
5524cc4c1da9SBarry Smith   Not Collective, No Fortran Support
55254099cc6bSBarry Smith 
55264099cc6bSBarry Smith   Input Parameters:
5527fe59aa6dSJacob Faibussowitsch + sname    - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
55284099cc6bSBarry Smith - function - routine to convert to subtype
55294099cc6bSBarry Smith 
55302ef1f0ffSBarry Smith   Level: advanced
55312ef1f0ffSBarry Smith 
55324099cc6bSBarry Smith   Notes:
553311a5261eSBarry Smith   `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers.
55344099cc6bSBarry Smith 
55354099cc6bSBarry Smith   Then, your matrix can be chosen with the procedural interface at runtime via the option
5536*b44f4de4SBarry Smith .vb
5537*b44f4de4SBarry Smith   -mat_seqaij_type my_mat
5538*b44f4de4SBarry Smith .ve
55394099cc6bSBarry Smith 
55401cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()`
55414099cc6bSBarry Smith @*/
5542d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
5543d71ae5a4SJacob Faibussowitsch {
55444099cc6bSBarry Smith   PetscFunctionBegin;
55459566063dSJacob Faibussowitsch   PetscCall(MatInitializePackage());
55469566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
55473ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55484099cc6bSBarry Smith }
55494099cc6bSBarry Smith 
55504099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
55514099cc6bSBarry Smith 
55524099cc6bSBarry Smith /*@C
555311a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
55544099cc6bSBarry Smith 
55554099cc6bSBarry Smith   Not Collective
55564099cc6bSBarry Smith 
55574099cc6bSBarry Smith   Level: advanced
55584099cc6bSBarry Smith 
55592ef1f0ffSBarry Smith   Note:
55602ef1f0ffSBarry Smith   This registers the versions of `MATSEQAIJ` for GPUs
55612ef1f0ffSBarry Smith 
55621cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()`
55634099cc6bSBarry Smith @*/
5564d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5565d71ae5a4SJacob Faibussowitsch {
55664099cc6bSBarry Smith   PetscFunctionBegin;
55673ba16761SJacob Faibussowitsch   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS);
55684099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
55694099cc6bSBarry Smith 
55709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
55719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
55729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
55739779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
55749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5575485f9817SRichard Tran Mills #endif
55765063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
55779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
55785063d097SStefano Zampini #endif
5579d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
5580d5e393b6SSuyash Tandon   PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
5581d5e393b6SSuyash Tandon #endif
55825063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
55839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
55845063d097SStefano Zampini #endif
55854099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
55869566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
55874099cc6bSBarry Smith #endif
55883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55894099cc6bSBarry Smith }
559053dd7562SDmitry Karpeev 
/*
    Special version for direct calls from Fortran
*/
#if defined(PETSC_HAVE_FORTRAN_CAPS)
  #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
#elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
  #define matsetvaluesseqaij_ matsetvaluesseqaij
#endif

/*
   The Fortran entry point below returns void and hands its error code back through a
   PetscErrorCode *_ierr argument, so the error macros are redefined here to store the
   code in *_ierr and then return without a value.
*/

/* Identical to PetscCallVoid, except it assigns to *_ierr */
#undef PetscCall
#define PetscCall(...) \
  do { \
    PetscErrorCode ierr_msv_seqaij = __VA_ARGS__; \
    if (PetscUnlikely(ierr_msv_seqaij)) { \
      *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_seqaij, PETSC_ERROR_REPEAT, " "); \
      return; \
    } \
  } while (0)

/* Raises a new error: the code returned by PetscError() is stored in *_ierr before returning */
#undef SETERRQ
#define SETERRQ(comm, ierr, ...) \
  do { \
    *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
    return; \
  } while (0)
562081824310SBarry Smith 
5621d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5622d71ae5a4SJacob Faibussowitsch {
562381824310SBarry Smith   Mat         A = *AA;
562481824310SBarry Smith   PetscInt    m = *mm, n = *nn;
562581824310SBarry Smith   InsertMode  is = *isis;
562681824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
562781824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
562881824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
562981824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
563054f21887SBarry Smith   MatScalar  *ap, value, *aa;
5631ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5632ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
563381824310SBarry Smith 
563481824310SBarry Smith   PetscFunctionBegin;
56354994cf47SJed Brown   MatCheckPreallocated(A, 1);
563681824310SBarry Smith   imax  = a->imax;
563781824310SBarry Smith   ai    = a->i;
563881824310SBarry Smith   ailen = a->ilen;
563981824310SBarry Smith   aj    = a->j;
564081824310SBarry Smith   aa    = a->a;
564181824310SBarry Smith 
564281824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
564381824310SBarry Smith     row = im[k];
564481824310SBarry Smith     if (row < 0) continue;
56455f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
56469371c9d4SSatish Balay     rp   = aj + ai[row];
56479371c9d4SSatish Balay     ap   = aa + ai[row];
56489371c9d4SSatish Balay     rmax = imax[row];
56499371c9d4SSatish Balay     nrow = ailen[row];
565081824310SBarry Smith     low  = 0;
565181824310SBarry Smith     high = nrow;
565281824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
565381824310SBarry Smith       if (in[l] < 0) continue;
56545f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
565581824310SBarry Smith       col = in[l];
56562205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
56572205254eSKarl Rupp       else value = v[k + l * m];
56582205254eSKarl Rupp 
565981824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
566081824310SBarry Smith 
56612205254eSKarl Rupp       if (col <= lastcol) low = 0;
56622205254eSKarl Rupp       else high = nrow;
566381824310SBarry Smith       lastcol = col;
566481824310SBarry Smith       while (high - low > 5) {
566581824310SBarry Smith         t = (low + high) / 2;
566681824310SBarry Smith         if (rp[t] > col) high = t;
566781824310SBarry Smith         else low = t;
566881824310SBarry Smith       }
566981824310SBarry Smith       for (i = low; i < high; i++) {
567081824310SBarry Smith         if (rp[i] > col) break;
567181824310SBarry Smith         if (rp[i] == col) {
567281824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
567381824310SBarry Smith           else ap[i] = value;
567481824310SBarry Smith           goto noinsert;
567581824310SBarry Smith         }
567681824310SBarry Smith       }
567781824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
567881824310SBarry Smith       if (nonew == 1) goto noinsert;
56795f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5680fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
56819371c9d4SSatish Balay       N = nrow++ - 1;
56829371c9d4SSatish Balay       a->nz++;
56839371c9d4SSatish Balay       high++;
568481824310SBarry Smith       /* shift up all the later entries in this row */
568581824310SBarry Smith       for (ii = N; ii >= i; ii--) {
568681824310SBarry Smith         rp[ii + 1] = rp[ii];
568781824310SBarry Smith         ap[ii + 1] = ap[ii];
568881824310SBarry Smith       }
568981824310SBarry Smith       rp[i] = col;
569081824310SBarry Smith       ap[i] = value;
569181824310SBarry Smith     noinsert:;
569281824310SBarry Smith       low = i + 1;
569381824310SBarry Smith     }
569481824310SBarry Smith     ailen[row] = nrow;
569581824310SBarry Smith   }
569681824310SBarry Smith   PetscFunctionReturnVoid();
569781824310SBarry Smith }
569898921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No
569998921bdaSJacob Faibussowitsch  * other PETSc functions should be defined past this point, as it is impossible to recover the
570098921bdaSJacob Faibussowitsch  * original definitions */
57019566063dSJacob Faibussowitsch #undef PetscCall
570298921bdaSJacob Faibussowitsch #undef SETERRQ
5703