xref: /petsc/src/mat/impls/aij/seq/aij.c (revision ba38deedd2838b0f18e3744cb0bafd6392690fde)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
1226cec326SBarry Smith #define TYPE AIJ
1326cec326SBarry Smith #define TYPE_BS
1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
1626cec326SBarry Smith #undef TYPE
1726cec326SBarry Smith #undef TYPE_BS
1826cec326SBarry Smith 
19*ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
20d71ae5a4SJacob Faibussowitsch {
214099cc6bSBarry Smith   PetscBool flg;
224099cc6bSBarry Smith   char      type[256];
234099cc6bSBarry Smith 
244099cc6bSBarry Smith   PetscFunctionBegin;
25d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
269566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
279566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
28d0609cedSBarry Smith   PetscOptionsEnd();
293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
304099cc6bSBarry Smith }
314099cc6bSBarry Smith 
32*ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
33d71ae5a4SJacob Faibussowitsch {
340716a85fSBarry Smith   PetscInt    i, m, n;
350716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
360716a85fSBarry Smith 
370716a85fSBarry Smith   PetscFunctionBegin;
389566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
399566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
400716a85fSBarry Smith   if (type == NORM_2) {
41ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
420716a85fSBarry Smith   } else if (type == NORM_1) {
43ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
440716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
45ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
46857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
47ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
48857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
49ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
506adde796SStefano Zampini   } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type");
510716a85fSBarry Smith 
520716a85fSBarry Smith   if (type == NORM_2) {
53a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
54857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
55a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
560716a85fSBarry Smith   }
573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
580716a85fSBarry Smith }
590716a85fSBarry Smith 
60*ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
61d71ae5a4SJacob Faibussowitsch {
623a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
633a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
643a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
653a062f41SBarry Smith   PetscInt       *rows;
663a062f41SBarry Smith 
673a062f41SBarry Smith   PetscFunctionBegin;
683a062f41SBarry Smith   for (i = 0; i < m; i++) {
69ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
703a062f41SBarry Smith   }
719566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
723a062f41SBarry Smith   cnt = 0;
733a062f41SBarry Smith   for (i = 0; i < m; i++) {
743a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
753a062f41SBarry Smith       rows[cnt] = i;
763a062f41SBarry Smith       cnt++;
773a062f41SBarry Smith     }
783a062f41SBarry Smith   }
799566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
813a062f41SBarry Smith }
823a062f41SBarry Smith 
83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
84d71ae5a4SJacob Faibussowitsch {
856ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
86fff043a9SJunchao Zhang   const MatScalar *aa;
876ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
88b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
896ce1633cSBarry Smith   PetscInt        *rows;
906ce1633cSBarry Smith 
916ce1633cSBarry Smith   PetscFunctionBegin;
929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
939566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
946ce1633cSBarry Smith   diag = a->diag;
956ce1633cSBarry Smith   for (i = 0; i < m; i++) {
96ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
976ce1633cSBarry Smith   }
989566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
996ce1633cSBarry Smith   cnt = 0;
1006ce1633cSBarry Smith   for (i = 0; i < m; i++) {
101ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
1026ce1633cSBarry Smith   }
103f1f41ecbSJed Brown   *nrows = cnt;
104f1f41ecbSJed Brown   *zrows = rows;
1059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
107f1f41ecbSJed Brown }
108f1f41ecbSJed Brown 
109*ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
110d71ae5a4SJacob Faibussowitsch {
111f1f41ecbSJed Brown   PetscInt nrows, *rows;
112f1f41ecbSJed Brown 
113f1f41ecbSJed Brown   PetscFunctionBegin;
1140298fd71SBarry Smith   *zrows = NULL;
1159566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1169566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1186ce1633cSBarry Smith }
1196ce1633cSBarry Smith 
120*ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
121d71ae5a4SJacob Faibussowitsch {
122b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
123b3a44c85SBarry Smith   const MatScalar *aa;
124b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
125b3a44c85SBarry Smith   const PetscInt  *ii;
126b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
127b3a44c85SBarry Smith 
128b3a44c85SBarry Smith   PetscFunctionBegin;
1299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
130f4259b30SLisandro Dalcin   *keptrows = NULL;
131b3a44c85SBarry Smith   ii        = a->i;
132b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
133b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
134b3a44c85SBarry Smith     if (!n) {
135b3a44c85SBarry Smith       cnt++;
136b3a44c85SBarry Smith       goto ok1;
137b3a44c85SBarry Smith     }
1382e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
139b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
140b3a44c85SBarry Smith     }
141b3a44c85SBarry Smith     cnt++;
142b3a44c85SBarry Smith   ok1:;
143b3a44c85SBarry Smith   }
1442e5835c6SStefano Zampini   if (!cnt) {
1459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1463ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1472e5835c6SStefano Zampini   }
1489566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
149b3a44c85SBarry Smith   cnt = 0;
150b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
151b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
152b3a44c85SBarry Smith     if (!n) continue;
1532e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
154b3a44c85SBarry Smith       if (aa[j] != 0.0) {
155b3a44c85SBarry Smith         rows[cnt++] = i;
156b3a44c85SBarry Smith         break;
157b3a44c85SBarry Smith       }
158b3a44c85SBarry Smith     }
159b3a44c85SBarry Smith   }
1609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1619566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
1623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
163b3a44c85SBarry Smith }
164b3a44c85SBarry Smith 
165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
166d71ae5a4SJacob Faibussowitsch {
16779299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)Y->data;
16899e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16999e65526SBarry Smith   const PetscInt    *diag;
1702e5835c6SStefano Zampini   MatScalar         *aa;
17199e65526SBarry Smith   const PetscScalar *v;
172ace3abfcSBarry Smith   PetscBool          missing;
17379299369SBarry Smith 
17479299369SBarry Smith   PetscFunctionBegin;
17509f38230SBarry Smith   if (Y->assembled) {
1769566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL));
17709f38230SBarry Smith     if (!missing) {
17879299369SBarry Smith       diag = aij->diag;
1799566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1809566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
18179299369SBarry Smith       if (is == INSERT_VALUES) {
182ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
18379299369SBarry Smith       } else {
184ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
18579299369SBarry Smith       }
1869566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1879566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
1883ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
18979299369SBarry Smith     }
1909566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
19109f38230SBarry Smith   }
1929566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
1933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
19409f38230SBarry Smith }
19579299369SBarry Smith 
196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
197d71ae5a4SJacob Faibussowitsch {
198416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19997f1f81fSBarry Smith   PetscInt    i, ishift;
20017ab2063SBarry Smith 
2013a40ed3dSBarry Smith   PetscFunctionBegin;
202f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
2033ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
204bfeeae90SHong Zhang   ishift = 0;
205b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
2069566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
207bfeeae90SHong Zhang   } else if (oshift == 1) {
2081a83f524SJed Brown     PetscInt *tia;
209d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2103b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2119566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2121a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2131a83f524SJed Brown     *ia = tia;
214ecc77c7aSBarry Smith     if (ja) {
2151a83f524SJed Brown       PetscInt *tja;
2169566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2171a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2181a83f524SJed Brown       *ja = tja;
219ecc77c7aSBarry Smith     }
2206945ee14SBarry Smith   } else {
221ecc77c7aSBarry Smith     *ia = a->i;
222ecc77c7aSBarry Smith     if (ja) *ja = a->j;
223a2ce50c7SBarry Smith   }
2243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225a2744918SBarry Smith }
226a2744918SBarry Smith 
227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
228d71ae5a4SJacob Faibussowitsch {
2293a40ed3dSBarry Smith   PetscFunctionBegin;
2303ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
231b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2329566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2339566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
234bcd2baecSBarry Smith   }
2353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23617ab2063SBarry Smith }
23717ab2063SBarry Smith 
238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
239d71ae5a4SJacob Faibussowitsch {
2403b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
241d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
24297f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2433b2fbd54SBarry Smith 
2443a40ed3dSBarry Smith   PetscFunctionBegin;
245899cda47SBarry Smith   *nn = n;
2463ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2473b2fbd54SBarry Smith   if (symmetric) {
2489566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2493b2fbd54SBarry Smith   } else {
2509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2533b2fbd54SBarry Smith     jj = a->j;
254ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2553b2fbd54SBarry Smith     cia[0] = oshift;
256ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2579566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2583b2fbd54SBarry Smith     jj = a->j;
259a93ec695SBarry Smith     for (row = 0; row < m; row++) {
260a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
261a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
262bfeeae90SHong Zhang         col = *jj++;
2632205254eSKarl Rupp 
2643b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2653b2fbd54SBarry Smith       }
2663b2fbd54SBarry Smith     }
2679566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2689371c9d4SSatish Balay     *ia = cia;
2699371c9d4SSatish Balay     *ja = cja;
2703b2fbd54SBarry Smith   }
2713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2723b2fbd54SBarry Smith }
2733b2fbd54SBarry Smith 
274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
275d71ae5a4SJacob Faibussowitsch {
2763a40ed3dSBarry Smith   PetscFunctionBegin;
2773ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2783b2fbd54SBarry Smith 
2799566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2809566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2823b2fbd54SBarry Smith }
2833b2fbd54SBarry Smith 
2847cee066cSHong Zhang /*
2857cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2867cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
287040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2887cee066cSHong Zhang */
289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
290d71ae5a4SJacob Faibussowitsch {
2917cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2927cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
293071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2947cee066cSHong Zhang   PetscInt       *cspidx;
295071fcb05SBarry Smith   const PetscInt *jj;
2967cee066cSHong Zhang 
2977cee066cSHong Zhang   PetscFunctionBegin;
2987cee066cSHong Zhang   *nn = n;
2993ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
300625f6d37SHong Zhang 
3019566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
3029566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
3039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
3049566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
3057cee066cSHong Zhang   jj = a->j;
306ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
3077cee066cSHong Zhang   cia[0] = oshift;
308ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3099566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3107cee066cSHong Zhang   jj = a->j;
3117cee066cSHong Zhang   for (row = 0; row < m; row++) {
3127cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3137cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3147cee066cSHong Zhang       col         = *jj++;
315071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
316071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
317071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3187cee066cSHong Zhang     }
3197cee066cSHong Zhang   }
3209566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
321071fcb05SBarry Smith   *ia    = cia;
322071fcb05SBarry Smith   *ja    = cja;
3237cee066cSHong Zhang   *spidx = cspidx;
3243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3257cee066cSHong Zhang }
3267cee066cSHong Zhang 
327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
328d71ae5a4SJacob Faibussowitsch {
3297cee066cSHong Zhang   PetscFunctionBegin;
3309566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3319566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3337cee066cSHong Zhang }
3347cee066cSHong Zhang 
335*ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
336d71ae5a4SJacob Faibussowitsch {
33787d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33887d4246cSBarry Smith   PetscInt    *ai = a->i;
339fff043a9SJunchao Zhang   PetscScalar *aa;
34087d4246cSBarry Smith 
34187d4246cSBarry Smith   PetscFunctionBegin;
3429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3439566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34687d4246cSBarry Smith }
34787d4246cSBarry Smith 
348bd04181cSBarry Smith /*
349bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
350bd04181cSBarry Smith 
351bd04181cSBarry Smith       -   a single row of values is set with each call
352bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
353bd04181cSBarry Smith       -   the values are always added to the matrix, not set
354bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
355bd04181cSBarry Smith 
3561f763a69SBarry Smith      This does NOT assume the global column indices are sorted
357bd04181cSBarry Smith 
3581f763a69SBarry Smith */
359bd04181cSBarry Smith 
360af0996ceSBarry Smith #include <petsc/private/isimpl.h>
361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
362d71ae5a4SJacob Faibussowitsch {
363189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3641f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3651f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3661f763a69SBarry Smith   PetscInt        lastcol = -1;
367fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
368189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
369189e4007SBarry Smith 
370fff043a9SJunchao Zhang   PetscFunctionBegin;
3719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
372f38dd0b8SBarry Smith   row  = ridx[im[0]];
3731f763a69SBarry Smith   rp   = aj + ai[row];
3741f763a69SBarry Smith   ap   = aa + ai[row];
3751f763a69SBarry Smith   nrow = ailen[row];
376189e4007SBarry Smith   low  = 0;
377189e4007SBarry Smith   high = nrow;
378189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
379189e4007SBarry Smith     col   = cidx[in[l]];
380f38dd0b8SBarry Smith     value = v[l];
381189e4007SBarry Smith 
382189e4007SBarry Smith     if (col <= lastcol) low = 0;
383189e4007SBarry Smith     else high = nrow;
384189e4007SBarry Smith     lastcol = col;
385189e4007SBarry Smith     while (high - low > 5) {
386189e4007SBarry Smith       t = (low + high) / 2;
387189e4007SBarry Smith       if (rp[t] > col) high = t;
388189e4007SBarry Smith       else low = t;
389189e4007SBarry Smith     }
390189e4007SBarry Smith     for (i = low; i < high; i++) {
391189e4007SBarry Smith       if (rp[i] == col) {
3921f763a69SBarry Smith         ap[i] += value;
393189e4007SBarry Smith         low = i + 1;
3941f763a69SBarry Smith         break;
395189e4007SBarry Smith       }
396189e4007SBarry Smith     }
397189e4007SBarry Smith   }
3989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3993ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
400189e4007SBarry Smith }
401189e4007SBarry Smith 
402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
403d71ae5a4SJacob Faibussowitsch {
404416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
405e2ee6c50SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
40697f1f81fSBarry Smith   PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
407e2ee6c50SBarry Smith   PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1;
408ce496241SStefano Zampini   MatScalar  *ap = NULL, value = 0.0, *aa;
409ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
410ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
41117ab2063SBarry Smith 
4123a40ed3dSBarry Smith   PetscFunctionBegin;
4139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
41417ab2063SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
415416022c9SBarry Smith     row = im[k];
4165ef9f2a5SBarry Smith     if (row < 0) continue;
4176bdcaf15SBarry Smith     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
418720833daSHong Zhang     rp = aj + ai[row];
419876c6284SHong Zhang     if (!A->structure_only) ap = aa + ai[row];
4209371c9d4SSatish Balay     rmax = imax[row];
4219371c9d4SSatish Balay     nrow = ailen[row];
422416022c9SBarry Smith     low  = 0;
423c71e6ed7SBarry Smith     high = nrow;
42417ab2063SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
4255ef9f2a5SBarry Smith       if (in[l] < 0) continue;
4266bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
427bfeeae90SHong Zhang       col = in[l];
428071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
429071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
43036db0b34SBarry Smith 
4312205254eSKarl Rupp       if (col <= lastcol) low = 0;
4322205254eSKarl Rupp       else high = nrow;
433e2ee6c50SBarry Smith       lastcol = col;
434416022c9SBarry Smith       while (high - low > 5) {
435416022c9SBarry Smith         t = (low + high) / 2;
436416022c9SBarry Smith         if (rp[t] > col) high = t;
437416022c9SBarry Smith         else low = t;
43817ab2063SBarry Smith       }
439416022c9SBarry Smith       for (i = low; i < high; i++) {
44017ab2063SBarry Smith         if (rp[i] > col) break;
44117ab2063SBarry Smith         if (rp[i] == col) {
442876c6284SHong Zhang           if (!A->structure_only) {
4430c0d7e18SFande Kong             if (is == ADD_VALUES) {
4440c0d7e18SFande Kong               ap[i] += value;
4450c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4469371c9d4SSatish Balay             } else ap[i] = value;
447720833daSHong Zhang           }
448e44c0bd4SBarry Smith           low = i + 1;
44917ab2063SBarry Smith           goto noinsert;
45017ab2063SBarry Smith         }
45117ab2063SBarry Smith       }
452dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
453c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
45408401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
455720833daSHong Zhang       if (A->structure_only) {
456876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
457720833daSHong Zhang       } else {
458fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
459720833daSHong Zhang       }
4609371c9d4SSatish Balay       N = nrow++ - 1;
4619371c9d4SSatish Balay       a->nz++;
4629371c9d4SSatish Balay       high++;
463416022c9SBarry Smith       /* shift up all the later entries in this row */
4649566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
46517ab2063SBarry Smith       rp[i] = col;
466580bdb30SBarry Smith       if (!A->structure_only) {
4679566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
468580bdb30SBarry Smith         ap[i] = value;
469580bdb30SBarry Smith       }
470416022c9SBarry Smith       low = i + 1;
471e56f5c9eSBarry Smith       A->nonzerostate++;
472e44c0bd4SBarry Smith     noinsert:;
47317ab2063SBarry Smith     }
47417ab2063SBarry Smith     ailen[row] = nrow;
47517ab2063SBarry Smith   }
4769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
4773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
47817ab2063SBarry Smith }
47917ab2063SBarry Smith 
480*ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
481d71ae5a4SJacob Faibussowitsch {
48219b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
48319b08ed1SBarry Smith   PetscInt   *rp, k, row;
48419b08ed1SBarry Smith   PetscInt   *ai = a->i;
48519b08ed1SBarry Smith   PetscInt   *aj = a->j;
486fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
48719b08ed1SBarry Smith 
48819b08ed1SBarry Smith   PetscFunctionBegin;
48928b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
49008401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
491fff043a9SJunchao Zhang 
4929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
49319b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
49419b08ed1SBarry Smith     row = im[k];
49519b08ed1SBarry Smith     rp  = aj + ai[row];
49619b08ed1SBarry Smith     ap  = aa + ai[row];
49719b08ed1SBarry Smith 
4989566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
49919b08ed1SBarry Smith     if (!A->structure_only) {
50019b08ed1SBarry Smith       if (v) {
5019566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
50219b08ed1SBarry Smith         v += n;
50319b08ed1SBarry Smith       } else {
5049566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
50519b08ed1SBarry Smith       }
50619b08ed1SBarry Smith     }
50719b08ed1SBarry Smith     a->ilen[row]  = n;
50819b08ed1SBarry Smith     a->imax[row]  = n;
50919b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
51019b08ed1SBarry Smith     a->nz += n;
51119b08ed1SBarry Smith   }
5129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51419b08ed1SBarry Smith }
51519b08ed1SBarry Smith 
51619b08ed1SBarry Smith /*@
51719b08ed1SBarry Smith   MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51819b08ed1SBarry Smith 
51919b08ed1SBarry Smith   Input Parameters:
52011a5261eSBarry Smith + A       - the `MATSEQAIJ` matrix
52119b08ed1SBarry Smith - nztotal - bound on the number of nonzeros
52219b08ed1SBarry Smith 
52319b08ed1SBarry Smith   Level: advanced
52419b08ed1SBarry Smith 
52519b08ed1SBarry Smith   Notes:
52619b08ed1SBarry Smith   This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
52711a5261eSBarry Smith   Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52819b08ed1SBarry Smith   as always with multiple matrix assemblies.
52919b08ed1SBarry Smith 
5301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
53119b08ed1SBarry Smith @*/
532d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
533d71ae5a4SJacob Faibussowitsch {
53419b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
53519b08ed1SBarry Smith 
53619b08ed1SBarry Smith   PetscFunctionBegin;
5379566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5389566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
53919b08ed1SBarry Smith   a->maxnz = nztotal;
5404dfa11a4SJacob Faibussowitsch   if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); }
54119b08ed1SBarry Smith   if (!a->ilen) {
5429566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
54319b08ed1SBarry Smith   } else {
5449566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
54519b08ed1SBarry Smith   }
54619b08ed1SBarry Smith 
54719b08ed1SBarry Smith   /* allocate the matrix space */
54819b08ed1SBarry Smith   if (A->structure_only) {
5499566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nztotal, &a->j));
5509566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i));
55119b08ed1SBarry Smith   } else {
5529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i));
55319b08ed1SBarry Smith   }
55419b08ed1SBarry Smith   a->i[0] = 0;
55519b08ed1SBarry Smith   if (A->structure_only) {
55619b08ed1SBarry Smith     a->singlemalloc = PETSC_FALSE;
55719b08ed1SBarry Smith     a->free_a       = PETSC_FALSE;
55819b08ed1SBarry Smith   } else {
55919b08ed1SBarry Smith     a->singlemalloc = PETSC_TRUE;
56019b08ed1SBarry Smith     a->free_a       = PETSC_TRUE;
56119b08ed1SBarry Smith   }
56219b08ed1SBarry Smith   a->free_ij        = PETSC_TRUE;
56319b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
56419b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
5653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
56619b08ed1SBarry Smith }
56719b08ed1SBarry Smith 
568*ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
569d71ae5a4SJacob Faibussowitsch {
570071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
571071fcb05SBarry Smith   PetscInt   *rp, k, row;
572071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
573071fcb05SBarry Smith   PetscInt   *aj = a->j;
574fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
575071fcb05SBarry Smith 
576071fcb05SBarry Smith   PetscFunctionBegin;
5779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
578071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
579071fcb05SBarry Smith     row = im[k];
5806bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
581071fcb05SBarry Smith     rp = aj + ai[row];
582071fcb05SBarry Smith     ap = aa + ai[row];
58348a46eb9SPierre Jolivet     if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
584071fcb05SBarry Smith     if (!A->structure_only) {
585071fcb05SBarry Smith       if (v) {
5869566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
587071fcb05SBarry Smith         v += n;
588071fcb05SBarry Smith       } else {
5899566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
590071fcb05SBarry Smith       }
591071fcb05SBarry Smith     }
592071fcb05SBarry Smith     ailen[row] = n;
593071fcb05SBarry Smith     a->nz += n;
594071fcb05SBarry Smith   }
5959566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
597071fcb05SBarry Smith }
598071fcb05SBarry Smith 
599*ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
600d71ae5a4SJacob Faibussowitsch {
6017eb43aa7SLois Curfman McInnes   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
60297f1f81fSBarry Smith   PetscInt        *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
60397f1f81fSBarry Smith   PetscInt        *ai = a->i, *ailen = a->ilen;
6044e208921SJed Brown   const MatScalar *ap, *aa;
6057eb43aa7SLois Curfman McInnes 
6063a40ed3dSBarry Smith   PetscFunctionBegin;
6074e208921SJed Brown   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
6087eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6097eb43aa7SLois Curfman McInnes     row = im[k];
6109371c9d4SSatish Balay     if (row < 0) {
6119371c9d4SSatish Balay       v += n;
6129371c9d4SSatish Balay       continue;
6139371c9d4SSatish Balay     } /* negative row */
61454c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6159371c9d4SSatish Balay     rp   = aj + ai[row];
6169371c9d4SSatish Balay     ap   = aa + ai[row];
6177eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6187eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6199371c9d4SSatish Balay       if (in[l] < 0) {
6209371c9d4SSatish Balay         v++;
6219371c9d4SSatish Balay         continue;
6229371c9d4SSatish Balay       } /* negative column */
62354c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
624bfeeae90SHong Zhang       col  = in[l];
6259371c9d4SSatish Balay       high = nrow;
6269371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6277eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6287eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6297eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6307eb43aa7SLois Curfman McInnes         else low = t;
6317eb43aa7SLois Curfman McInnes       }
6327eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6337eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6347eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
635b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6367eb43aa7SLois Curfman McInnes           goto finished;
6377eb43aa7SLois Curfman McInnes         }
6387eb43aa7SLois Curfman McInnes       }
63997e567efSBarry Smith       *v++ = 0.0;
6407eb43aa7SLois Curfman McInnes     finished:;
6417eb43aa7SLois Curfman McInnes     }
6427eb43aa7SLois Curfman McInnes   }
6434e208921SJed Brown   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
6443ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6457eb43aa7SLois Curfman McInnes }
6467eb43aa7SLois Curfman McInnes 
647*ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
648d71ae5a4SJacob Faibussowitsch {
6493ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
650c898d852SStefano Zampini   const PetscScalar *av;
6513ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6523ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
65317ab2063SBarry Smith 
6543a40ed3dSBarry Smith   PetscFunctionBegin;
6559566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6562205254eSKarl Rupp 
6573ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6583ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6593ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6603ea6fe3dSLisandro Dalcin   nz = A->nz;
661416022c9SBarry Smith 
6623ea6fe3dSLisandro Dalcin   /* write matrix header */
6633ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6649371c9d4SSatish Balay   header[1] = M;
6659371c9d4SSatish Balay   header[2] = N;
6669371c9d4SSatish Balay   header[3] = nz;
6679566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
668416022c9SBarry Smith 
6693ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6709566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6713ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
6729566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6739566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6743ea6fe3dSLisandro Dalcin   /* store column indices */
6759566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
676416022c9SBarry Smith   /* store nonzero values */
6779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6789566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
680b37d52dbSMark F. Adams 
6813ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6829566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6833ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
68417ab2063SBarry Smith }
685416022c9SBarry Smith 
686d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
687d71ae5a4SJacob Faibussowitsch {
6887dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6897dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6907dc0baabSHong Zhang 
6917dc0baabSHong Zhang   PetscFunctionBegin;
6929566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6937dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6949566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
69548a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6969566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6977dc0baabSHong Zhang   }
6989566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
6993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
7007dc0baabSHong Zhang }
7017dc0baabSHong Zhang 
70209573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer);
703cd155464SBarry Smith 
/*
  MatView_SeqAIJ_ASCII - Prints the matrix to an ASCII viewer in the layout selected by the viewer's format.

  Structure-only matrices are handed to MatView_SeqAIJ_ASCII_structonly(). Nothing is printed here for the
  PETSC_VIEWER_ASCII_FACTOR_INFO, PETSC_VIEWER_ASCII_INFO and PETSC_VIEWER_ASCII_INFO_DETAIL formats.
  Otherwise the format selects one of the following branches:
    PETSC_VIEWER_ASCII_MATLAB       - 1-based (row, column, value) triplets followed by a spconvert() call
    PETSC_VIEWER_ASCII_COMMON       - per-row "(column, value)" listing that omits entries equal to zero
                                      (in complex builds: entries whose real part is zero)
    PETSC_VIEWER_ASCII_SYMMODU      - entries with column >= row: counts, row pointers, 1-based columns, values
    PETSC_VIEWER_ASCII_DENSE        - every location of every row, zeros included
    PETSC_VIEWER_ASCII_MATRIXMARKET - MatrixMarket coordinate header and 1-based triplets
    anything else                   - per-row "(column, value)" listing, with a separate branch when
                                      A->factortype is set

  Every branch disables the viewer's tab handling while it prints and re-enables it afterwards; the viewer
  is flushed at the end.
*/
704*ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
705d71ae5a4SJacob Faibussowitsch {
706416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
707c898d852SStefano Zampini   const PetscScalar *av;
70860e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
709e060cb09SBarry Smith   const char        *name;
710f3ef73ceSBarry Smith   PetscViewerFormat  format;
71117ab2063SBarry Smith 
7123a40ed3dSBarry Smith   PetscFunctionBegin;
7137dc0baabSHong Zhang   if (A->structure_only) {
7149566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7153ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
7167dc0baabSHong Zhang   }
71743e49210SHong Zhang 
7189566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
  /* the info-style formats produce no output in this routine */
7193ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
7202e5835c6SStefano Zampini 
721c898d852SStefano Zampini   /* trigger copy to CPU if needed */
7229566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
  /* av is not used below; the values are read through a->a */
72471c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
72597f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
    /* set when the last row is empty or the last stored column index is not the final column */
72660e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
727c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
728d00d2cf4SBarry Smith       nofinalvalue = 1;
729d00d2cf4SBarry Smith     }
7309566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7319566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7329566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
733fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7349566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
735fbfe6fa7SJed Brown #else
7369566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
737fbfe6fa7SJed Brown #endif
7389566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
73917ab2063SBarry Smith 
    /* one line per stored entry, with row and column shifted to 1-based numbering */
74017ab2063SBarry Smith     for (i = 0; i < m; i++) {
74160e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
742aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7439566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
74417ab2063SBarry Smith #else
7459566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
74617ab2063SBarry Smith #endif
74717ab2063SBarry Smith       }
74817ab2063SBarry Smith     }
    /* the dummy entry: a zero at 1-based position (m, number of columns) */
749d00d2cf4SBarry Smith     if (nofinalvalue) {
750c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7519566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
752c337ccceSJed Brown #else
7539566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
754c337ccceSJed Brown #endif
755d00d2cf4SBarry Smith     }
7569566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7579566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7589566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
759fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
7609566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
76144cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7629566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
76360e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
764aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
        /* all three cases require a nonzero real part, so an entry with zero real part prints nothing */
76536db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7669566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76736db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7689566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
76936db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7709566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7716831982aSBarry Smith         }
77244cd7ae7SLois Curfman McInnes #else
7739566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
77444cd7ae7SLois Curfman McInnes #endif
77544cd7ae7SLois Curfman McInnes       }
7769566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77744cd7ae7SLois Curfman McInnes     }
7789566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
779fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
78097f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7819566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7829566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
    /* nzd counts the nonzero entries with column >= row; sptr[i] is the 1-based running count at the start of row i */
783496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
784496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
78560e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
786496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
787aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78836db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
789496be53dSLois Curfman McInnes #else
790496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
791496be53dSLois Curfman McInnes #endif
792496be53dSLois Curfman McInnes         }
793496be53dSLois Curfman McInnes       }
794496be53dSLois Curfman McInnes     }
7952e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7969566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
    /* print the m + 1 entries of sptr six per line; the else-if chain handles the shorter final line */
7972e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7982205254eSKarl Rupp       if (i + 4 < m) {
7999566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
8002205254eSKarl Rupp       } else if (i + 3 < m) {
8019566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
8022205254eSKarl Rupp       } else if (i + 2 < m) {
8039566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
8042205254eSKarl Rupp       } else if (i + 1 < m) {
8059566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
8062205254eSKarl Rupp       } else if (i < m) {
8079566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8082205254eSKarl Rupp       } else {
8099566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8102205254eSKarl Rupp       }
811496be53dSLois Curfman McInnes     }
8129566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8139566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
    /* column indices (shifted by fshift) of all stored entries with column >= row; no test on the value is made here */
814496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81560e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8169566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
817496be53dSLois Curfman McInnes       }
8189566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
819496be53dSLois Curfman McInnes     }
8209566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
    /* values of the nonzero entries with column >= row */
821496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
82260e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
823496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
824aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
82548a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
826496be53dSLois Curfman McInnes #else
8279566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
828496be53dSLois Curfman McInnes #endif
829496be53dSLois Curfman McInnes         }
830496be53dSLois Curfman McInnes       }
8319566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
832496be53dSLois Curfman McInnes     }
8339566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
834fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
    /* cnt indexes the next stored entry over the whole matrix; jcnt counts the entries of row i consumed so far */
83597f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
83687828ca2SBarry Smith     PetscScalar value;
83768f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83868f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
83968f1ed48SBarry Smith 
    /* if no stored value has an imaginary part, only the real parts are printed */
84068f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
84168f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
84268f1ed48SBarry Smith         realonly = PETSC_FALSE;
84368f1ed48SBarry Smith         break;
84468f1ed48SBarry Smith       }
84568f1ed48SBarry Smith     }
84668f1ed48SBarry Smith #endif
84702594712SBarry Smith 
8489566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
84902594712SBarry Smith     for (i = 0; i < m; i++) {
85002594712SBarry Smith       jcnt = 0;
851d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
        /* take the stored value when column j matches the next unconsumed entry of this row, otherwise print zero */
852e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
85302594712SBarry Smith           value = a->a[cnt++];
854e24b481bSBarry Smith           jcnt++;
85502594712SBarry Smith         } else {
85602594712SBarry Smith           value = 0.0;
85702594712SBarry Smith         }
858aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
85968f1ed48SBarry Smith         if (realonly) {
8609566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
86168f1ed48SBarry Smith         } else {
8629566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
86368f1ed48SBarry Smith         }
86402594712SBarry Smith #else
8659566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
86602594712SBarry Smith #endif
86702594712SBarry Smith       }
8689566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
86902594712SBarry Smith     }
8709566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8713c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
    /* fshift converts the 0-based row and column numbers to 1-based */
872150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8739566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8743c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8759566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8763c215bfdSMatthew Knepley #else
8779566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8783c215bfdSMatthew Knepley #endif
8799566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8803c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
88160e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8823c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8839566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8843c215bfdSMatthew Knepley #else
8859566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8863c215bfdSMatthew Knepley #endif
8873c215bfdSMatthew Knepley       }
8883c215bfdSMatthew Knepley     }
8899566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8903a40ed3dSBarry Smith   } else {
    /* default layout: "row i:" followed by "(column, value)" pairs */
8919566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
892d5f3da31SBarry Smith     if (A->factortype) {
      /* factored matrix: each row is printed as the entries in a->i[i]..a->i[i+1], then the entry at a->diag[i], then the U entries */
89316cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8949566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
89516cd7e1dSShri Abhyankar         /* L part */
89660e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89716cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
89816cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
8999566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
90016cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9019566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
90216cd7e1dSShri Abhyankar           } else {
9039566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
90416cd7e1dSShri Abhyankar           }
90516cd7e1dSShri Abhyankar #else
9069566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90716cd7e1dSShri Abhyankar #endif
90816cd7e1dSShri Abhyankar         }
90916cd7e1dSShri Abhyankar         /* diagonal */
        /* the reciprocal of the stored diagonal value is what gets printed */
91016cd7e1dSShri Abhyankar         j = a->diag[i];
91116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
91216cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
9139566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j])));
91416cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9159566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j]))));
91616cd7e1dSShri Abhyankar         } else {
9179566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j])));
91816cd7e1dSShri Abhyankar         }
91916cd7e1dSShri Abhyankar #else
9209566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j])));
92116cd7e1dSShri Abhyankar #endif
92216cd7e1dSShri Abhyankar 
92316cd7e1dSShri Abhyankar         /* U part */
        /* the U entries of row i occupy positions a->diag[i + 1] + 1 up to, but not including, a->diag[i] */
92460e0710aSBarry Smith         for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
92516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
92616cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9279566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
92816cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9299566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
93016cd7e1dSShri Abhyankar           } else {
9319566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
93216cd7e1dSShri Abhyankar           }
93316cd7e1dSShri Abhyankar #else
9349566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
93516cd7e1dSShri Abhyankar #endif
93616cd7e1dSShri Abhyankar         }
9379566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
93816cd7e1dSShri Abhyankar       }
93916cd7e1dSShri Abhyankar     } else {
      /* unfactored matrix: every stored entry of the row is printed, zeros included */
94017ab2063SBarry Smith       for (i = 0; i < m; i++) {
9419566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
94260e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
943aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
94436db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9459566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
94636db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9479566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9483a40ed3dSBarry Smith           } else {
9499566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
95017ab2063SBarry Smith           }
95117ab2063SBarry Smith #else
9529566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
95317ab2063SBarry Smith #endif
95417ab2063SBarry Smith         }
9559566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
95617ab2063SBarry Smith       }
95716cd7e1dSShri Abhyankar     }
9589566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
95917ab2063SBarry Smith   }
9609566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
962416022c9SBarry Smith }
963416022c9SBarry Smith 
9649804daf3SBarry Smith #include <petscdraw.h>
965*ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
966d71ae5a4SJacob Faibussowitsch {
967480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
968416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
969383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
970383922c3SLisandro Dalcin   int                color;
971b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
972b0a32e0cSBarry Smith   PetscViewer        viewer;
973f3ef73ceSBarry Smith   PetscViewerFormat  format;
974fff043a9SJunchao Zhang   const PetscScalar *aa;
975cddf8d76SBarry Smith 
9763a40ed3dSBarry Smith   PetscFunctionBegin;
9779566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9789566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9799566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
980383922c3SLisandro Dalcin 
981416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9829566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
983fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
984d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9850513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
986b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
987416022c9SBarry Smith     for (i = 0; i < m; i++) {
9889371c9d4SSatish Balay       y_l = m - i - 1.0;
9899371c9d4SSatish Balay       y_r = y_l + 1.0;
990bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9919371c9d4SSatish Balay         x_l = a->j[j];
9929371c9d4SSatish Balay         x_r = x_l + 1.0;
993fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9949566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
995cddf8d76SBarry Smith       }
996cddf8d76SBarry Smith     }
997b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
998cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
9999371c9d4SSatish Balay       y_l = m - i - 1.0;
10009371c9d4SSatish Balay       y_r = y_l + 1.0;
1001bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10029371c9d4SSatish Balay         x_l = a->j[j];
10039371c9d4SSatish Balay         x_r = x_l + 1.0;
1004fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
10059566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1006cddf8d76SBarry Smith       }
1007cddf8d76SBarry Smith     }
1008b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1009cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10109371c9d4SSatish Balay       y_l = m - i - 1.0;
10119371c9d4SSatish Balay       y_r = y_l + 1.0;
1012bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10139371c9d4SSatish Balay         x_l = a->j[j];
10149371c9d4SSatish Balay         x_r = x_l + 1.0;
1015fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10169566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1017416022c9SBarry Smith       }
1018416022c9SBarry Smith     }
1019d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10200513a670SBarry Smith   } else {
10210513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10220513a670SBarry Smith     /* first determine max of all nonzero values */
1023b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1024383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1025b0a32e0cSBarry Smith     PetscDraw popup;
10260513a670SBarry Smith 
10270513a670SBarry Smith     for (i = 0; i < nz; i++) {
1028fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10290513a670SBarry Smith     }
1030383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10319566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10329566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1033383922c3SLisandro Dalcin 
1034d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10350513a670SBarry Smith     for (i = 0; i < m; i++) {
1036383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1037383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1038bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1039383922c3SLisandro Dalcin         x_l   = a->j[j];
1040383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1041fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10429566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10430513a670SBarry Smith         count++;
10440513a670SBarry Smith       }
10450513a670SBarry Smith     }
1046d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10470513a670SBarry Smith   }
10489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
10493ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1050480ef9eaSBarry Smith }
1051cddf8d76SBarry Smith 
10529804daf3SBarry Smith #include <petscdraw.h>
1053*ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1054d71ae5a4SJacob Faibussowitsch {
1055b0a32e0cSBarry Smith   PetscDraw draw;
105636db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1057ace3abfcSBarry Smith   PetscBool isnull;
1058480ef9eaSBarry Smith 
1059480ef9eaSBarry Smith   PetscFunctionBegin;
10609566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10619566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
10623ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
1063480ef9eaSBarry Smith 
10649371c9d4SSatish Balay   xr = A->cmap->n;
10659371c9d4SSatish Balay   yr = A->rmap->n;
10669371c9d4SSatish Balay   h  = yr / 10.0;
10679371c9d4SSatish Balay   w  = xr / 10.0;
10689371c9d4SSatish Balay   xr += w;
10699371c9d4SSatish Balay   yr += h;
10709371c9d4SSatish Balay   xl = -w;
10719371c9d4SSatish Balay   yl = -h;
10729566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10739566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10749566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10759566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10769566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1078416022c9SBarry Smith }
1079416022c9SBarry Smith 
1080d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1081d71ae5a4SJacob Faibussowitsch {
1082ace3abfcSBarry Smith   PetscBool iascii, isbinary, isdraw;
1083416022c9SBarry Smith 
10843a40ed3dSBarry Smith   PetscFunctionBegin;
10859566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii));
10869566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10879566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10881baa6e33SBarry Smith   if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10891baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10901baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10919566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
109317ab2063SBarry Smith }
109419bcc07fSBarry Smith 
1095d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1096d71ae5a4SJacob Faibussowitsch {
1097416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1098580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
1099d0f46423SBarry Smith   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0;
110054f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
11013447b6efSHong Zhang   PetscReal   ratio = 0.6;
110217ab2063SBarry Smith 
11033a40ed3dSBarry Smith   PetscFunctionBegin;
11043ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
11059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
1106b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
1107b215bc84SStefano Zampini     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */
11089566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11093ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1110b215bc84SStefano Zampini   }
111117ab2063SBarry Smith 
111243ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
111317ab2063SBarry Smith   for (i = 1; i < m; i++) {
1114416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
111517ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
111694a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111717ab2063SBarry Smith     if (fshift) {
1118bfeeae90SHong Zhang       ip = aj + ai[i];
1119bfeeae90SHong Zhang       ap = aa + ai[i];
112017ab2063SBarry Smith       N  = ailen[i];
11219566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
112248a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
112317ab2063SBarry Smith     }
112417ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
112517ab2063SBarry Smith   }
112617ab2063SBarry Smith   if (m) {
112717ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112817ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
112917ab2063SBarry Smith   }
113017ab2063SBarry Smith   /* reset ilen and imax for each row */
11317b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1132396832f4SHong Zhang   if (A->structure_only) {
11339566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11349566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1135396832f4SHong Zhang   } else { /* !A->structure_only */
113617ab2063SBarry Smith     for (i = 0; i < m; i++) {
113717ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11387b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
113917ab2063SBarry Smith     }
1140396832f4SHong Zhang   }
1141bfeeae90SHong Zhang   a->nz = ai[m];
1142aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
114317ab2063SBarry Smith 
11449566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
11459566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11469566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11479566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11482205254eSKarl Rupp 
11498e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1150dd5f02e7SSatish Balay   a->reallocs         = 0;
11516712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
115236db0b34SBarry Smith   a->rmax             = rmax;
11534e220ebcSLois Curfman McInnes 
115448a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11559566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
115717ab2063SBarry Smith }
115817ab2063SBarry Smith 
1159*ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1160d71ae5a4SJacob Faibussowitsch {
116199cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
116299cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11632e5835c6SStefano Zampini   MatScalar  *aa;
116499cafbc1SBarry Smith 
116599cafbc1SBarry Smith   PetscFunctionBegin;
11669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
116799cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
117199cafbc1SBarry Smith }
117299cafbc1SBarry Smith 
1173*ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1174d71ae5a4SJacob Faibussowitsch {
117599cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
117699cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11772e5835c6SStefano Zampini   MatScalar  *aa;
117899cafbc1SBarry Smith 
117999cafbc1SBarry Smith   PetscFunctionBegin;
11809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
118199cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11829566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
118599cafbc1SBarry Smith }
118699cafbc1SBarry Smith 
1187d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1188d71ae5a4SJacob Faibussowitsch {
1189fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1190fff043a9SJunchao Zhang   MatScalar  *aa;
11913a40ed3dSBarry Smith 
11923a40ed3dSBarry Smith   PetscFunctionBegin;
11939566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
11949566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
11959566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
11969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
119817ab2063SBarry Smith }
1199416022c9SBarry Smith 
1200d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1201d71ae5a4SJacob Faibussowitsch {
1202416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1203d5d45c9bSBarry Smith 
12043a40ed3dSBarry Smith   PetscFunctionBegin;
1205b4e2f619SBarry Smith   if (A->hash_active) {
1206e3c72094SPierre Jolivet     A->ops[0] = a->cops;
1207b4e2f619SBarry Smith     PetscCall(PetscHMapIJVDestroy(&a->ht));
1208b4e2f619SBarry Smith     PetscCall(PetscFree(a->dnz));
1209b4e2f619SBarry Smith     A->hash_active = PETSC_FALSE;
1210b4e2f619SBarry Smith   }
1211b4e2f619SBarry Smith 
12123ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz));
12139566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12149566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12159566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12169566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12179566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12189566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12199566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12209566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12219566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12229566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12239566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12249566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
12259566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12269566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
12279566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1228901853e0SKris Buschelman 
12296718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12306718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12316718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12326718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12336718818eSStefano Zampini      due to different matrix sizes */
12349566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12356718818eSStefano Zampini 
12369566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12372e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12382e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12399566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12452e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12462e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12472e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12482e956fe4SStefano Zampini #endif
12494222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12509566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12534222ddf1SHong Zhang #endif
1254d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
1255d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL));
1256d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL));
1257d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL));
1258d5e393b6SSuyash Tandon #endif
12593d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12609566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12613d0639e7SStefano Zampini #endif
12629566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1263af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12649566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1265af8000cdSHong Zhang #endif
1266d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
12679566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1268d24d4204SJose E. Roman #endif
126963c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12709566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12719566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
127263c07aadSStefano Zampini #endif
12739566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12749566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
12759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
12769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
12772e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
12789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
12799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
12809566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
12819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
12829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
12839566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
12849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
12859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
12869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
12879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
12882e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
12892e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
12902e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
12912e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
12922e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
12932e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
12942e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
12953ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
129617ab2063SBarry Smith }
129717ab2063SBarry Smith 
1298d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1299d71ae5a4SJacob Faibussowitsch {
1300416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
13013a40ed3dSBarry Smith 
13023a40ed3dSBarry Smith   PetscFunctionBegin;
1303a65d3064SKris Buschelman   switch (op) {
1304d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1305d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1306d71ae5a4SJacob Faibussowitsch     break;
1307d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1308d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1309d71ae5a4SJacob Faibussowitsch     break;
1310d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1311d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1312d71ae5a4SJacob Faibussowitsch     break;
1313d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1314d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1315d71ae5a4SJacob Faibussowitsch     break;
1316d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1317d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1318d71ae5a4SJacob Faibussowitsch     break;
1319d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1320d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1321d71ae5a4SJacob Faibussowitsch     break;
1322d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1323d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1324d71ae5a4SJacob Faibussowitsch     break;
13253d472b54SHong Zhang   case MAT_SPD:
1326b1646e73SJed Brown   case MAT_SYMMETRIC:
1327b1646e73SJed Brown   case MAT_STRUCTURALLY_SYMMETRIC:
1328b1646e73SJed Brown   case MAT_HERMITIAN:
1329b1646e73SJed Brown   case MAT_SYMMETRY_ETERNAL:
1330957cac9fSHong Zhang   case MAT_STRUCTURE_ONLY:
1331b94d7dedSBarry Smith   case MAT_STRUCTURAL_SYMMETRY_ETERNAL:
1332b94d7dedSBarry Smith   case MAT_SPD_ETERNAL:
1333b94d7dedSBarry Smith     /* if the diagonal matrix is square it inherits some of the properties above */
13345021d80fSJed Brown     break;
13358c78258cSHong Zhang   case MAT_FORCE_DIAGONAL_ENTRIES:
1336a65d3064SKris Buschelman   case MAT_IGNORE_OFF_PROC_ENTRIES:
1337d71ae5a4SJacob Faibussowitsch   case MAT_USE_HASH_TABLE:
1338d71ae5a4SJacob Faibussowitsch     PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op]));
1339d71ae5a4SJacob Faibussowitsch     break;
1340d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1341d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1342d71ae5a4SJacob Faibussowitsch     break;
1343d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1344d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1345d71ae5a4SJacob Faibussowitsch     break;
1346071fcb05SBarry Smith   case MAT_SORTED_FULL:
1347071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1348071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1349071fcb05SBarry Smith     break;
1350d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1351d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1352d71ae5a4SJacob Faibussowitsch     break;
1353d71ae5a4SJacob Faibussowitsch   default:
1354d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op);
1355a65d3064SKris Buschelman   }
13563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
135717ab2063SBarry Smith }
135817ab2063SBarry Smith 
1359*ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1360d71ae5a4SJacob Faibussowitsch {
1361416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1362fdc842d1SBarry Smith   PetscInt           i, j, n, *ai = a->i, *aj = a->j;
1363c898d852SStefano Zampini   PetscScalar       *x;
1364c898d852SStefano Zampini   const PetscScalar *aa;
136517ab2063SBarry Smith 
13663a40ed3dSBarry Smith   PetscFunctionBegin;
13679566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
136808401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1370d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1371d3e70bfaSHong Zhang     PetscInt *diag = a->diag;
13729566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
13732c990fa1SHong Zhang     for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13749566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13759566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13763ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
137735e7444dSHong Zhang   }
137835e7444dSHong Zhang 
13799566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
138035e7444dSHong Zhang   for (i = 0; i < n; i++) {
1381fdc842d1SBarry Smith     x[i] = 0.0;
138235e7444dSHong Zhang     for (j = ai[i]; j < ai[i + 1]; j++) {
138335e7444dSHong Zhang       if (aj[j] == i) {
138435e7444dSHong Zhang         x[i] = aa[j];
138517ab2063SBarry Smith         break;
138617ab2063SBarry Smith       }
138717ab2063SBarry Smith     }
138817ab2063SBarry Smith   }
13899566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
13909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
139217ab2063SBarry Smith }
139317ab2063SBarry Smith 
1394c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1395d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1396d71ae5a4SJacob Faibussowitsch {
1397416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
13985f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1399d9ca1df4SBarry Smith   PetscScalar       *y;
1400d9ca1df4SBarry Smith   const PetscScalar *x;
1401d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
14025c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
14035f22a7b3SSebastian Grimberg   const MatScalar  *v;
1404a77337e4SBarry Smith   PetscScalar       alpha;
1405d9ca1df4SBarry Smith   PetscInt          n, i, j;
1406d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14073447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1408ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14095c897100SBarry Smith #endif
141017ab2063SBarry Smith 
14113a40ed3dSBarry Smith   PetscFunctionBegin;
14129566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14139566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14149566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14165c897100SBarry Smith 
14175c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1418fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14195c897100SBarry Smith #else
14203447b6efSHong Zhang   if (usecprow) {
14213447b6efSHong Zhang     m    = cprow.nrows;
14223447b6efSHong Zhang     ii   = cprow.i;
14237b2bb3b9SHong Zhang     ridx = cprow.rindex;
14243447b6efSHong Zhang   } else {
14253447b6efSHong Zhang     ii = a->i;
14263447b6efSHong Zhang   }
142717ab2063SBarry Smith   for (i = 0; i < m; i++) {
14283447b6efSHong Zhang     idx = a->j + ii[i];
1429fff043a9SJunchao Zhang     v   = aa + ii[i];
14303447b6efSHong Zhang     n   = ii[i + 1] - ii[i];
14313447b6efSHong Zhang     if (usecprow) {
14327b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14333447b6efSHong Zhang     } else {
143417ab2063SBarry Smith       alpha = x[i];
14353447b6efSHong Zhang     }
143604fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
143717ab2063SBarry Smith   }
14385c897100SBarry Smith #endif
14399566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14409566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14419566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
144417ab2063SBarry Smith }
144517ab2063SBarry Smith 
1446d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1447d71ae5a4SJacob Faibussowitsch {
14485c897100SBarry Smith   PetscFunctionBegin;
14499566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14509566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14525c897100SBarry Smith }
14535c897100SBarry Smith 
1454c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
145578b84d54SShri Abhyankar 
1456d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1457d71ae5a4SJacob Faibussowitsch {
1458416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1459d9fead3dSBarry Smith   PetscScalar       *y;
146054f21887SBarry Smith   const PetscScalar *x;
1461fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1462003131ecSBarry Smith   PetscInt           m = A->rmap->n;
14630298fd71SBarry Smith   const PetscInt    *aj, *ii, *ridx = NULL;
14647b083b7cSBarry Smith   PetscInt           n, i;
1465362ced78SSatish Balay   PetscScalar        sum;
1466ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
146717ab2063SBarry Smith 
1468b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
146997952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1470fee21e36SBarry Smith #endif
1471fee21e36SBarry Smith 
14723a40ed3dSBarry Smith   PetscFunctionBegin;
1473b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14749566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
14753ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1476b215bc84SStefano Zampini   }
14779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14789566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14799566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1480416022c9SBarry Smith   ii = a->i;
14814eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14829566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
148397952fefSHong Zhang     m    = a->compressedrow.nrows;
148497952fefSHong Zhang     ii   = a->compressedrow.i;
148597952fefSHong Zhang     ridx = a->compressedrow.rindex;
148697952fefSHong Zhang     for (i = 0; i < m; i++) {
148797952fefSHong Zhang       n   = ii[i + 1] - ii[i];
148897952fefSHong Zhang       aj  = a->j + ii[i];
1489fff043a9SJunchao Zhang       aa  = a_a + ii[i];
149097952fefSHong Zhang       sum = 0.0;
1491003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1492003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
149397952fefSHong Zhang       y[*ridx++] = sum;
149497952fefSHong Zhang     }
149597952fefSHong Zhang   } else { /* do not use compressed row format */
1496b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
14973d3eaba7SBarry Smith     aj = a->j;
1498fff043a9SJunchao Zhang     aa = a_a;
1499b05257ddSBarry Smith     fortranmultaij_(&m, x, ii, aj, aa, y);
1500b05257ddSBarry Smith #else
150117ab2063SBarry Smith     for (i = 0; i < m; i++) {
1502003131ecSBarry Smith       n   = ii[i + 1] - ii[i];
1503003131ecSBarry Smith       aj  = a->j + ii[i];
1504fff043a9SJunchao Zhang       aa  = a_a + ii[i];
150517ab2063SBarry Smith       sum = 0.0;
1506003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
150717ab2063SBarry Smith       y[i] = sum;
150817ab2063SBarry Smith     }
15098d195f9aSBarry Smith #endif
1510b05257ddSBarry Smith   }
15119566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15129566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15139566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
151617ab2063SBarry Smith }
151717ab2063SBarry Smith 
1518*ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1519*ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1520d71ae5a4SJacob Faibussowitsch {
1521b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1522b434eb95SMatthew G. Knepley   PetscScalar       *y;
1523b434eb95SMatthew G. Knepley   const PetscScalar *x;
1524fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1525b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1526b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1527b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1528b434eb95SMatthew G. Knepley   PetscScalar        sum;
1529b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1530b434eb95SMatthew G. Knepley 
1531b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1532b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1533b434eb95SMatthew G. Knepley #endif
1534b434eb95SMatthew G. Knepley 
1535b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15379566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15389566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1539b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1540b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1541b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1542b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1543b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1544b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1545b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1546fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1547b434eb95SMatthew G. Knepley       sum = 0.0;
1548b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1549b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1550b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1551b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1552b434eb95SMatthew G. Knepley     }
1553b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15543d3eaba7SBarry Smith     ii = a->i;
1555b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1556b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1557b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1558fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1559b434eb95SMatthew G. Knepley       sum = 0.0;
1560b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1561b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1562b434eb95SMatthew G. Knepley       y[i] = sum;
1563b434eb95SMatthew G. Knepley     }
1564b434eb95SMatthew G. Knepley   }
15659566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15669566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15679566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1570b434eb95SMatthew G. Knepley }
1571b434eb95SMatthew G. Knepley 
1572*ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1573*ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1574d71ae5a4SJacob Faibussowitsch {
1575b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1576b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1577b434eb95SMatthew G. Knepley   const PetscScalar *x;
1578fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1579b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1580b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1581b434eb95SMatthew G. Knepley   PetscScalar        sum;
1582b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1583b434eb95SMatthew G. Knepley 
1584b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15859566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15869566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15879566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1588b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
158948a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1590b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1591b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1592b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1593b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1594b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1595b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1596fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1597b434eb95SMatthew G. Knepley       sum = y[*ridx];
1598b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1599b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1600b434eb95SMatthew G. Knepley     }
1601b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
16023d3eaba7SBarry Smith     ii = a->i;
1603b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1604b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1605b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1606fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1607b434eb95SMatthew G. Knepley       sum = y[i];
1608b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1609b434eb95SMatthew G. Knepley       z[i] = sum;
1610b434eb95SMatthew G. Knepley     }
1611b434eb95SMatthew G. Knepley   }
16129566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16139566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16149566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1617b434eb95SMatthew G. Knepley }
1618b434eb95SMatthew G. Knepley 
1619c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1620d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1621d71ae5a4SJacob Faibussowitsch {
1622416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1623f15663dcSBarry Smith   PetscScalar       *y, *z;
1624f15663dcSBarry Smith   const PetscScalar *x;
1625fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1626d9ca1df4SBarry Smith   const PetscInt    *aj, *ii, *ridx = NULL;
1627d9ca1df4SBarry Smith   PetscInt           m = A->rmap->n, n, i;
1628362ced78SSatish Balay   PetscScalar        sum;
1629ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16309ea0dfa2SSatish Balay 
16313a40ed3dSBarry Smith   PetscFunctionBegin;
1632b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16339566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
16343ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1635b215bc84SStefano Zampini   }
16369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16379566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16389566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16394eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
164048a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
164197952fefSHong Zhang     m    = a->compressedrow.nrows;
164297952fefSHong Zhang     ii   = a->compressedrow.i;
164397952fefSHong Zhang     ridx = a->compressedrow.rindex;
164497952fefSHong Zhang     for (i = 0; i < m; i++) {
164597952fefSHong Zhang       n   = ii[i + 1] - ii[i];
164697952fefSHong Zhang       aj  = a->j + ii[i];
1647fff043a9SJunchao Zhang       aa  = a_a + ii[i];
164897952fefSHong Zhang       sum = y[*ridx];
1649f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
165097952fefSHong Zhang       z[*ridx++] = sum;
165197952fefSHong Zhang     }
165297952fefSHong Zhang   } else { /* do not use compressed row format */
16533d3eaba7SBarry Smith     ii = a->i;
1654f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
16553d3eaba7SBarry Smith     aj = a->j;
1656fff043a9SJunchao Zhang     aa = a_a;
1657f15663dcSBarry Smith     fortranmultaddaij_(&m, x, ii, aj, aa, y, z);
1658f15663dcSBarry Smith #else
165917ab2063SBarry Smith     for (i = 0; i < m; i++) {
1660f15663dcSBarry Smith       n   = ii[i + 1] - ii[i];
1661f15663dcSBarry Smith       aj  = a->j + ii[i];
1662fff043a9SJunchao Zhang       aa  = a_a + ii[i];
166317ab2063SBarry Smith       sum = y[i];
1664f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
166517ab2063SBarry Smith       z[i] = sum;
166617ab2063SBarry Smith     }
166702ab625aSSatish Balay #endif
1668f15663dcSBarry Smith   }
16699566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16709566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16719566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
167417ab2063SBarry Smith }
167517ab2063SBarry Smith 
167617ab2063SBarry Smith /*
167717ab2063SBarry Smith      Adds diagonal pointers to sparse matrix structure.
167817ab2063SBarry Smith */
1679d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
1680d71ae5a4SJacob Faibussowitsch {
1681416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1682d0f46423SBarry Smith   PetscInt    i, j, m = A->rmap->n;
1683c0c07093SJunchao Zhang   PetscBool   alreadySet = PETSC_TRUE;
168417ab2063SBarry Smith 
16853a40ed3dSBarry Smith   PetscFunctionBegin;
168609f38230SBarry Smith   if (!a->diag) {
16879566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &a->diag));
1688c0c07093SJunchao Zhang     alreadySet = PETSC_FALSE;
168909f38230SBarry Smith   }
1690d0f46423SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
1691c0c07093SJunchao Zhang     /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */
1692c0c07093SJunchao Zhang     if (alreadySet) {
1693c0c07093SJunchao Zhang       PetscInt pos = a->diag[i];
1694c0c07093SJunchao Zhang       if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue;
1695c0c07093SJunchao Zhang     }
1696c0c07093SJunchao Zhang 
169709f38230SBarry Smith     a->diag[i] = a->i[i + 1];
1698bfeeae90SHong Zhang     for (j = a->i[i]; j < a->i[i + 1]; j++) {
1699bfeeae90SHong Zhang       if (a->j[j] == i) {
170009f38230SBarry Smith         a->diag[i] = j;
170117ab2063SBarry Smith         break;
170217ab2063SBarry Smith       }
170317ab2063SBarry Smith     }
170417ab2063SBarry Smith   }
17053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
170617ab2063SBarry Smith }
170717ab2063SBarry Smith 
1708*ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1709d71ae5a4SJacob Faibussowitsch {
171061ecd0c6SBarry Smith   Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
171161ecd0c6SBarry Smith   const PetscInt *diag = (const PetscInt *)a->diag;
171261ecd0c6SBarry Smith   const PetscInt *ii   = (const PetscInt *)a->i;
171361ecd0c6SBarry Smith   PetscInt        i, *mdiag = NULL;
171461ecd0c6SBarry Smith   PetscInt        cnt = 0; /* how many diagonals are missing */
171561ecd0c6SBarry Smith 
171661ecd0c6SBarry Smith   PetscFunctionBegin;
171761ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
17189566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
17199566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
17203ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
172161ecd0c6SBarry Smith   }
172261ecd0c6SBarry Smith 
172361ecd0c6SBarry Smith   if (a->diagonaldense) {
172461ecd0c6SBarry Smith     cnt = 0;
172561ecd0c6SBarry Smith   } else {
17269566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
172761ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
1728349d3b71SJunchao Zhang       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
172961ecd0c6SBarry Smith         cnt++;
173061ecd0c6SBarry Smith         mdiag[i] = 1;
173161ecd0c6SBarry Smith       }
173261ecd0c6SBarry Smith     }
173361ecd0c6SBarry Smith   }
173461ecd0c6SBarry Smith   if (!cnt) {
17359566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
173661ecd0c6SBarry Smith   } else {
1737b6f2aa54SBarry Smith     PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1738b6f2aa54SBarry Smith     PetscInt    *oldj = a->j, *oldi = a->i;
173961ecd0c6SBarry Smith     PetscBool    singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij;
174061ecd0c6SBarry Smith 
174161ecd0c6SBarry Smith     a->a = NULL;
174261ecd0c6SBarry Smith     a->j = NULL;
174361ecd0c6SBarry Smith     a->i = NULL;
174461ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
1745ad540459SPierre Jolivet     for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17469566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
174761ecd0c6SBarry Smith 
174861ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
174961ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
17509566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
175148a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1752447d62f5SStefano Zampini     }
17539566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17549566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
175561ecd0c6SBarry Smith     if (singlemalloc) {
17569566063dSJacob Faibussowitsch       PetscCall(PetscFree3(olda, oldj, oldi));
175761ecd0c6SBarry Smith     } else {
17589566063dSJacob Faibussowitsch       if (free_a) PetscCall(PetscFree(olda));
17599566063dSJacob Faibussowitsch       if (free_ij) PetscCall(PetscFree(oldj));
17609566063dSJacob Faibussowitsch       if (free_ij) PetscCall(PetscFree(oldi));
176161ecd0c6SBarry Smith     }
176261ecd0c6SBarry Smith   }
17639566063dSJacob Faibussowitsch   PetscCall(PetscFree(mdiag));
176461ecd0c6SBarry Smith   a->diagonaldense = PETSC_TRUE;
17653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
176661ecd0c6SBarry Smith }
176761ecd0c6SBarry Smith 
1768be5855fcSBarry Smith /*
1769be5855fcSBarry Smith      Checks for missing diagonals
1770be5855fcSBarry Smith */
1771d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d)
1772d71ae5a4SJacob Faibussowitsch {
1773be5855fcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
17747734d3b5SMatthew G. Knepley   PetscInt   *diag, *ii = a->i, i;
1775be5855fcSBarry Smith 
1776be5855fcSBarry Smith   PetscFunctionBegin;
177709f38230SBarry Smith   *missing = PETSC_FALSE;
17787734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
177909f38230SBarry Smith     *missing = PETSC_TRUE;
178009f38230SBarry Smith     if (d) *d = 0;
17819566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
178209f38230SBarry Smith   } else {
178301445905SHong Zhang     PetscInt n;
178401445905SHong Zhang     n    = PetscMin(A->rmap->n, A->cmap->n);
1785f1e2ffcdSBarry Smith     diag = a->diag;
178601445905SHong Zhang     for (i = 0; i < n; i++) {
17877734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
178809f38230SBarry Smith         *missing = PETSC_TRUE;
178909f38230SBarry Smith         if (d) *d = i;
17909566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i));
1791358d2f5dSShri Abhyankar         break;
179209f38230SBarry Smith       }
1793be5855fcSBarry Smith     }
1794be5855fcSBarry Smith   }
17953ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1796be5855fcSBarry Smith }
1797be5855fcSBarry Smith 
17980da83c2eSBarry Smith #include <petscblaslapack.h>
17990da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
18000da83c2eSBarry Smith 
18010da83c2eSBarry Smith /*
18020da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
18030da83c2eSBarry Smith */
1804*ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1805d71ae5a4SJacob Faibussowitsch {
18060da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
18070da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
18080da83c2eSBarry Smith   const PetscReal shift = 0.0;
18090da83c2eSBarry Smith   PetscInt        ipvt[5];
18104e208921SJed Brown   PetscCount      flops = 0;
18110da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
18120da83c2eSBarry Smith 
18130da83c2eSBarry Smith   PetscFunctionBegin;
18140da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
18150da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
181608401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1817ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
18189566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
181948a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
18200da83c2eSBarry Smith   ncnt = 0;
18210da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
18220da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
18239566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
18240da83c2eSBarry Smith     switch (bsizes[i]) {
1825d71ae5a4SJacob Faibussowitsch     case 1:
1826d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1827d71ae5a4SJacob Faibussowitsch       break;
18280da83c2eSBarry Smith     case 2:
18299566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
18300da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18319566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
18320da83c2eSBarry Smith       break;
18330da83c2eSBarry Smith     case 3:
18349566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
18350da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18369566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
18370da83c2eSBarry Smith       break;
18380da83c2eSBarry Smith     case 4:
18399566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
18400da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18419566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
18420da83c2eSBarry Smith       break;
18430da83c2eSBarry Smith     case 5:
18449566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
18450da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18469566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
18470da83c2eSBarry Smith       break;
18480da83c2eSBarry Smith     case 6:
18499566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
18500da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18519566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
18520da83c2eSBarry Smith       break;
18530da83c2eSBarry Smith     case 7:
18549566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
18550da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18569566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
18570da83c2eSBarry Smith       break;
18580da83c2eSBarry Smith     default:
18599566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
18600da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18619566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
18620da83c2eSBarry Smith     }
18630da83c2eSBarry Smith     ncnt += bsizes[i];
18640da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
18654e208921SJed Brown     flops += 2 * PetscPowInt(bsizes[i], 3) / 3;
18660da83c2eSBarry Smith   }
18673ba16761SJacob Faibussowitsch   PetscCall(PetscLogFlops(flops));
186848a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18699566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18710da83c2eSBarry Smith }
18720da83c2eSBarry Smith 
1873422a814eSBarry Smith /*
1874422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1875422a814eSBarry Smith */
1876*ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1877d71ae5a4SJacob Faibussowitsch {
187871f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1879d0f46423SBarry Smith   PetscInt         i, *diag, m = A->rmap->n;
18802e5835c6SStefano Zampini   const MatScalar *v;
188154f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
188271f1c65dSBarry Smith 
188371f1c65dSBarry Smith   PetscFunctionBegin;
18843ba16761SJacob Faibussowitsch   if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS);
18859566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
188671f1c65dSBarry Smith   diag = a->diag;
18874dfa11a4SJacob Faibussowitsch   if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); }
18882e5835c6SStefano Zampini 
188971f1c65dSBarry Smith   mdiag = a->mdiag;
189071f1c65dSBarry Smith   idiag = a->idiag;
18919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1892422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
189371f1c65dSBarry Smith     for (i = 0; i < m; i++) {
189471f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1895899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1896899639b0SHong Zhang         if (PetscRealPart(fshift)) {
18979566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
18987b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18997b6c816cSBarry Smith           A->factorerror_zeropivot_value = 0.0;
19007b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
190198921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
1902899639b0SHong Zhang       }
190371f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
190471f1c65dSBarry Smith     }
19059566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
190671f1c65dSBarry Smith   } else {
190771f1c65dSBarry Smith     for (i = 0; i < m; i++) {
190871f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
190971f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
191071f1c65dSBarry Smith     }
19119566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
191271f1c65dSBarry Smith   }
191371f1c65dSBarry Smith   a->idiagvalid = PETSC_TRUE;
19149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
19153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
191671f1c65dSBarry Smith }
191771f1c65dSBarry Smith 
1918c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h>
1919d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1920d71ae5a4SJacob Faibussowitsch {
1921416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1922e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
19232e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
192454f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
19253d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
192697f1f81fSBarry Smith   const PetscInt    *idx, *diag;
192717ab2063SBarry Smith 
19283a40ed3dSBarry Smith   PetscFunctionBegin;
1929b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
19309566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
19313ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1932b215bc84SStefano Zampini   }
1933b965ef7fSBarry Smith   its = its * lits;
193491723122SBarry Smith 
193571f1c65dSBarry Smith   if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
19369566063dSJacob Faibussowitsch   if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift));
193771f1c65dSBarry Smith   a->fshift = fshift;
193871f1c65dSBarry Smith   a->omega  = omega;
1939ed480e8bSBarry Smith 
194071f1c65dSBarry Smith   diag  = a->diag;
194171f1c65dSBarry Smith   t     = a->ssor_work;
1942ed480e8bSBarry Smith   idiag = a->idiag;
194371f1c65dSBarry Smith   mdiag = a->mdiag;
1944ed480e8bSBarry Smith 
19459566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
19469566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
19479566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1948ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
194917ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
195017ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1951ed480e8bSBarry Smith     bs = b;
195217ab2063SBarry Smith     for (i = 0; i < m; i++) {
195371f1c65dSBarry Smith       d   = fshift + mdiag[i];
1954416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1955ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19562e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
195717ab2063SBarry Smith       sum = b[i] * d / omega;
1958003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
195917ab2063SBarry Smith       x[i] = sum;
196017ab2063SBarry Smith     }
19619566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19629566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19639566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
19649566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
19653ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
196617ab2063SBarry Smith   }
1967c783ea89SBarry Smith 
196808401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1969f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19704c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1971887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
197217ab2063SBarry Smith 
197317ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
197417ab2063SBarry Smith 
1975887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
197617ab2063SBarry Smith     */
197717ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
197817ab2063SBarry Smith 
197917ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
198017ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1981416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1982ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19832e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
198417ab2063SBarry Smith       sum = b[i];
1985e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1986ed480e8bSBarry Smith       x[i] = sum * idiag[i];
198717ab2063SBarry Smith     }
198817ab2063SBarry Smith 
198917ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19902e5835c6SStefano Zampini     v = aa;
19912205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
199217ab2063SBarry Smith 
199317ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1994ed480e8bSBarry Smith     ts   = t;
1995416022c9SBarry Smith     diag = a->diag;
199617ab2063SBarry Smith     for (i = 0; i < m; i++) {
1997416022c9SBarry Smith       n   = diag[i] - a->i[i];
1998ed480e8bSBarry Smith       idx = a->j + a->i[i];
19992e5835c6SStefano Zampini       v   = aa + a->i[i];
200017ab2063SBarry Smith       sum = t[i];
2001003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
2002ed480e8bSBarry Smith       t[i] = sum * idiag[i];
2003733d66baSBarry Smith       /*  x = x + t */
2004733d66baSBarry Smith       x[i] += t[i];
200517ab2063SBarry Smith     }
200617ab2063SBarry Smith 
20079566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
20089566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
20099566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
20103ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
201117ab2063SBarry Smith   }
201217ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
201317ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
201417ab2063SBarry Smith       for (i = 0; i < m; i++) {
2015416022c9SBarry Smith         n   = diag[i] - a->i[i];
2016ed480e8bSBarry Smith         idx = a->j + a->i[i];
20172e5835c6SStefano Zampini         v   = aa + a->i[i];
201817ab2063SBarry Smith         sum = b[i];
2019e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20205c99c7daSBarry Smith         t[i] = sum;
2021ed480e8bSBarry Smith         x[i] = sum * idiag[i];
202217ab2063SBarry Smith       }
20235c99c7daSBarry Smith       xb = t;
20249566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
20253a40ed3dSBarry Smith     } else xb = b;
202617ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
202717ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2028416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
2029ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
20302e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
203117ab2063SBarry Smith         sum = xb[i];
2032e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20335c99c7daSBarry Smith         if (xb == b) {
2034ed480e8bSBarry Smith           x[i] = sum * idiag[i];
20355c99c7daSBarry Smith         } else {
2036b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
203717ab2063SBarry Smith         }
20385c99c7daSBarry Smith       }
20399566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
204017ab2063SBarry Smith     }
204117ab2063SBarry Smith     its--;
204217ab2063SBarry Smith   }
204317ab2063SBarry Smith   while (its--) {
204417ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
204517ab2063SBarry Smith       for (i = 0; i < m; i++) {
2046b19a5dc2SMark Adams         /* lower */
2047b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
2048ed480e8bSBarry Smith         idx = a->j + a->i[i];
20492e5835c6SStefano Zampini         v   = aa + a->i[i];
205017ab2063SBarry Smith         sum = b[i];
2051e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2052b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
2053b19a5dc2SMark Adams         /* upper */
2054b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
2055b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
20562e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
2057b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2058b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
205917ab2063SBarry Smith       }
2060b19a5dc2SMark Adams       xb = t;
20619566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
2062b19a5dc2SMark Adams     } else xb = b;
206317ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
206417ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2065b19a5dc2SMark Adams         sum = xb[i];
2066b19a5dc2SMark Adams         if (xb == b) {
2067b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
2068416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
2069ed480e8bSBarry Smith           idx = a->j + a->i[i];
20702e5835c6SStefano Zampini           v   = aa + a->i[i];
2071e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2072ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2073b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2074b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2075b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20762e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2077b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2078b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
207917ab2063SBarry Smith         }
2080b19a5dc2SMark Adams       }
2081b19a5dc2SMark Adams       if (xb == b) {
20829566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2083b19a5dc2SMark Adams       } else {
20849566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2085b19a5dc2SMark Adams       }
208617ab2063SBarry Smith     }
208717ab2063SBarry Smith   }
20889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20899566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20909566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
20913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
209217ab2063SBarry Smith }
209317ab2063SBarry Smith 
2094*ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2095d71ae5a4SJacob Faibussowitsch {
2096416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
20974e220ebcSLois Curfman McInnes 
20983a40ed3dSBarry Smith   PetscFunctionBegin;
20994e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
21003966268fSBarry Smith   info->nz_allocated = a->maxnz;
21013966268fSBarry Smith   info->nz_used      = a->nz;
21023966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
21033966268fSBarry Smith   info->assemblies   = A->num_ass;
21043966268fSBarry Smith   info->mallocs      = A->info.mallocs;
21054dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2106d5f3da31SBarry Smith   if (A->factortype) {
21074e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
21084e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
21094e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
21104e220ebcSLois Curfman McInnes   } else {
21114e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
21124e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
21134e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
21144e220ebcSLois Curfman McInnes   }
21153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
211617ab2063SBarry Smith }
211717ab2063SBarry Smith 
2118*ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2119d71ae5a4SJacob Faibussowitsch {
2120416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2121c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
212297b48c8fSBarry Smith   const PetscScalar *xx;
21232e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2124c7da8527SEric Chamberland   PetscInt           d = 0;
212517ab2063SBarry Smith 
21263a40ed3dSBarry Smith   PetscFunctionBegin;
212797b48c8fSBarry Smith   if (x && b) {
21289566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21299566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
213097b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2131aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2132447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
213397b48c8fSBarry Smith       bb[rows[i]] = diag * xx[rows[i]];
213497b48c8fSBarry Smith     }
21359566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21369566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
213797b48c8fSBarry Smith   }
213897b48c8fSBarry Smith 
21399566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2140a9817697SBarry Smith   if (a->keepnonzeropattern) {
2141f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2142aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21439566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2144f1e2ffcdSBarry Smith     }
2145f4df32b1SMatthew Knepley     if (diag != 0.0) {
2146c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2147c7da8527SEric Chamberland         d = rows[i];
2148447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
214908401ef6SPierre Jolivet         PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
2150c7da8527SEric Chamberland       }
2151f1e2ffcdSBarry Smith       for (i = 0; i < N; i++) {
2152447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
21532e5835c6SStefano Zampini         aa[a->diag[rows[i]]] = diag;
2154f1e2ffcdSBarry Smith       }
2155f1e2ffcdSBarry Smith     }
2156f1e2ffcdSBarry Smith   } else {
2157f4df32b1SMatthew Knepley     if (diag != 0.0) {
215817ab2063SBarry Smith       for (i = 0; i < N; i++) {
2159aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21607ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2161447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2162447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2163447d62f5SStefano Zampini           } else {
2164416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
21652e5835c6SStefano Zampini             aa[a->i[rows[i]]]   = diag;
2166bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2167447d62f5SStefano Zampini           }
2168447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
21699566063dSJacob Faibussowitsch           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
217017ab2063SBarry Smith         }
217117ab2063SBarry Smith       }
21723a40ed3dSBarry Smith     } else {
217317ab2063SBarry Smith       for (i = 0; i < N; i++) {
2174aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2175416022c9SBarry Smith         a->ilen[rows[i]] = 0;
217617ab2063SBarry Smith       }
217717ab2063SBarry Smith     }
2178e56f5c9eSBarry Smith     A->nonzerostate++;
2179f1e2ffcdSBarry Smith   }
21809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2181dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
218317ab2063SBarry Smith }
218417ab2063SBarry Smith 
2185*ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2186d71ae5a4SJacob Faibussowitsch {
21876e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21886e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
21892b40b63fSBarry Smith   PetscBool          missing, *zeroed, vecs = PETSC_FALSE;
21906e169961SBarry Smith   const PetscScalar *xx;
21912e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
21926e169961SBarry Smith 
21936e169961SBarry Smith   PetscFunctionBegin;
21943ba16761SJacob Faibussowitsch   if (!N) PetscFunctionReturn(PETSC_SUCCESS);
21959566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
21966e169961SBarry Smith   if (x && b) {
21979566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21989566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
21992b40b63fSBarry Smith     vecs = PETSC_TRUE;
22006e169961SBarry Smith   }
22019566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
22026e169961SBarry Smith   for (i = 0; i < N; i++) {
2203aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
22049566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
22052205254eSKarl Rupp 
22066e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
22076e169961SBarry Smith   }
22086e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
22096e169961SBarry Smith     if (!zeroed[i]) {
22106e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
22114cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
22122e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
22132e5835c6SStefano Zampini           aa[j] = 0.0;
22146e169961SBarry Smith         }
22156e169961SBarry Smith       }
22164cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i];
22176e169961SBarry Smith   }
22186e169961SBarry Smith   if (x && b) {
22199566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
22209566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
22216e169961SBarry Smith   }
22229566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
22236e169961SBarry Smith   if (diag != 0.0) {
22249566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d));
22251d5a398dSstefano_zampini     if (missing) {
22261d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
22274cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2228aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
22299566063dSJacob Faibussowitsch         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
22301d5a398dSstefano_zampini       }
22311d5a398dSstefano_zampini     } else {
2232ad540459SPierre Jolivet       for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag;
22336e169961SBarry Smith     }
22341d5a398dSstefano_zampini   }
22359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2236dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
22373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22386e169961SBarry Smith }
22396e169961SBarry Smith 
2240d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2241d71ae5a4SJacob Faibussowitsch {
2242fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2243fff043a9SJunchao Zhang   const PetscScalar *aa;
2244fff043a9SJunchao Zhang   PetscInt          *itmp;
224517ab2063SBarry Smith 
22463a40ed3dSBarry Smith   PetscFunctionBegin;
22479566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2248416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
22492e5835c6SStefano Zampini   if (v) *v = (PetscScalar *)(aa + a->i[row]);
225017ab2063SBarry Smith   if (idx) {
2251bfeeae90SHong Zhang     itmp = a->j + a->i[row];
225226fbe8dcSKarl Rupp     if (*nz) *idx = itmp;
2253f4259b30SLisandro Dalcin     else *idx = NULL;
225417ab2063SBarry Smith   }
22559566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
22563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225717ab2063SBarry Smith }
225817ab2063SBarry Smith 
2259d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2260d71ae5a4SJacob Faibussowitsch {
22613a40ed3dSBarry Smith   PetscFunctionBegin;
2262cb4a9cd9SHong Zhang   if (nz) *nz = 0;
22632e5835c6SStefano Zampini   if (idx) *idx = NULL;
22642e5835c6SStefano Zampini   if (v) *v = NULL;
22653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
226617ab2063SBarry Smith }
226717ab2063SBarry Smith 
2268*ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2269d71ae5a4SJacob Faibussowitsch {
2270416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
22712e5835c6SStefano Zampini   const MatScalar *v;
227236db0b34SBarry Smith   PetscReal        sum = 0.0;
227397f1f81fSBarry Smith   PetscInt         i, j;
227417ab2063SBarry Smith 
22753a40ed3dSBarry Smith   PetscFunctionBegin;
22769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
227717ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2278570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2279570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2280792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2281570b7f6dSBarry Smith #else
2282416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22839371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22849371c9d4SSatish Balay       v++;
228517ab2063SBarry Smith     }
22868f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2287570b7f6dSBarry Smith #endif
22889566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22893a40ed3dSBarry Smith   } else if (type == NORM_1) {
229036db0b34SBarry Smith     PetscReal *tmp;
229197f1f81fSBarry Smith     PetscInt  *jj = a->j;
22929566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp));
2293064f8208SBarry Smith     *nrm = 0.0;
2294416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22959371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22969371c9d4SSatish Balay       v++;
229717ab2063SBarry Smith     }
2298d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2299064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
230017ab2063SBarry Smith     }
23019566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
23029566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
23033a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2304064f8208SBarry Smith     *nrm = 0.0;
2305d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
23062e5835c6SStefano Zampini       const PetscScalar *v2 = v + a->i[j];
230717ab2063SBarry Smith       sum                   = 0.0;
2308416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
23099371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
23109371c9d4SSatish Balay         v2++;
231117ab2063SBarry Smith       }
2312064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
231317ab2063SBarry Smith     }
23149566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
2315f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
23169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
23173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
231817ab2063SBarry Smith }
231917ab2063SBarry Smith 
2320*ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2321d71ae5a4SJacob Faibussowitsch {
23223d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
232354f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
23242e5835c6SStefano Zampini   const MatScalar *va, *vb;
232597f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2326cd0d46ebSvictorle 
2327cd0d46ebSvictorle   PetscFunctionBegin;
23289566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23299566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23305485867bSBarry Smith   if (ma != nb || na != mb) {
23315485867bSBarry Smith     *f = PETSC_FALSE;
23323ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23335485867bSBarry Smith   }
23349566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
23359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
23369371c9d4SSatish Balay   aii = aij->i;
23379371c9d4SSatish Balay   bii = bij->i;
23389371c9d4SSatish Balay   adx = aij->j;
23399371c9d4SSatish Balay   bdx = bij->j;
23409566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23419566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2342cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2343cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2344cd0d46ebSvictorle 
2345cd0d46ebSvictorle   *f = PETSC_TRUE;
2346cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2347cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
234897f1f81fSBarry Smith       PetscInt    idc, idr;
23495485867bSBarry Smith       PetscScalar vc, vr;
2350cd0d46ebSvictorle       /* column/row index/value */
23515485867bSBarry Smith       idc = adx[aptr[i]];
23525485867bSBarry Smith       idr = bdx[bptr[idc]];
23535485867bSBarry Smith       vc  = va[aptr[i]];
23545485867bSBarry Smith       vr  = vb[bptr[idc]];
23555485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
23565485867bSBarry Smith         *f = PETSC_FALSE;
23575485867bSBarry Smith         goto done;
2358cd0d46ebSvictorle       } else {
23595485867bSBarry Smith         aptr[i]++;
23605485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2361cd0d46ebSvictorle       }
2362cd0d46ebSvictorle     }
2363cd0d46ebSvictorle   }
2364cd0d46ebSvictorle done:
23659566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23669566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
23689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
23693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2370cd0d46ebSvictorle }
2371cd0d46ebSvictorle 
2372*ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2373d71ae5a4SJacob Faibussowitsch {
23743d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
237554f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
237654f21887SBarry Smith   MatScalar  *va, *vb;
23771cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23781cbb95d3SBarry Smith 
23791cbb95d3SBarry Smith   PetscFunctionBegin;
23809566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23819566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23821cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23831cbb95d3SBarry Smith     *f = PETSC_FALSE;
23843ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23851cbb95d3SBarry Smith   }
23869371c9d4SSatish Balay   aii = aij->i;
23879371c9d4SSatish Balay   bii = bij->i;
23889371c9d4SSatish Balay   adx = aij->j;
23899371c9d4SSatish Balay   bdx = bij->j;
23909371c9d4SSatish Balay   va  = aij->a;
23919371c9d4SSatish Balay   vb  = bij->a;
23929566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23939566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23941cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23951cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23961cbb95d3SBarry Smith 
23971cbb95d3SBarry Smith   *f = PETSC_TRUE;
23981cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
23991cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
24001cbb95d3SBarry Smith       PetscInt    idc, idr;
24011cbb95d3SBarry Smith       PetscScalar vc, vr;
24021cbb95d3SBarry Smith       /* column/row index/value */
24031cbb95d3SBarry Smith       idc = adx[aptr[i]];
24041cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
24051cbb95d3SBarry Smith       vc  = va[aptr[i]];
24061cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
24071cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
24081cbb95d3SBarry Smith         *f = PETSC_FALSE;
24091cbb95d3SBarry Smith         goto done;
24101cbb95d3SBarry Smith       } else {
24111cbb95d3SBarry Smith         aptr[i]++;
24121cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
24131cbb95d3SBarry Smith       }
24141cbb95d3SBarry Smith     }
24151cbb95d3SBarry Smith   }
24161cbb95d3SBarry Smith done:
24179566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
24189566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
24193ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24201cbb95d3SBarry Smith }
24211cbb95d3SBarry Smith 
2422*ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f)
2423d71ae5a4SJacob Faibussowitsch {
24249e29f15eSvictorle   PetscFunctionBegin;
24259566063dSJacob Faibussowitsch   PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f));
24263ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24279e29f15eSvictorle }
24289e29f15eSvictorle 
2429*ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f)
2430d71ae5a4SJacob Faibussowitsch {
24311cbb95d3SBarry Smith   PetscFunctionBegin;
24329566063dSJacob Faibussowitsch   PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f));
24333ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24341cbb95d3SBarry Smith }
24351cbb95d3SBarry Smith 
2436d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2437d71ae5a4SJacob Faibussowitsch {
2438416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2439fff8e43fSBarry Smith   const PetscScalar *l, *r;
2440fff8e43fSBarry Smith   PetscScalar        x;
244154f21887SBarry Smith   MatScalar         *v;
2442fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2443fff8e43fSBarry Smith   const PetscInt    *jj;
244417ab2063SBarry Smith 
24453a40ed3dSBarry Smith   PetscFunctionBegin;
244617ab2063SBarry Smith   if (ll) {
24473ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
24483ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
24499566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
245008401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
24519566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
24529566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
245317ab2063SBarry Smith     for (i = 0; i < m; i++) {
245417ab2063SBarry Smith       x = l[i];
2455416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
24562205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
245717ab2063SBarry Smith     }
24589566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
24599566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
24609566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
246117ab2063SBarry Smith   }
246217ab2063SBarry Smith   if (rr) {
24639566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
246408401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
24659566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
24669566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
24672e5835c6SStefano Zampini     jj = a->j;
24682205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
24699566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
24709566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
24719566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
247217ab2063SBarry Smith   }
24739566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
24743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
247517ab2063SBarry Smith }
247617ab2063SBarry Smith 
2477d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2478d71ae5a4SJacob Faibussowitsch {
2479db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2480d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
248197f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
24825d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
24832e5835c6SStefano Zampini   const PetscScalar *aa;
24845d0c19d7SBarry Smith   PetscInt           nrows, ncols;
248597f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
2486fb3c7e2dSJunchao Zhang   MatScalar         *a_new, *mat_a, *c_a;
2487416022c9SBarry Smith   Mat                C;
2488cdc6f3adSToby Isaac   PetscBool          stride;
248917ab2063SBarry Smith 
24903a40ed3dSBarry Smith   PetscFunctionBegin;
24919566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24929566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24939566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
249417ab2063SBarry Smith 
24959566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2496ff718158SBarry Smith   if (stride) {
24979566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2498ff718158SBarry Smith   } else {
2499ff718158SBarry Smith     first = 0;
2500ff718158SBarry Smith     step  = 0;
2501ff718158SBarry Smith   }
2502fee21e36SBarry Smith   if (stride && step == 1) {
250302834360SBarry Smith     /* special case of contiguous rows */
25049566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
250502834360SBarry Smith     /* loop over new rows determining lens and starting points */
250602834360SBarry Smith     for (i = 0; i < nrows; i++) {
2507bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2508a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2509a91a9bebSLisandro Dalcin       starts[i] = kstart;
251002834360SBarry Smith       for (k = kstart; k < kend; k++) {
2511bfeeae90SHong Zhang         if (aj[k] >= first) {
251202834360SBarry Smith           starts[i] = k;
251302834360SBarry Smith           break;
251402834360SBarry Smith         }
251502834360SBarry Smith       }
2516a2744918SBarry Smith       sum = 0;
251702834360SBarry Smith       while (k < kend) {
2518bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2519a2744918SBarry Smith         sum++;
252002834360SBarry Smith       }
2521a2744918SBarry Smith       lens[i] = sum;
252202834360SBarry Smith     }
252302834360SBarry Smith     /* create submatrix */
2524cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
252597f1f81fSBarry Smith       PetscInt n_cols, n_rows;
25269566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2527aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
25289566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
252908480c60SBarry Smith       C = *B;
25303a40ed3dSBarry Smith     } else {
25313bef6203SJed Brown       PetscInt rbs, cbs;
25329566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25339566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25349566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25359566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25369566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25379566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25389566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
253908480c60SBarry Smith     }
2540db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2541db02288aSLois Curfman McInnes 
254202834360SBarry Smith     /* loop over rows inserting into submatrix */
2543fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C
2544db02288aSLois Curfman McInnes     j_new = c->j;
2545db02288aSLois Curfman McInnes     i_new = c->i;
25469566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
254702834360SBarry Smith     for (i = 0; i < nrows; i++) {
2548a2744918SBarry Smith       ii    = starts[i];
2549a2744918SBarry Smith       lensi = lens[i];
2550ad540459SPierre Jolivet       for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
25519566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2552a2744918SBarry Smith       a_new += lensi;
2553a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2554a2744918SBarry Smith       c->ilen[i]   = lensi;
255502834360SBarry Smith     }
2556fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly
25579566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
25589566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
25593a40ed3dSBarry Smith   } else {
25609566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
25619566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
25629566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
25634dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
25646bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
25654dcab191SBarry Smith       smap[icol[i]] = i + 1;
25664dcab191SBarry Smith     }
25674dcab191SBarry Smith 
256802834360SBarry Smith     /* determine lens of each row */
256902834360SBarry Smith     for (i = 0; i < nrows; i++) {
2570bfeeae90SHong Zhang       kstart  = ai[irow[i]];
257102834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
257202834360SBarry Smith       lens[i] = 0;
257302834360SBarry Smith       for (k = kstart; k < kend; k++) {
2574ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
257502834360SBarry Smith       }
257602834360SBarry Smith     }
257717ab2063SBarry Smith     /* Create and fill new matrix */
2578a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2579ace3abfcSBarry Smith       PetscBool equal;
25800f5bd95cSBarry Smith 
258199141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2582aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
25839566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
258428b400f6SJacob Faibussowitsch       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros");
25859566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
258608480c60SBarry Smith       C = *B;
25873a40ed3dSBarry Smith     } else {
25883bef6203SJed Brown       PetscInt rbs, cbs;
25899566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25909566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25919566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25929566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25939566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25949566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25959566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
259608480c60SBarry Smith     }
25979566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2598fb3c7e2dSJunchao Zhang 
259999141d43SSatish Balay     c = (Mat_SeqAIJ *)(C->data);
2600fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C
260117ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
260299141d43SSatish Balay       row      = irow[i];
2603bfeeae90SHong Zhang       kstart   = ai[row];
260499141d43SSatish Balay       kend     = kstart + a->ilen[row];
2605bfeeae90SHong Zhang       mat_i    = c->i[i];
260699141d43SSatish Balay       mat_j    = c->j + mat_i;
2607fb3c7e2dSJunchao Zhang       mat_a    = c_a + mat_i;
260899141d43SSatish Balay       mat_ilen = c->ilen + i;
260917ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2610bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2611ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
26122e5835c6SStefano Zampini           *mat_a++ = aa[k];
261399141d43SSatish Balay           (*mat_ilen)++;
261417ab2063SBarry Smith         }
261517ab2063SBarry Smith       }
261617ab2063SBarry Smith     }
26179566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
261802834360SBarry Smith     /* Free work space */
26199566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
26209566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
26219566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2622cdc6f3adSToby Isaac     /* sort */
2623cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2624cdc6f3adSToby Isaac       PetscInt ilen;
2625cdc6f3adSToby Isaac 
2626cdc6f3adSToby Isaac       mat_i = c->i[i];
2627cdc6f3adSToby Isaac       mat_j = c->j + mat_i;
2628fb3c7e2dSJunchao Zhang       mat_a = c_a + mat_i;
2629cdc6f3adSToby Isaac       ilen  = c->ilen[i];
26309566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2631cdc6f3adSToby Isaac     }
2632fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a));
263302834360SBarry Smith   }
26348c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
26359566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2636305c6ccfSStefano Zampini #endif
26379566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
26389566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
263917ab2063SBarry Smith 
26409566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2641416022c9SBarry Smith   *B = C;
26423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
264317ab2063SBarry Smith }
264417ab2063SBarry Smith 
2645*ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2646d71ae5a4SJacob Faibussowitsch {
264782d44351SHong Zhang   Mat B;
264882d44351SHong Zhang 
264982d44351SHong Zhang   PetscFunctionBegin;
2650c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
26519566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
26529566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
26539566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
26549566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
26559566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
265682d44351SHong Zhang     *subMat = B;
2657c2d650bdSHong Zhang   } else {
26589566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2659c2d650bdSHong Zhang   }
26603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
266182d44351SHong Zhang }
266282d44351SHong Zhang 
2663*ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2664d71ae5a4SJacob Faibussowitsch {
266563b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
266663b91edcSBarry Smith   Mat         outA;
2667ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
266863b91edcSBarry Smith 
26693a40ed3dSBarry Smith   PetscFunctionBegin;
267008401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
26711df811f5SHong Zhang 
26729566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
26739566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2674a871dcd8SBarry Smith 
267563b91edcSBarry Smith   outA             = inA;
2676d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26779566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
26789566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
26792205254eSKarl Rupp 
26809566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
26819566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
26822205254eSKarl Rupp 
2683c3122656SLisandro Dalcin   a->row = row;
26842205254eSKarl Rupp 
26859566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
26869566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
26872205254eSKarl Rupp 
2688c3122656SLisandro Dalcin   a->col = col;
268963b91edcSBarry Smith 
269036db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26919566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26929566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2693f0ec6fceSSatish Balay 
269494a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
26959566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work));
269694a9d846SBarry Smith   }
269763b91edcSBarry Smith 
26989566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(inA));
2699137fb511SHong Zhang   if (row_identity && col_identity) {
27009566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2701137fb511SHong Zhang   } else {
27029566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2703137fb511SHong Zhang   }
27043ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2705a871dcd8SBarry Smith }
2706a871dcd8SBarry Smith 
2707d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2708d71ae5a4SJacob Faibussowitsch {
2709f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2710dfa0f9e5SStefano Zampini   PetscScalar *v;
2711c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
27123a40ed3dSBarry Smith 
27133a40ed3dSBarry Smith   PetscFunctionBegin;
27149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
27159566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2716792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
27179566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
27189566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
27199566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(inA));
27203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2721f0b747eeSBarry Smith }
2722f0b747eeSBarry Smith 
2723d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2724d71ae5a4SJacob Faibussowitsch {
272516b64355SHong Zhang   PetscInt i;
272616b64355SHong Zhang 
272716b64355SHong Zhang   PetscFunctionBegin;
272816b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
27299566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
273016b64355SHong Zhang 
273148a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
27329566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
273316b64355SHong Zhang 
273416b64355SHong Zhang     if (submatj->rbuf1) {
27359566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
27369566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
273716b64355SHong Zhang     }
273816b64355SHong Zhang 
273948a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
27409566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
27419566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
274216b64355SHong Zhang   }
274316b64355SHong Zhang 
274416b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2745eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&submatj->rmap));
27469566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
27479566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
274816b64355SHong Zhang #else
27499566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
275016b64355SHong Zhang #endif
275116b64355SHong Zhang 
275216b64355SHong Zhang   if (!submatj->allcolumns) {
275316b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2754eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap));
275516b64355SHong Zhang #else
27569566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
275716b64355SHong Zhang #endif
275816b64355SHong Zhang   }
27599566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
276016b64355SHong Zhang 
27619566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
27623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
276316b64355SHong Zhang }
276416b64355SHong Zhang 
2765d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2766d71ae5a4SJacob Faibussowitsch {
276716b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
27685c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
276916b64355SHong Zhang 
277016b64355SHong Zhang   PetscFunctionBegin;
27719566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
27729566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
27733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
277416b64355SHong Zhang }
277516b64355SHong Zhang 
277689a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
2777*ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2778d71ae5a4SJacob Faibussowitsch {
27792d033e1fSHong Zhang   PetscInt     i;
27800fb991dcSHong Zhang   Mat          C;
27810fb991dcSHong Zhang   Mat_SeqAIJ  *c;
27820fb991dcSHong Zhang   Mat_SubSppt *submatj;
27832d033e1fSHong Zhang 
27842d033e1fSHong Zhang   PetscFunctionBegin;
27852d033e1fSHong Zhang   for (i = 0; i < n; i++) {
27860fb991dcSHong Zhang     C       = (*mat)[i];
27870fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
27880fb991dcSHong Zhang     submatj = c->submatis1;
27892d033e1fSHong Zhang     if (submatj) {
2790682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
279126cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27929566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27939566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27949566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27953faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27969566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27979566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27989566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2799682e4c99SStefano Zampini       }
28002d033e1fSHong Zhang     } else {
28019566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
28022d033e1fSHong Zhang     }
28032d033e1fSHong Zhang   }
280486e85357SHong Zhang 
280563a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
28069566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
280763a75b2aSHong Zhang 
28089566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
28093ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28102d033e1fSHong Zhang }
28112d033e1fSHong Zhang 
2812*ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2813d71ae5a4SJacob Faibussowitsch {
281497f1f81fSBarry Smith   PetscInt i;
2815cddf8d76SBarry Smith 
28163a40ed3dSBarry Smith   PetscFunctionBegin;
281748a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2818cddf8d76SBarry Smith 
281948a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
28203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2821cddf8d76SBarry Smith }
2822cddf8d76SBarry Smith 
2823*ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2824d71ae5a4SJacob Faibussowitsch {
2825e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28269a88ca10SBarry Smith   PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
28275d0c19d7SBarry Smith   const PetscInt *idx;
28289a88ca10SBarry Smith   PetscInt        start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1;
2829f1af5d2fSBarry Smith   PetscBT         table;
2830bbd702dbSSatish Balay 
28313a40ed3dSBarry Smith   PetscFunctionBegin;
28329a88ca10SBarry Smith   m  = A->rmap->n / bs;
2833e4d965acSSatish Balay   ai = a->i;
2834bfeeae90SHong Zhang   aj = a->j;
28358a047759SSatish Balay 
283608401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
283706763907SSatish Balay 
28389566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
28399566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
284006763907SSatish Balay 
2841e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2842b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2843e4d965acSSatish Balay     isz = 0;
28449566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2845e4d965acSSatish Balay 
2846e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28479566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
28489566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2849e4d965acSSatish Balay 
28509a88ca10SBarry Smith     if (bs > 1) {
28519a88ca10SBarry Smith       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
28529a88ca10SBarry Smith       for (j = 0; j < n; ++j) {
28539a88ca10SBarry Smith         if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
28549a88ca10SBarry Smith       }
28559a88ca10SBarry Smith       PetscCall(ISRestoreIndices(is[i], &idx));
28569a88ca10SBarry Smith       PetscCall(ISDestroy(&is[i]));
28579a88ca10SBarry Smith 
28589a88ca10SBarry Smith       k = 0;
28599a88ca10SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
28609a88ca10SBarry Smith         n = isz;
28619a88ca10SBarry Smith         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
28629a88ca10SBarry Smith           for (ll = 0; ll < bs; ll++) {
28639a88ca10SBarry Smith             row   = bs * nidx[k] + ll;
28649a88ca10SBarry Smith             start = ai[row];
28659a88ca10SBarry Smith             end   = ai[row + 1];
28669a88ca10SBarry Smith             for (l = start; l < end; l++) {
28679a88ca10SBarry Smith               val = aj[l] / bs;
28689a88ca10SBarry Smith               if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
28699a88ca10SBarry Smith             }
28709a88ca10SBarry Smith           }
28719a88ca10SBarry Smith         }
28729a88ca10SBarry Smith       }
28739a88ca10SBarry Smith       PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i)));
28749a88ca10SBarry Smith     } else {
2875dd097bc3SLois Curfman McInnes       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2876e4d965acSSatish Balay       for (j = 0; j < n; ++j) {
28772205254eSKarl Rupp         if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
28784dcbc457SBarry Smith       }
28799566063dSJacob Faibussowitsch       PetscCall(ISRestoreIndices(is[i], &idx));
28809566063dSJacob Faibussowitsch       PetscCall(ISDestroy(&is[i]));
2881e4d965acSSatish Balay 
288204a348a9SBarry Smith       k = 0;
288304a348a9SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
288404a348a9SBarry Smith         n = isz;
288506763907SSatish Balay         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2886e4d965acSSatish Balay           row   = nidx[k];
2887e4d965acSSatish Balay           start = ai[row];
2888e4d965acSSatish Balay           end   = ai[row + 1];
288904a348a9SBarry Smith           for (l = start; l < end; l++) {
2890efb16452SHong Zhang             val = aj[l];
28912205254eSKarl Rupp             if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2892e4d965acSSatish Balay           }
2893e4d965acSSatish Balay         }
2894e4d965acSSatish Balay       }
28959566063dSJacob Faibussowitsch       PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i)));
2896e4d965acSSatish Balay     }
28979a88ca10SBarry Smith   }
28989566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
28999566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
29003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29014dcbc457SBarry Smith }
290217ab2063SBarry Smith 
2903*ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2904d71ae5a4SJacob Faibussowitsch {
29050513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
29063b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
29075d0c19d7SBarry Smith   const PetscInt *row, *col;
29085d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
290956cd22aeSBarry Smith   IS              icolp, irowp;
29100298fd71SBarry Smith   PetscInt       *cwork = NULL;
29110298fd71SBarry Smith   PetscScalar    *vwork = NULL;
29120513a670SBarry Smith 
29133a40ed3dSBarry Smith   PetscFunctionBegin;
29149566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
29159566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
29169566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
29179566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
29180513a670SBarry Smith 
29190513a670SBarry Smith   /* determine lengths of permuted rows */
29209566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
29212205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
29229566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
29239566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
29249566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
29259566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
29269566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
29279566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
29280513a670SBarry Smith 
29299566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
29300513a670SBarry Smith   for (i = 0; i < m; i++) {
29319566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29322205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
29339566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
29349566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29350513a670SBarry Smith   }
29369566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
29372205254eSKarl Rupp 
29383c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
29392205254eSKarl Rupp 
29408c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
29419566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
29429fe5e383SStefano Zampini #endif
29439566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
29449566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
29459566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
29469566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
29479566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
29489566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
294948a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
29503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29510513a670SBarry Smith }
29520513a670SBarry Smith 
2953d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2954d71ae5a4SJacob Faibussowitsch {
2955cb5b572fSBarry Smith   PetscFunctionBegin;
295633f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
295733f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2958be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2959be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
29602e5835c6SStefano Zampini     const PetscScalar *aa;
2961be6bf707SBarry Smith 
29629566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
296308401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
29649566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n]));
29659566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
29669566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
2967cb5b572fSBarry Smith   } else {
29689566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2969cb5b572fSBarry Smith   }
29703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2971cb5b572fSBarry Smith }
2972cb5b572fSBarry Smith 
2973d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2974d71ae5a4SJacob Faibussowitsch {
29756c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
29766e111a19SKarl Rupp 
29776c0721eeSBarry Smith   PetscFunctionBegin;
29786c0721eeSBarry Smith   *array = a->a;
29793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29806c0721eeSBarry Smith }
29816c0721eeSBarry Smith 
2982d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2983d71ae5a4SJacob Faibussowitsch {
29846c0721eeSBarry Smith   PetscFunctionBegin;
2985f38c1e66SStefano Zampini   *array = NULL;
29863ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29876c0721eeSBarry Smith }
2988273d9f13SBarry Smith 
29898229c054SShri Abhyankar /*
29908229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29918229c054SShri Abhyankar    have different nonzero structure.
29928229c054SShri Abhyankar */
2993d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2994d71ae5a4SJacob Faibussowitsch {
2995b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2996ec7775f6SShri Abhyankar 
2997ec7775f6SShri Abhyankar   PetscFunctionBegin;
2998ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2999ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
3000b264fe52SHong Zhang     const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i];
3001b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
3002b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
30038af7cee1SJed Brown     nnz[i] = 0;
30048af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
3005b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
3006b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
30078af7cee1SJed Brown       nnz[i]++;
30088af7cee1SJed Brown     }
30098af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
3010ec7775f6SShri Abhyankar   }
30113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3012ec7775f6SShri Abhyankar }
3013ec7775f6SShri Abhyankar 
3014d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
3015d71ae5a4SJacob Faibussowitsch {
3016b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
3017b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
3018b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
3019b264fe52SHong Zhang 
3020b264fe52SHong Zhang   PetscFunctionBegin;
3021b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
30229566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
30233ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3024b264fe52SHong Zhang }
3025b264fe52SHong Zhang 
3026d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
3027d71ae5a4SJacob Faibussowitsch {
3028ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
3029ac90fabeSBarry Smith 
3030ac90fabeSBarry Smith   PetscFunctionBegin;
3031134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
3032134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
3033134adf20SPierre Jolivet     if (e) {
30349566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
303581fa06acSBarry Smith       if (e) {
30369566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
3037134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
303881fa06acSBarry Smith       }
303981fa06acSBarry Smith     }
304054c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
304181fa06acSBarry Smith   }
3042ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
30432e5835c6SStefano Zampini     const PetscScalar *xa;
30442e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
304581fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
304681fa06acSBarry Smith 
30479566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
30489566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
30499566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
3050792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
30519566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
30529566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
30539566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
30549566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
30559566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
3056ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
30579566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
3058ac90fabeSBarry Smith   } else {
30598229c054SShri Abhyankar     Mat       B;
30608229c054SShri Abhyankar     PetscInt *nnz;
30619566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
30629566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
30639566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
30649566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
30659566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
30669566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
30679566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
30689566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
30699566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
30709bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
30719566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
3072ac90fabeSBarry Smith   }
30733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3074ac90fabeSBarry Smith }
3075ac90fabeSBarry Smith 
3076d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
3077d71ae5a4SJacob Faibussowitsch {
3078354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3079354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
3080354c94deSBarry Smith   PetscInt     i, nz;
3081354c94deSBarry Smith   PetscScalar *a;
3082354c94deSBarry Smith 
3083354c94deSBarry Smith   PetscFunctionBegin;
3084354c94deSBarry Smith   nz = aij->nz;
30859566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
30862205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
30879566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
3088354c94deSBarry Smith #else
3089354c94deSBarry Smith   PetscFunctionBegin;
3090354c94deSBarry Smith #endif
30913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3092354c94deSBarry Smith }
3093354c94deSBarry Smith 
3094*ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3095d71ae5a4SJacob Faibussowitsch {
3096e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3097d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3098e34fafa9SBarry Smith   PetscReal        atmp;
3099985db425SBarry Smith   PetscScalar     *x;
3100ce496241SStefano Zampini   const MatScalar *aa, *av;
3101e34fafa9SBarry Smith 
3102e34fafa9SBarry Smith   PetscFunctionBegin;
310328b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31049566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3105ce496241SStefano Zampini   aa = av;
3106e34fafa9SBarry Smith   ai = a->i;
3107e34fafa9SBarry Smith   aj = a->j;
3108e34fafa9SBarry Smith 
31099566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31109566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31119566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
311208401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3113e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
31149371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31159371c9d4SSatish Balay     ai++;
3116e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3117985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
31189371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
31199371c9d4SSatish Balay         x[i] = atmp;
31209371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31219371c9d4SSatish Balay       }
31229371c9d4SSatish Balay       aa++;
31239371c9d4SSatish Balay       aj++;
3124985db425SBarry Smith     }
3125985db425SBarry Smith   }
31269566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31279566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31283ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3129985db425SBarry Smith }
3130985db425SBarry Smith 
3131*ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3132d71ae5a4SJacob Faibussowitsch {
3133985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3134d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3135985db425SBarry Smith   PetscScalar     *x;
3136ce496241SStefano Zampini   const MatScalar *aa, *av;
3137985db425SBarry Smith 
3138985db425SBarry Smith   PetscFunctionBegin;
313928b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31409566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3141ce496241SStefano Zampini   aa = av;
3142985db425SBarry Smith   ai = a->i;
3143985db425SBarry Smith   aj = a->j;
3144985db425SBarry Smith 
31459566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31469566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31479566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
314808401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3149985db425SBarry Smith   for (i = 0; i < m; i++) {
31509371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31519371c9d4SSatish Balay     ai++;
3152d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31539371c9d4SSatish Balay       x[i] = *aa;
31549371c9d4SSatish Balay       if (idx) idx[i] = 0;
3155985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3156985db425SBarry Smith       x[i] = 0.0;
3157985db425SBarry Smith       if (idx) {
3158985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3159985db425SBarry Smith           if (aj[j] > j) {
3160985db425SBarry Smith             idx[i] = j;
3161985db425SBarry Smith             break;
3162985db425SBarry Smith           }
3163985db425SBarry Smith         }
31641a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31651a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3166985db425SBarry Smith       }
3167985db425SBarry Smith     }
3168985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31699371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31709371c9d4SSatish Balay         x[i] = *aa;
31719371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31729371c9d4SSatish Balay       }
31739371c9d4SSatish Balay       aa++;
31749371c9d4SSatish Balay       aj++;
3175985db425SBarry Smith     }
3176985db425SBarry Smith   }
31779566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3180985db425SBarry Smith }
3181985db425SBarry Smith 
3182*ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3183d71ae5a4SJacob Faibussowitsch {
3184c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3185c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3186ce496241SStefano Zampini   PetscScalar     *x;
3187ce496241SStefano Zampini   const MatScalar *aa, *av;
3188c87e5d42SMatthew Knepley 
3189c87e5d42SMatthew Knepley   PetscFunctionBegin;
31909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3191ce496241SStefano Zampini   aa = av;
3192c87e5d42SMatthew Knepley   ai = a->i;
3193c87e5d42SMatthew Knepley   aj = a->j;
3194c87e5d42SMatthew Knepley 
31959566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31969566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31979566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
319808401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3199c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
32009371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32019371c9d4SSatish Balay     ai++;
3202f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
32039371c9d4SSatish Balay       x[i] = *aa;
32049371c9d4SSatish Balay       if (idx) idx[i] = 0;
3205f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3206f07e67edSHong Zhang       x[i] = 0.0;
3207f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3208289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3209f07e67edSHong Zhang           if (aj[j] > j) {
3210f07e67edSHong Zhang             idx[i] = j;
32112205254eSKarl Rupp             break;
32122205254eSKarl Rupp           }
3213289a08f5SMatthew Knepley         }
3214f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3215f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3216f07e67edSHong Zhang       }
3217289a08f5SMatthew Knepley     }
3218c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
32199371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
32209371c9d4SSatish Balay         x[i] = *aa;
32219371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32229371c9d4SSatish Balay       }
32239371c9d4SSatish Balay       aa++;
32249371c9d4SSatish Balay       aj++;
3225c87e5d42SMatthew Knepley     }
3226c87e5d42SMatthew Knepley   }
32279566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32289566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3230c87e5d42SMatthew Knepley }
3231c87e5d42SMatthew Knepley 
3232*ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3233d71ae5a4SJacob Faibussowitsch {
3234985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3235d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3236d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3237985db425SBarry Smith   PetscScalar     *x;
3238ce496241SStefano Zampini   const MatScalar *aa, *av;
3239985db425SBarry Smith 
3240985db425SBarry Smith   PetscFunctionBegin;
324128b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
32429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3243ce496241SStefano Zampini   aa = av;
3244985db425SBarry Smith   ai = a->i;
3245985db425SBarry Smith   aj = a->j;
3246985db425SBarry Smith 
32479566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
32489566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32499566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
325008401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3251985db425SBarry Smith   for (i = 0; i < m; i++) {
32529371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32539371c9d4SSatish Balay     ai++;
3254d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
32559371c9d4SSatish Balay       x[i] = *aa;
32569371c9d4SSatish Balay       if (idx) idx[i] = 0;
3257985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3258985db425SBarry Smith       x[i] = 0.0;
3259985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3260985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3261985db425SBarry Smith           if (aj[j] > j) {
3262985db425SBarry Smith             idx[i] = j;
3263985db425SBarry Smith             break;
3264985db425SBarry Smith           }
3265985db425SBarry Smith         }
3266fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3267fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3268985db425SBarry Smith       }
3269985db425SBarry Smith     }
3270985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32719371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32729371c9d4SSatish Balay         x[i] = *aa;
32739371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32749371c9d4SSatish Balay       }
32759371c9d4SSatish Balay       aa++;
32769371c9d4SSatish Balay       aj++;
3277e34fafa9SBarry Smith     }
3278e34fafa9SBarry Smith   }
32799566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3282e34fafa9SBarry Smith }
3283bbead8a2SBarry Smith 
3284*ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3285d71ae5a4SJacob Faibussowitsch {
3286bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
328733d57670SJed Brown   PetscInt        i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3288bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
32890da83c2eSBarry Smith   const PetscReal shift = 0.0;
32901a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3291bbead8a2SBarry Smith 
3292bbead8a2SBarry Smith   PetscFunctionBegin;
3293a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
32944a0d0026SBarry Smith   if (a->ibdiagvalid) {
32954a0d0026SBarry Smith     if (values) *values = a->ibdiag;
32963ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
32974a0d0026SBarry Smith   }
32989566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
32994dfa11a4SJacob Faibussowitsch   if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); }
3300bbead8a2SBarry Smith   diag = a->ibdiag;
3301bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3302bbead8a2SBarry Smith   /* factor and invert each block */
3303bbead8a2SBarry Smith   switch (bs) {
3304bbead8a2SBarry Smith   case 1:
3305bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33069566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3307ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3308ec1892c8SHong Zhang         if (allowzeropivot) {
33097b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33107b6c816cSBarry Smith           A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
33117b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
33129566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
331398921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
3314ec1892c8SHong Zhang       }
3315bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3316bbead8a2SBarry Smith     }
3317bbead8a2SBarry Smith     break;
3318bbead8a2SBarry Smith   case 2:
3319bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33209371c9d4SSatish Balay       ij[0] = 2 * i;
33219371c9d4SSatish Balay       ij[1] = 2 * i + 1;
33229566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
33239566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
33247b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33259566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3326bbead8a2SBarry Smith       diag += 4;
3327bbead8a2SBarry Smith     }
3328bbead8a2SBarry Smith     break;
3329bbead8a2SBarry Smith   case 3:
3330bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33319371c9d4SSatish Balay       ij[0] = 3 * i;
33329371c9d4SSatish Balay       ij[1] = 3 * i + 1;
33339371c9d4SSatish Balay       ij[2] = 3 * i + 2;
33349566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
33359566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
33367b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33379566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3338bbead8a2SBarry Smith       diag += 9;
3339bbead8a2SBarry Smith     }
3340bbead8a2SBarry Smith     break;
3341bbead8a2SBarry Smith   case 4:
3342bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33439371c9d4SSatish Balay       ij[0] = 4 * i;
33449371c9d4SSatish Balay       ij[1] = 4 * i + 1;
33459371c9d4SSatish Balay       ij[2] = 4 * i + 2;
33469371c9d4SSatish Balay       ij[3] = 4 * i + 3;
33479566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
33489566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
33497b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33509566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3351bbead8a2SBarry Smith       diag += 16;
3352bbead8a2SBarry Smith     }
3353bbead8a2SBarry Smith     break;
3354bbead8a2SBarry Smith   case 5:
3355bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33569371c9d4SSatish Balay       ij[0] = 5 * i;
33579371c9d4SSatish Balay       ij[1] = 5 * i + 1;
33589371c9d4SSatish Balay       ij[2] = 5 * i + 2;
33599371c9d4SSatish Balay       ij[3] = 5 * i + 3;
33609371c9d4SSatish Balay       ij[4] = 5 * i + 4;
33619566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
33629566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
33637b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33649566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3365bbead8a2SBarry Smith       diag += 25;
3366bbead8a2SBarry Smith     }
3367bbead8a2SBarry Smith     break;
3368bbead8a2SBarry Smith   case 6:
3369bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33709371c9d4SSatish Balay       ij[0] = 6 * i;
33719371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33729371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33739371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33749371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33759371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33769566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33779566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33787b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33799566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3380bbead8a2SBarry Smith       diag += 36;
3381bbead8a2SBarry Smith     }
3382bbead8a2SBarry Smith     break;
3383bbead8a2SBarry Smith   case 7:
3384bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33859371c9d4SSatish Balay       ij[0] = 7 * i;
33869371c9d4SSatish Balay       ij[1] = 7 * i + 1;
33879371c9d4SSatish Balay       ij[2] = 7 * i + 2;
33889371c9d4SSatish Balay       ij[3] = 7 * i + 3;
33899371c9d4SSatish Balay       ij[4] = 7 * i + 4;
33909371c9d4SSatish Balay       ij[5] = 7 * i + 5;
3391cdd8bf47SJunchao Zhang       ij[6] = 7 * i + 6;
33929566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
33939566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
33947b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33959566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3396bbead8a2SBarry Smith       diag += 49;
3397bbead8a2SBarry Smith     }
3398bbead8a2SBarry Smith     break;
3399bbead8a2SBarry Smith   default:
34009566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3401bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3402ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
34039566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
34049566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
34057b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34069566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3407bbead8a2SBarry Smith       diag += bs2;
3408bbead8a2SBarry Smith     }
34099566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3410bbead8a2SBarry Smith   }
3411bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
34123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3413bbead8a2SBarry Smith }
3414bbead8a2SBarry Smith 
3415d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3416d71ae5a4SJacob Faibussowitsch {
341773a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3418fff043a9SJunchao Zhang   PetscScalar a, *aa;
341973a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
342073a71a0fSBarry Smith 
342173a71a0fSBarry Smith   PetscFunctionBegin;
342273a71a0fSBarry Smith   if (!x->assembled) {
34239566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
342473a71a0fSBarry Smith     for (i = 0; i < m; i++) {
342573a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
34269566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
342773a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
34289566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
342973a71a0fSBarry Smith       }
343073a71a0fSBarry Smith     }
3431e2ce353bSJunchao Zhang   } else {
34329566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
34339566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
34349566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3435e2ce353bSJunchao Zhang   }
34369566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34379566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
343973a71a0fSBarry Smith }
344073a71a0fSBarry Smith 
3441679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3442d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3443d71ae5a4SJacob Faibussowitsch {
3444679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3445679944adSJunchao Zhang   PetscScalar a;
3446679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3447679944adSJunchao Zhang 
3448679944adSJunchao Zhang   PetscFunctionBegin;
3449679944adSJunchao Zhang   nskip = high - low;
34509566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3451679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3452679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3453679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
34549566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3455679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3456679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
34579566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3458679944adSJunchao Zhang     }
3459e2ce353bSJunchao Zhang   }
34609566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34619566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3463679944adSJunchao Zhang }
3464679944adSJunchao Zhang 
34650a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3466cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3467cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3468cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
346997304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34707c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34717c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3472f4259b30SLisandro Dalcin                                        NULL,
3473f4259b30SLisandro Dalcin                                        NULL,
3474f4259b30SLisandro Dalcin                                        NULL,
3475f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3476cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3477f4259b30SLisandro Dalcin                                        NULL,
347841f059aeSBarry Smith                                        MatSOR_SeqAIJ,
347991e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
348097304618SKris Buschelman                                        /*1 5*/ MatGetInfo_SeqAIJ,
3481cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3482cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3483cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3484cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3485f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3486cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3487cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3488cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3489d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3490f4259b30SLisandro Dalcin                                        NULL,
3491f4259b30SLisandro Dalcin                                        NULL,
3492f4259b30SLisandro Dalcin                                        NULL,
3493f4259b30SLisandro Dalcin                                        NULL,
349426cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
3495f4259b30SLisandro Dalcin                                        NULL,
3496f4259b30SLisandro Dalcin                                        NULL,
3497f4259b30SLisandro Dalcin                                        NULL,
3498f4259b30SLisandro Dalcin                                        NULL,
3499d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3500f4259b30SLisandro Dalcin                                        NULL,
3501f4259b30SLisandro Dalcin                                        NULL,
3502cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3503f4259b30SLisandro Dalcin                                        NULL,
3504d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
35057dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3506cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3507cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3508cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3509d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3510cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
35117d68702bSBarry Smith                                        MatShift_SeqAIJ,
351279299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
35136e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
351473a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
35153b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
35163b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
35173b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3518a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
351993dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3520f4259b30SLisandro Dalcin                                        NULL,
3521f4259b30SLisandro Dalcin                                        NULL,
3522cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3523f4259b30SLisandro Dalcin                                        NULL,
3524f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3525b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3526b9b97703SBarry Smith                                        MatView_SeqAIJ,
3527f4259b30SLisandro Dalcin                                        NULL,
3528f4259b30SLisandro Dalcin                                        NULL,
3529f4259b30SLisandro Dalcin                                        /* 64*/ NULL,
3530321b30b9SSatish Balay                                        MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3531f4259b30SLisandro Dalcin                                        NULL,
3532f4259b30SLisandro Dalcin                                        NULL,
3533f4259b30SLisandro Dalcin                                        NULL,
3534d519adbfSMatthew Knepley                                        /* 69*/ MatGetRowMaxAbs_SeqAIJ,
3535c87e5d42SMatthew Knepley                                        MatGetRowMinAbs_SeqAIJ,
3536f4259b30SLisandro Dalcin                                        NULL,
3537f4259b30SLisandro Dalcin                                        NULL,
3538f4259b30SLisandro Dalcin                                        NULL,
3539f4259b30SLisandro Dalcin                                        /* 74*/ NULL,
35403acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3541f4259b30SLisandro Dalcin                                        NULL,
3542f4259b30SLisandro Dalcin                                        NULL,
3543f4259b30SLisandro Dalcin                                        NULL,
35446ce1633cSBarry Smith                                        /* 79*/ MatFindZeroDiagonals_SeqAIJ,
3545f4259b30SLisandro Dalcin                                        NULL,
3546f4259b30SLisandro Dalcin                                        NULL,
3547f4259b30SLisandro Dalcin                                        NULL,
3548bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
3549d519adbfSMatthew Knepley                                        /* 84*/ MatIsSymmetric_SeqAIJ,
35501cbb95d3SBarry Smith                                        MatIsHermitian_SeqAIJ,
3551f4259b30SLisandro Dalcin                                        NULL,
3552f4259b30SLisandro Dalcin                                        NULL,
3553f4259b30SLisandro Dalcin                                        NULL,
3554f4259b30SLisandro Dalcin                                        /* 89*/ NULL,
3555f4259b30SLisandro Dalcin                                        NULL,
355626be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
3557f4259b30SLisandro Dalcin                                        NULL,
3558f4259b30SLisandro Dalcin                                        NULL,
35598fa4b5a6SHong Zhang                                        /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3560f4259b30SLisandro Dalcin                                        NULL,
3561f4259b30SLisandro Dalcin                                        NULL,
35626fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
3563f4259b30SLisandro Dalcin                                        NULL,
35644222ddf1SHong Zhang                                        /* 99*/ MatProductSetFromOptions_SeqAIJ,
3565f4259b30SLisandro Dalcin                                        NULL,
3566f4259b30SLisandro Dalcin                                        NULL,
356787d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
3568f4259b30SLisandro Dalcin                                        NULL,
3569d519adbfSMatthew Knepley                                        /*104*/ MatSetValuesRow_SeqAIJ,
357099cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3571f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3572f4259b30SLisandro Dalcin                                        NULL,
3573f4259b30SLisandro Dalcin                                        NULL,
3574cbd44569SHong Zhang                                        /*109*/ MatMatSolve_SeqAIJ,
3575f4259b30SLisandro Dalcin                                        NULL,
35762af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3577f4259b30SLisandro Dalcin                                        NULL,
3578599ef60dSHong Zhang                                        MatMissingDiagonal_SeqAIJ,
3579f4259b30SLisandro Dalcin                                        /*114*/ NULL,
3580f4259b30SLisandro Dalcin                                        NULL,
3581f4259b30SLisandro Dalcin                                        NULL,
3582f4259b30SLisandro Dalcin                                        NULL,
3583f4259b30SLisandro Dalcin                                        NULL,
3584f4259b30SLisandro Dalcin                                        /*119*/ NULL,
3585f4259b30SLisandro Dalcin                                        NULL,
3586f4259b30SLisandro Dalcin                                        NULL,
3587f4259b30SLisandro Dalcin                                        NULL,
3588b3a44c85SBarry Smith                                        MatGetMultiProcBlock_SeqAIJ,
35890716a85fSBarry Smith                                        /*124*/ MatFindNonzeroRows_SeqAIJ,
3590a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
359137868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
35920da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
3593f4259b30SLisandro Dalcin                                        NULL,
3594f4259b30SLisandro Dalcin                                        /*129*/ NULL,
3595f4259b30SLisandro Dalcin                                        NULL,
3596f4259b30SLisandro Dalcin                                        NULL,
359775648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3598b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
3599b9af6bddSHong Zhang                                        /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
36002b8ad9a3SHong Zhang                                        MatTransColoringApplyDenToSp_SeqAIJ,
3601f4259b30SLisandro Dalcin                                        NULL,
3602f4259b30SLisandro Dalcin                                        NULL,
36033964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
3604f4259b30SLisandro Dalcin                                        /*139*/ NULL,
3605f4259b30SLisandro Dalcin                                        NULL,
3606f4259b30SLisandro Dalcin                                        NULL,
36073a062f41SBarry Smith                                        MatFDColoringSetUp_SeqXAIJ,
36089c8f2541SHong Zhang                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
36094222ddf1SHong Zhang                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
36104222ddf1SHong Zhang                                        /*145*/ MatDestroySubMatrices_SeqAIJ,
3611f4259b30SLisandro Dalcin                                        NULL,
361272833a62Smarkadams4                                        NULL,
361372833a62Smarkadams4                                        MatCreateGraph_Simple_AIJ,
36142d776b49SBarry Smith                                        NULL,
3615dec0b466SHong Zhang                                        /*150*/ MatTransposeSymbolic_SeqAIJ,
3616dec0b466SHong Zhang                                        MatEliminateZeros_SeqAIJ};
361717ab2063SBarry Smith 
3618*ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3619d71ae5a4SJacob Faibussowitsch {
3620bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
362197f1f81fSBarry Smith   PetscInt    i, nz, n;
3622bef8e0ddSBarry Smith 
3623bef8e0ddSBarry Smith   PetscFunctionBegin;
3624bef8e0ddSBarry Smith   nz = aij->maxnz;
3625d0f46423SBarry Smith   n  = mat->rmap->n;
3626ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3627bef8e0ddSBarry Smith   aij->nz = nz;
3628ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
36293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3630bef8e0ddSBarry Smith }
3631bef8e0ddSBarry Smith 
3632a3bb6f32SFande Kong /*
3633ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3634ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3635ddea5d60SJunchao Zhang  */
3636d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3637d71ae5a4SJacob Faibussowitsch {
3638a3bb6f32SFande Kong   Mat_SeqAIJ   *aij = (Mat_SeqAIJ *)mat->data;
3639eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1;
3640eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
364125b670f0SStefano Zampini   PetscInt      gid, lid, i, ec, nz = aij->nz;
364225b670f0SStefano Zampini   PetscInt     *garray, *jj = aij->j;
3643a3bb6f32SFande Kong 
3644a3bb6f32SFande Kong   PetscFunctionBegin;
3645a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
36464f572ea9SToby Isaac   PetscAssertPointer(mapping, 2);
3647a3bb6f32SFande Kong   /* use a table */
3648eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1));
3649a3bb6f32SFande Kong   ec = 0;
365025b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
365125b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
3652eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
3653a3bb6f32SFande Kong     if (!data) {
3654a3bb6f32SFande Kong       /* one based table */
3655c76ffc5fSJacob Faibussowitsch       PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec));
3656a3bb6f32SFande Kong     }
3657a3bb6f32SFande Kong   }
3658a3bb6f32SFande Kong   /* form array of columns we need */
36599566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
3660eec179cfSJacob Faibussowitsch   PetscHashIterBegin(gid1_lid1, tpos);
3661eec179cfSJacob Faibussowitsch   while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
3662eec179cfSJacob Faibussowitsch     PetscHashIterGetKey(gid1_lid1, tpos, gid);
3663eec179cfSJacob Faibussowitsch     PetscHashIterGetVal(gid1_lid1, tpos, lid);
3664eec179cfSJacob Faibussowitsch     PetscHashIterNext(gid1_lid1, tpos);
3665a3bb6f32SFande Kong     gid--;
3666a3bb6f32SFande Kong     lid--;
3667a3bb6f32SFande Kong     garray[lid] = gid;
3668a3bb6f32SFande Kong   }
36699566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
3670eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIClear(gid1_lid1));
3671c76ffc5fSJacob Faibussowitsch   for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1));
3672a3bb6f32SFande Kong   /* compact out the extra columns in B */
367325b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
367425b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
3675eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
3676a3bb6f32SFande Kong     lid--;
367725b670f0SStefano Zampini     jj[i] = lid;
3678a3bb6f32SFande Kong   }
36799566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
3680eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&gid1_lid1));
36819566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
36829566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
36839566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
36843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3685a3bb6f32SFande Kong }
3686a3bb6f32SFande Kong 
3687bef8e0ddSBarry Smith /*@
3688bef8e0ddSBarry Smith   MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3689bef8e0ddSBarry Smith   in the matrix.
3690bef8e0ddSBarry Smith 
3691bef8e0ddSBarry Smith   Input Parameters:
369211a5261eSBarry Smith + mat     - the `MATSEQAIJ` matrix
3693bef8e0ddSBarry Smith - indices - the column indices
3694bef8e0ddSBarry Smith 
369515091d37SBarry Smith   Level: advanced
369615091d37SBarry Smith 
3697bef8e0ddSBarry Smith   Notes:
3698bef8e0ddSBarry Smith   This can be called if you have precomputed the nonzero structure of the
3699bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
370011a5261eSBarry Smith   of the `MatSetValues()` operation.
3701bef8e0ddSBarry Smith 
3702bef8e0ddSBarry Smith   You MUST have set the correct numbers of nonzeros per row in the call to
370311a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the columns indices MUST be sorted.
3704bef8e0ddSBarry Smith 
370511a5261eSBarry Smith   MUST be called before any calls to `MatSetValues()`
3706bef8e0ddSBarry Smith 
3707b9617806SBarry Smith   The indices should start with zero, not one.
3708b9617806SBarry Smith 
37091cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
3710bef8e0ddSBarry Smith @*/
3711d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3712d71ae5a4SJacob Faibussowitsch {
3713bef8e0ddSBarry Smith   PetscFunctionBegin;
37140700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
37154f572ea9SToby Isaac   PetscAssertPointer(indices, 2);
3716cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
37173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3718bef8e0ddSBarry Smith }
3719bef8e0ddSBarry Smith 
3720*ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3721d71ae5a4SJacob Faibussowitsch {
3722be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3723d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3724be6bf707SBarry Smith 
3725be6bf707SBarry Smith   PetscFunctionBegin;
372628b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3727be6bf707SBarry Smith 
3728be6bf707SBarry Smith   /* allocate space for values if not already there */
37294dfa11a4SJacob Faibussowitsch   if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }
3730be6bf707SBarry Smith 
3731be6bf707SBarry Smith   /* copy values over */
37329566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
37333ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3734be6bf707SBarry Smith }
3735be6bf707SBarry Smith 
3736be6bf707SBarry Smith /*@
373720f4b53cSBarry Smith   MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
3738be6bf707SBarry Smith   nonlinear portion.
3739be6bf707SBarry Smith 
3740c3339decSBarry Smith   Logically Collect
3741be6bf707SBarry Smith 
374227430b45SBarry Smith   Input Parameter:
374311a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3744be6bf707SBarry Smith 
374515091d37SBarry Smith   Level: advanced
374615091d37SBarry Smith 
37472920cce0SJacob Faibussowitsch   Example Usage:
374827430b45SBarry Smith .vb
37492ef1f0ffSBarry Smith     Using SNES
375027430b45SBarry Smith     Create Jacobian matrix
375127430b45SBarry Smith     Set linear terms into matrix
375227430b45SBarry Smith     Apply boundary conditions to matrix, at this time matrix must have
375327430b45SBarry Smith       final nonzero structure (i.e. setting the nonlinear terms and applying
375427430b45SBarry Smith       boundary conditions again will not change the nonzero structure
375527430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
375627430b45SBarry Smith     MatStoreValues(mat);
375727430b45SBarry Smith     Call SNESSetJacobian() with matrix
375827430b45SBarry Smith     In your Jacobian routine
375927430b45SBarry Smith       MatRetrieveValues(mat);
376027430b45SBarry Smith       Set nonlinear terms in matrix
3761be6bf707SBarry Smith 
376227430b45SBarry Smith     Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
376327430b45SBarry Smith     // build linear portion of Jacobian
376427430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
376527430b45SBarry Smith     MatStoreValues(mat);
376627430b45SBarry Smith     loop over nonlinear iterations
376727430b45SBarry Smith        MatRetrieveValues(mat);
376827430b45SBarry Smith        // call MatSetValues(mat,...) to set nonliner portion of Jacobian
376927430b45SBarry Smith        // call MatAssemblyBegin/End() on matrix
377027430b45SBarry Smith        Solve linear system with Jacobian
377127430b45SBarry Smith     endloop
377227430b45SBarry Smith .ve
3773be6bf707SBarry Smith 
3774be6bf707SBarry Smith   Notes:
3775da81f932SPierre Jolivet   Matrix must already be assembled before calling this routine
377611a5261eSBarry Smith   Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3777be6bf707SBarry Smith   calling this routine.
3778be6bf707SBarry Smith 
37790c468ba9SBarry Smith   When this is called multiple times it overwrites the previous set of stored values
37800c468ba9SBarry Smith   and does not allocated additional space.
37810c468ba9SBarry Smith 
3782fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
3783be6bf707SBarry Smith @*/
3784d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3785d71ae5a4SJacob Faibussowitsch {
3786be6bf707SBarry Smith   PetscFunctionBegin;
37870700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
378828b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
378928b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3790cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
37913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3792be6bf707SBarry Smith }
3793be6bf707SBarry Smith 
3794*ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3795d71ae5a4SJacob Faibussowitsch {
3796be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3797d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3798be6bf707SBarry Smith 
3799be6bf707SBarry Smith   PetscFunctionBegin;
380028b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
380128b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3802be6bf707SBarry Smith   /* copy values over */
38039566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
38043ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3805be6bf707SBarry Smith }
3806be6bf707SBarry Smith 
3807be6bf707SBarry Smith /*@
380820f4b53cSBarry Smith   MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`
3809be6bf707SBarry Smith 
3810c3339decSBarry Smith   Logically Collect
3811be6bf707SBarry Smith 
38122fe279fdSBarry Smith   Input Parameter:
381311a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3814be6bf707SBarry Smith 
381515091d37SBarry Smith   Level: advanced
381615091d37SBarry Smith 
38171cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
3818be6bf707SBarry Smith @*/
3819d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3820d71ae5a4SJacob Faibussowitsch {
3821be6bf707SBarry Smith   PetscFunctionBegin;
38220700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
382328b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
382428b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3825cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
38263ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3827be6bf707SBarry Smith }
3828be6bf707SBarry Smith 
382917ab2063SBarry Smith /*@C
383011a5261eSBarry Smith   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
38310d15e28bSLois Curfman McInnes   (the default parallel PETSc format).  For good matrix assembly performance
383220f4b53cSBarry Smith   the user should preallocate the matrix storage by setting the parameter `nz`
383320f4b53cSBarry Smith   (or the array `nnz`).
383417ab2063SBarry Smith 
3835d083f849SBarry Smith   Collective
3836db81eaa0SLois Curfman McInnes 
383717ab2063SBarry Smith   Input Parameters:
383811a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF`
383917ab2063SBarry Smith . m    - number of rows
384017ab2063SBarry Smith . n    - number of columns
384117ab2063SBarry Smith . nz   - number of nonzeros per row (same for all rows)
384251c19458SBarry Smith - nnz  - array containing the number of nonzeros in the various rows
38430298fd71SBarry Smith          (possibly different for each row) or NULL
384417ab2063SBarry Smith 
384517ab2063SBarry Smith   Output Parameter:
3846416022c9SBarry Smith . A - the matrix
384717ab2063SBarry Smith 
38482ef1f0ffSBarry Smith   Options Database Keys:
38492ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
38502ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38512ef1f0ffSBarry Smith 
38522ef1f0ffSBarry Smith   Level: intermediate
3853175b88e8SBarry Smith 
3854b259b22eSLois Curfman McInnes   Notes:
385577433607SBarry Smith   It is recommend to use `MatCreateFromOptions()` instead of this routine
385677433607SBarry Smith 
38572ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
385849a6f317SBarry Smith 
38592ef1f0ffSBarry Smith   The `MATSEQAIJ` format, also called
38602ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
38610002213bSLois Curfman McInnes   storage.  That is, the stored row and column indices can begin at
38622ef1f0ffSBarry Smith   either one (as in Fortran) or zero.
386317ab2063SBarry Smith 
386420f4b53cSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
38652ef1f0ffSBarry Smith   Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
386620f4b53cSBarry Smith   allocation.
386717ab2063SBarry Smith 
3868682d7d0cSBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
38694fca80b9SLois Curfman McInnes   improve numerical efficiency of matrix-vector products and solves. We
3870682d7d0cSBarry Smith   search for consecutive rows with the same nonzero structure, thereby
38716c7ebb05SLois Curfman McInnes   reusing matrix information to achieve increased efficiency.
38726c7ebb05SLois Curfman McInnes 
38731cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
387417ab2063SBarry Smith @*/
3875d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3876d71ae5a4SJacob Faibussowitsch {
38773a40ed3dSBarry Smith   PetscFunctionBegin;
38789566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
38799566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
38809566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
38819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
38823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3883273d9f13SBarry Smith }
3884273d9f13SBarry Smith 
3885273d9f13SBarry Smith /*@C
3886273d9f13SBarry Smith   MatSeqAIJSetPreallocation - For good matrix assembly performance
3887273d9f13SBarry Smith   the user should preallocate the matrix storage by setting the parameter nz
3888273d9f13SBarry Smith   (or the array nnz).  By setting these parameters accurately, performance
3889273d9f13SBarry Smith   during matrix assembly can be increased by more than a factor of 50.
3890273d9f13SBarry Smith 
3891d083f849SBarry Smith   Collective
3892273d9f13SBarry Smith 
3893273d9f13SBarry Smith   Input Parameters:
38941c4f3114SJed Brown + B   - The matrix
3895273d9f13SBarry Smith . nz  - number of nonzeros per row (same for all rows)
3896273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows
38970298fd71SBarry Smith          (possibly different for each row) or NULL
3898273d9f13SBarry Smith 
38992ef1f0ffSBarry Smith   Options Database Keys:
39002ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
39012ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
39022ef1f0ffSBarry Smith 
39032ef1f0ffSBarry Smith   Level: intermediate
39042ef1f0ffSBarry Smith 
3905273d9f13SBarry Smith   Notes:
39062ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
390749a6f317SBarry Smith 
390811a5261eSBarry Smith   The `MATSEQAIJ` format also called
39092ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
3910273d9f13SBarry Smith   storage.  That is, the stored row and column indices can begin at
3911273d9f13SBarry Smith   either one (as in Fortran) or zero.  See the users' manual for details.
3912273d9f13SBarry Smith 
39132ef1f0ffSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
39142ef1f0ffSBarry Smith   Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
39152ef1f0ffSBarry Smith   allocation.
3916273d9f13SBarry Smith 
391711a5261eSBarry Smith   You can call `MatGetInfo()` to get information on how effective the preallocation was;
3918aa95bbe8SBarry Smith   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3919aa95bbe8SBarry Smith   You can also run with the option -info and look for messages with the string
3920aa95bbe8SBarry Smith   malloc in them to see if additional memory allocation was needed.
3921aa95bbe8SBarry Smith 
392211a5261eSBarry Smith   Developer Notes:
392311a5261eSBarry Smith   Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3924a96a251dSBarry Smith   entries or columns indices
3925a96a251dSBarry Smith 
3926273d9f13SBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
3927273d9f13SBarry Smith   improve numerical efficiency of matrix-vector products and solves. We
3928273d9f13SBarry Smith   search for consecutive rows with the same nonzero structure, thereby
3929273d9f13SBarry Smith   reusing matrix information to achieve increased efficiency.
3930273d9f13SBarry Smith 
39311cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3932db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3933273d9f13SBarry Smith @*/
3934d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3935d71ae5a4SJacob Faibussowitsch {
3936a23d5eceSKris Buschelman   PetscFunctionBegin;
39376ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
39386ba663aaSJed Brown   PetscValidType(B, 1);
3939cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
39403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3941a23d5eceSKris Buschelman }
3942a23d5eceSKris Buschelman 
3943d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3944d71ae5a4SJacob Faibussowitsch {
3945ad79cf63SBarry Smith   Mat_SeqAIJ *b              = (Mat_SeqAIJ *)B->data;
39462576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
394797f1f81fSBarry Smith   PetscInt    i;
3948273d9f13SBarry Smith 
3949273d9f13SBarry Smith   PetscFunctionBegin;
3950ad79cf63SBarry Smith   if (B->hash_active) {
3951aea10558SJacob Faibussowitsch     B->ops[0] = b->cops;
3952ad79cf63SBarry Smith     PetscCall(PetscHMapIJVDestroy(&b->ht));
3953ad79cf63SBarry Smith     PetscCall(PetscFree(b->dnz));
3954ad79cf63SBarry Smith     B->hash_active = PETSC_FALSE;
3955ad79cf63SBarry Smith   }
39562576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3957a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3958c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3959c461c341SBarry Smith     nz             = 0;
3960c461c341SBarry Smith   }
39619566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
39629566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3963899cda47SBarry Smith 
3964435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
396508401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
3966cf9c20a2SJed Brown   if (PetscUnlikelyDebug(nnz)) {
3967d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
396808401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
396908401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3970b73539f3SBarry Smith     }
3971b73539f3SBarry Smith   }
3972b73539f3SBarry Smith 
3973273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
3974ab93d7beSBarry Smith   if (!skipallocation) {
39754dfa11a4SJacob Faibussowitsch     if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); }
3976071fcb05SBarry Smith     if (!b->ilen) {
3977071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
39789566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
3979071fcb05SBarry Smith     } else {
39809566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
39812ee49352SLisandro Dalcin     }
3982aa624791SPierre Jolivet     if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre));
3983273d9f13SBarry Smith     if (!nnz) {
3984435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
3985c62bd62aSJed Brown       else if (nz < 0) nz = 1;
39865d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
3987d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
3988d0f46423SBarry Smith       nz = nz * B->rmap->n;
3989273d9f13SBarry Smith     } else {
3990c73702f5SBarry Smith       PetscInt64 nz64 = 0;
39919371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
39929371c9d4SSatish Balay         b->imax[i] = nnz[i];
39939371c9d4SSatish Balay         nz64 += nnz[i];
39949371c9d4SSatish Balay       }
39959566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
3996273d9f13SBarry Smith     }
3997ab93d7beSBarry Smith 
3998273d9f13SBarry Smith     /* allocate the matrix space */
399953dd7562SDmitry Karpeev     /* FIXME: should B's old memory be unlogged? */
40009566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
4001396832f4SHong Zhang     if (B->structure_only) {
40029566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz, &b->j));
40039566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i));
4004396832f4SHong Zhang     } else {
40059566063dSJacob Faibussowitsch       PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i));
4006396832f4SHong Zhang     }
4007bfeeae90SHong Zhang     b->i[0] = 0;
4008ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
4009396832f4SHong Zhang     if (B->structure_only) {
4010396832f4SHong Zhang       b->singlemalloc = PETSC_FALSE;
4011396832f4SHong Zhang       b->free_a       = PETSC_FALSE;
4012396832f4SHong Zhang     } else {
4013273d9f13SBarry Smith       b->singlemalloc = PETSC_TRUE;
4014e6b907acSBarry Smith       b->free_a       = PETSC_TRUE;
4015396832f4SHong Zhang     }
4016e6b907acSBarry Smith     b->free_ij = PETSC_TRUE;
4017c461c341SBarry Smith   } else {
4018e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
4019e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
4020c461c341SBarry Smith   }
4021273d9f13SBarry Smith 
4022846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
4023846b4da1SFande Kong     /* reserve user-requested sparsity */
40249566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
4025846b4da1SFande Kong   }
4026846b4da1SFande Kong 
4027273d9f13SBarry Smith   b->nz               = 0;
4028273d9f13SBarry Smith   b->maxnz            = nz;
4029273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
40301baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
4031cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
4032cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
40335519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
40345519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
40355519a089SJose E. Roman   */
40365519a089SJose E. Roman   B->nonzerostate++;
40373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4038273d9f13SBarry Smith }
4039273d9f13SBarry Smith 
4040*ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
4041d71ae5a4SJacob Faibussowitsch {
4042846b4da1SFande Kong   Mat_SeqAIJ *a;
4043a5bbaf83SFande Kong   PetscInt    i;
40441f14be2bSBarry Smith   PetscBool   skipreset;
4045846b4da1SFande Kong 
4046846b4da1SFande Kong   PetscFunctionBegin;
4047846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
404814d0e64fSAlex Lindsay 
404914d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
40503ba16761SJacob Faibussowitsch   if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS);
405114d0e64fSAlex Lindsay 
4052846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
40532c814fdeSFande Kong   /* if no saved info, we error out */
405428b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
40552c814fdeSFande Kong 
40561f14be2bSBarry Smith   PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation ");
40572c814fdeSFande Kong 
40581f14be2bSBarry Smith   PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset));
40591f14be2bSBarry Smith   if (!skipreset) {
40609566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
40619566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
4062846b4da1SFande Kong     a->i[0] = 0;
4063ad540459SPierre Jolivet     for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
4064846b4da1SFande Kong     A->preallocated     = PETSC_TRUE;
4065846b4da1SFande Kong     a->nz               = 0;
4066846b4da1SFande Kong     a->maxnz            = a->i[A->rmap->n];
4067846b4da1SFande Kong     A->info.nz_unneeded = (double)a->maxnz;
4068846b4da1SFande Kong     A->was_assembled    = PETSC_FALSE;
4069846b4da1SFande Kong     A->assembled        = PETSC_FALSE;
40701f14be2bSBarry Smith   }
40713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4072846b4da1SFande Kong }
4073846b4da1SFande Kong 
407458d36128SBarry Smith /*@
407511a5261eSBarry Smith   MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4076a1661176SMatthew Knepley 
4077a1661176SMatthew Knepley   Input Parameters:
4078a1661176SMatthew Knepley + B - the matrix
4079a1661176SMatthew Knepley . i - the indices into j for the start of each row (starts with zero)
4080a1661176SMatthew Knepley . j - the column indices for each row (starts with zero) these must be sorted for each row
4081a1661176SMatthew Knepley - v - optional values in the matrix
4082a1661176SMatthew Knepley 
4083a1661176SMatthew Knepley   Level: developer
4084a1661176SMatthew Knepley 
40856a9b8d82SBarry Smith   Notes:
40862ef1f0ffSBarry Smith   The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
408758d36128SBarry Smith 
40886a9b8d82SBarry Smith   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
40896a9b8d82SBarry Smith   structure will be the union of all the previous nonzero structures.
40906a9b8d82SBarry Smith 
40916a9b8d82SBarry Smith   Developer Notes:
40922ef1f0ffSBarry Smith   An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and
40932ef1f0ffSBarry Smith   then just copies the `v` values directly with `PetscMemcpy()`.
40946a9b8d82SBarry Smith 
409511a5261eSBarry Smith   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
40966a9b8d82SBarry Smith 
4097fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()`
4098a1661176SMatthew Knepley @*/
4099d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4100d71ae5a4SJacob Faibussowitsch {
4101a1661176SMatthew Knepley   PetscFunctionBegin;
41020700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
41036ba663aaSJed Brown   PetscValidType(B, 1);
4104cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
41053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4106a1661176SMatthew Knepley }
4107a1661176SMatthew Knepley 
4108*ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4109d71ae5a4SJacob Faibussowitsch {
4110a1661176SMatthew Knepley   PetscInt  i;
4111a1661176SMatthew Knepley   PetscInt  m, n;
4112a1661176SMatthew Knepley   PetscInt  nz;
41136a9b8d82SBarry Smith   PetscInt *nnz;
4114a1661176SMatthew Knepley 
4115a1661176SMatthew Knepley   PetscFunctionBegin;
4116aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4117779a8d59SSatish Balay 
41189566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
41199566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4120779a8d59SSatish Balay 
41219566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
41229566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4123a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4124b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
412508401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4126a1661176SMatthew Knepley     nnz[i] = nz;
4127a1661176SMatthew Knepley   }
41289566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
41299566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4130a1661176SMatthew Knepley 
413148a46eb9SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES));
4132a1661176SMatthew Knepley 
41339566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
41349566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4135a1661176SMatthew Knepley 
41369566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
41373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4138a1661176SMatthew Knepley }
4139a1661176SMatthew Knepley 
4140ad7e164aSPierre Jolivet /*@
41412ef1f0ffSBarry Smith   MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`.
4142ad7e164aSPierre Jolivet 
4143ad7e164aSPierre Jolivet   Input Parameters:
4144ad7e164aSPierre Jolivet + A     - left-hand side matrix
4145ad7e164aSPierre Jolivet . B     - right-hand side matrix
414611a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4147ad7e164aSPierre Jolivet 
4148ad7e164aSPierre Jolivet   Output Parameter:
41492ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B`
4150ad7e164aSPierre Jolivet 
4151ad7e164aSPierre Jolivet   Level: intermediate
4152ad7e164aSPierre Jolivet 
415311a5261eSBarry Smith   Note:
415411a5261eSBarry Smith   `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`.
4155ad7e164aSPierre Jolivet 
41561cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4157ad7e164aSPierre Jolivet @*/
4158d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4159d71ae5a4SJacob Faibussowitsch {
4160ad7e164aSPierre Jolivet   PetscFunctionBegin;
4161ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4162ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4163ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4164ad7e164aSPierre Jolivet   PetscValidType(B, 2);
41654f572ea9SToby Isaac   PetscAssertPointer(C, 4);
4166ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4167ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4168ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4169ad7e164aSPierre Jolivet   }
4170cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
41713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4172ad7e164aSPierre Jolivet }
4173ad7e164aSPierre Jolivet 
4174*ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4175d71ae5a4SJacob Faibussowitsch {
4176ad7e164aSPierre Jolivet   Mat                newmat;
4177ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4178ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4179ad7e164aSPierre Jolivet   PetscScalar       *v;
4180fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4181ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4182ad7e164aSPierre Jolivet   PetscBool          flg;
4183ad7e164aSPierre Jolivet 
4184ad7e164aSPierre Jolivet   PetscFunctionBegin;
418528b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
418628b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
418728b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
418828b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
41899566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
419028b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4191aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4192ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
41939566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
41949566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
41959566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
41969566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4197ad7e164aSPierre Jolivet     i[0] = 0;
4198ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4199ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4200ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4201ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4202ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4203ad7e164aSPierre Jolivet         }
4204ad7e164aSPierre Jolivet       }
4205ad7e164aSPierre Jolivet     }
42069566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4207ad7e164aSPierre Jolivet     *C = newmat;
42089566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4209ad7e164aSPierre Jolivet     nnz = 0;
4210ad7e164aSPierre Jolivet   }
42119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
42129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
42139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4214ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4215ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4216ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4217ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4218ad7e164aSPierre Jolivet       }
4219ad7e164aSPierre Jolivet     }
4220ad7e164aSPierre Jolivet   }
42219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
42229566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
42239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
42243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4225ad7e164aSPierre Jolivet }
4226ad7e164aSPierre Jolivet 
4227c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4228af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4229170fe5c8SBarry Smith 
4230170fe5c8SBarry Smith /*
4231170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4232170fe5c8SBarry Smith 
4233170fe5c8SBarry Smith                n                       p                          p
42342da392ccSBarry Smith         [             ]       [             ]         [                 ]
42352da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
42362da392ccSBarry Smith         [             ]       [             ]         [                 ]
4237170fe5c8SBarry Smith 
4238170fe5c8SBarry Smith */
4239d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4240d71ae5a4SJacob Faibussowitsch {
4241170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4242170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4243170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
424486214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4245170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4246170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4247170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
424886214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
424986214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4250170fe5c8SBarry Smith 
4251170fe5c8SBarry Smith   PetscFunctionBegin;
4252d0f46423SBarry Smith   m = A->rmap->n;
4253d0f46423SBarry Smith   n = A->cmap->n;
4254d0f46423SBarry Smith   p = B->cmap->n;
4255170fe5c8SBarry Smith   a = sub_a->v;
4256170fe5c8SBarry Smith   b = sub_b->a;
4257170fe5c8SBarry Smith   c = sub_c->v;
425886214ceeSStefano Zampini   if (clda == m) {
42599566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
426086214ceeSStefano Zampini   } else {
426186214ceeSStefano Zampini     for (j = 0; j < p; j++)
42629371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
426386214ceeSStefano Zampini   }
4264170fe5c8SBarry Smith   ii  = sub_b->i;
4265170fe5c8SBarry Smith   idx = sub_b->j;
4266170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4267170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4268170fe5c8SBarry Smith     while (q-- > 0) {
426986214ceeSStefano Zampini       c_q = c + clda * (*idx);
427086214ceeSStefano Zampini       a_q = a + alda * i;
4271854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4272170fe5c8SBarry Smith       idx++;
4273170fe5c8SBarry Smith       b++;
4274170fe5c8SBarry Smith     }
4275170fe5c8SBarry Smith   }
42763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4277170fe5c8SBarry Smith }
4278170fe5c8SBarry Smith 
4279d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4280d71ae5a4SJacob Faibussowitsch {
4281d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
428286214ceeSStefano Zampini   PetscBool cisdense;
4283170fe5c8SBarry Smith 
4284170fe5c8SBarry Smith   PetscFunctionBegin;
428508401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
42869566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
42879566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
4288d5e393b6SSuyash Tandon   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, ""));
428948a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
42909566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4291d73949e8SHong Zhang 
42924222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
42933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4294170fe5c8SBarry Smith }
4295170fe5c8SBarry Smith 
42960bad9183SKris Buschelman /*MC
4297fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
42980bad9183SKris Buschelman    based on compressed sparse row format.
42990bad9183SKris Buschelman 
43002ef1f0ffSBarry Smith    Options Database Key:
43010bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
43020bad9183SKris Buschelman 
43030bad9183SKris Buschelman    Level: beginner
43040bad9183SKris Buschelman 
43050cd7f59aSBarry Smith    Notes:
43062ef1f0ffSBarry Smith     `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values,
43070cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
43080cd7f59aSBarry Smith     in the matrix
43090cd7f59aSBarry Smith 
    `MatSetOption(A, MAT_STRUCTURE_ONLY, PETSC_TRUE)` may be called for this matrix type. In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored
43120cd7f59aSBarry Smith 
431311a5261eSBarry Smith   Developer Note:
43142ef1f0ffSBarry Smith     It would be nice if all matrix formats supported passing `NULL` in for the numerical values
43150cd7f59aSBarry Smith 
43161cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
43170bad9183SKris Buschelman M*/
43180bad9183SKris Buschelman 
4319ccd284c7SBarry Smith /*MC
4320ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4321ccd284c7SBarry Smith 
432211a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
432311a5261eSBarry Smith    and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
432411a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4325ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4326ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4327ccd284c7SBarry Smith 
43282ef1f0ffSBarry Smith    Options Database Key:
432911a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`
4330ccd284c7SBarry Smith 
43312ef1f0ffSBarry Smith   Level: beginner
43322ef1f0ffSBarry Smith 
433311a5261eSBarry Smith    Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`. This matrix type also automatically switches over to using inodes when
   enough exist.
4336ccd284c7SBarry Smith 
43371cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
4338ccd284c7SBarry Smith M*/
4339ccd284c7SBarry Smith 
4340ccd284c7SBarry Smith /*MC
4341ccd284c7SBarry Smith    MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.
4342ccd284c7SBarry Smith 
43432ef1f0ffSBarry Smith    Options Database Key:
43442ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`
43452ef1f0ffSBarry Smith 
43462ef1f0ffSBarry Smith   Level: beginner
43472ef1f0ffSBarry Smith 
43482ef1f0ffSBarry Smith    Note:
434911a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
435011a5261eSBarry Smith    and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
435111a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4352ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4353ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4354ccd284c7SBarry Smith 
.seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
4356ccd284c7SBarry Smith M*/
4357ccd284c7SBarry Smith 
43587906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
43597906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
43607906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
43617906f579SHong Zhang #endif
4362d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
4363d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4364d24d4204SJose E. Roman #endif
43657906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
43667906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
43677906f579SHong Zhang #endif
43687906f579SHong Zhang 
4369d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4370c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
43714222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
43727906f579SHong Zhang 
43738c778c55SBarry Smith /*@C
437411a5261eSBarry Smith   MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
43758c778c55SBarry Smith 
43768c778c55SBarry Smith   Not Collective
43778c778c55SBarry Smith 
43788c778c55SBarry Smith   Input Parameter:
4379fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
43808c778c55SBarry Smith 
43818c778c55SBarry Smith   Output Parameter:
43828c778c55SBarry Smith . array - pointer to the data
43838c778c55SBarry Smith 
43848c778c55SBarry Smith   Level: intermediate
43858c778c55SBarry Smith 
4386fe59aa6dSJacob Faibussowitsch   Fortran Notes:
43870ab4885dSBarry Smith   `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()`
43880ab4885dSBarry Smith 
43891cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
43908c778c55SBarry Smith @*/
4391d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array)
4392d71ae5a4SJacob Faibussowitsch {
4393d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
43948c778c55SBarry Smith 
43958c778c55SBarry Smith   PetscFunctionBegin;
4396d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
43979566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4398d67d9f35SJunchao Zhang   } else {
4399d67d9f35SJunchao Zhang     *array = aij->a;
4400d67d9f35SJunchao Zhang   }
44013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4402d67d9f35SJunchao Zhang }
4403d67d9f35SJunchao Zhang 
4404d67d9f35SJunchao Zhang /*@C
440511a5261eSBarry Smith   MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4406d67d9f35SJunchao Zhang 
4407d67d9f35SJunchao Zhang   Not Collective
4408d67d9f35SJunchao Zhang 
4409d67d9f35SJunchao Zhang   Input Parameters:
4410fe59aa6dSJacob Faibussowitsch + A     - a `MATSEQAIJ` matrix
4411d67d9f35SJunchao Zhang - array - pointer to the data
4412d67d9f35SJunchao Zhang 
4413d67d9f35SJunchao Zhang   Level: intermediate
4414d67d9f35SJunchao Zhang 
4415fe59aa6dSJacob Faibussowitsch   Fortran Notes:
44160ab4885dSBarry Smith   `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()`
44170ab4885dSBarry Smith 
44181cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()`
4419d67d9f35SJunchao Zhang @*/
4420d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array)
4421d71ae5a4SJacob Faibussowitsch {
4422d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4423d67d9f35SJunchao Zhang 
4424d67d9f35SJunchao Zhang   PetscFunctionBegin;
4425d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
44269566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4427d67d9f35SJunchao Zhang   } else {
4428d67d9f35SJunchao Zhang     *array = NULL;
4429d67d9f35SJunchao Zhang   }
44309566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
44319566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
44323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44338c778c55SBarry Smith }
44348c778c55SBarry Smith 
443521e72a00SBarry Smith /*@C
443611a5261eSBarry Smith   MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
44378f1ea47aSStefano Zampini 
44380ab4885dSBarry Smith   Not Collective; No Fortran Support
44398f1ea47aSStefano Zampini 
44408f1ea47aSStefano Zampini   Input Parameter:
4441fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44428f1ea47aSStefano Zampini 
44438f1ea47aSStefano Zampini   Output Parameter:
44448f1ea47aSStefano Zampini . array - pointer to the data
44458f1ea47aSStefano Zampini 
44468f1ea47aSStefano Zampini   Level: intermediate
44478f1ea47aSStefano Zampini 
44481cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
44498f1ea47aSStefano Zampini @*/
4450d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array)
4451d71ae5a4SJacob Faibussowitsch {
4452d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44538f1ea47aSStefano Zampini 
44548f1ea47aSStefano Zampini   PetscFunctionBegin;
4455d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
44569566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4457d67d9f35SJunchao Zhang   } else {
4458d67d9f35SJunchao Zhang     *array = aij->a;
4459d67d9f35SJunchao Zhang   }
44603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44618f1ea47aSStefano Zampini }
44628f1ea47aSStefano Zampini 
44638f1ea47aSStefano Zampini /*@C
446411a5261eSBarry Smith   MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
44658f1ea47aSStefano Zampini 
44660ab4885dSBarry Smith   Not Collective; No Fortran Support
44678f1ea47aSStefano Zampini 
44688f1ea47aSStefano Zampini   Input Parameter:
4469fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44708f1ea47aSStefano Zampini 
44718f1ea47aSStefano Zampini   Output Parameter:
44728f1ea47aSStefano Zampini . array - pointer to the data
44738f1ea47aSStefano Zampini 
44748f1ea47aSStefano Zampini   Level: intermediate
44758f1ea47aSStefano Zampini 
44761cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
44778f1ea47aSStefano Zampini @*/
4478d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array)
4479d71ae5a4SJacob Faibussowitsch {
4480d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44818f1ea47aSStefano Zampini 
44828f1ea47aSStefano Zampini   PetscFunctionBegin;
4483d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
44849566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4485d67d9f35SJunchao Zhang   } else {
4486d67d9f35SJunchao Zhang     *array = NULL;
4487d67d9f35SJunchao Zhang   }
44883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4489d67d9f35SJunchao Zhang }
4490d67d9f35SJunchao Zhang 
4491d67d9f35SJunchao Zhang /*@C
449211a5261eSBarry Smith   MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4493d67d9f35SJunchao Zhang 
44940ab4885dSBarry Smith   Not Collective; No Fortran Support
4495d67d9f35SJunchao Zhang 
4496d67d9f35SJunchao Zhang   Input Parameter:
4497fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
4498d67d9f35SJunchao Zhang 
4499d67d9f35SJunchao Zhang   Output Parameter:
4500d67d9f35SJunchao Zhang . array - pointer to the data
4501d67d9f35SJunchao Zhang 
4502d67d9f35SJunchao Zhang   Level: intermediate
4503d67d9f35SJunchao Zhang 
45041cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
4505d67d9f35SJunchao Zhang @*/
4506d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array)
4507d71ae5a4SJacob Faibussowitsch {
4508d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4509d67d9f35SJunchao Zhang 
4510d67d9f35SJunchao Zhang   PetscFunctionBegin;
4511d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
45129566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4513d67d9f35SJunchao Zhang   } else {
4514d67d9f35SJunchao Zhang     *array = aij->a;
4515d67d9f35SJunchao Zhang   }
45169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
45179566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
45183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4519d67d9f35SJunchao Zhang }
4520d67d9f35SJunchao Zhang 
4521d67d9f35SJunchao Zhang /*@C
4522d67d9f35SJunchao Zhang   MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead
4523d67d9f35SJunchao Zhang 
45240ab4885dSBarry Smith   Not Collective; No Fortran Support
4525d67d9f35SJunchao Zhang 
4526d67d9f35SJunchao Zhang   Input Parameter:
4527fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix
4528d67d9f35SJunchao Zhang 
4529d67d9f35SJunchao Zhang   Output Parameter:
4530d67d9f35SJunchao Zhang . array - pointer to the data
4531d67d9f35SJunchao Zhang 
4532d67d9f35SJunchao Zhang   Level: intermediate
4533d67d9f35SJunchao Zhang 
45341cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
4535d67d9f35SJunchao Zhang @*/
4536d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array)
4537d71ae5a4SJacob Faibussowitsch {
4538d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4539d67d9f35SJunchao Zhang 
4540d67d9f35SJunchao Zhang   PetscFunctionBegin;
4541d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
45429566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4543d67d9f35SJunchao Zhang   } else {
4544d67d9f35SJunchao Zhang     *array = NULL;
4545d67d9f35SJunchao Zhang   }
45463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45478f1ea47aSStefano Zampini }
45488f1ea47aSStefano Zampini 
45498f1ea47aSStefano Zampini /*@C
455011a5261eSBarry Smith   MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
45517ee59b9bSJunchao Zhang 
45520ab4885dSBarry Smith   Not Collective; No Fortran Support
45537ee59b9bSJunchao Zhang 
45547ee59b9bSJunchao Zhang   Input Parameter:
455511a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses
45567ee59b9bSJunchao Zhang 
45577ee59b9bSJunchao Zhang   Output Parameters:
45587ee59b9bSJunchao Zhang + i     - row map array of the matrix
45597ee59b9bSJunchao Zhang . j     - column index array of the matrix
45607ee59b9bSJunchao Zhang . a     - data array of the matrix
4561fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays
45627ee59b9bSJunchao Zhang 
4563fe59aa6dSJacob Faibussowitsch   Level: developer
45642ef1f0ffSBarry Smith 
45657ee59b9bSJunchao Zhang   Notes:
45662ef1f0ffSBarry Smith   Any of the output parameters can be `NULL`, in which case the corresponding value is not returned.
45677ee59b9bSJunchao Zhang   If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
45687ee59b9bSJunchao Zhang 
45697ee59b9bSJunchao Zhang   One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
45702ef1f0ffSBarry Smith   If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix.
45717ee59b9bSJunchao Zhang 
45721cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45737ee59b9bSJunchao Zhang @*/
4574d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype)
4575d71ae5a4SJacob Faibussowitsch {
45767ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
45777ee59b9bSJunchao Zhang 
45787ee59b9bSJunchao Zhang   PetscFunctionBegin;
45797ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
45807ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
45817ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
45827ee59b9bSJunchao Zhang   } else {
45837ee59b9bSJunchao Zhang     if (i) *i = aij->i;
45847ee59b9bSJunchao Zhang     if (j) *j = aij->j;
45857ee59b9bSJunchao Zhang     if (a) *a = aij->a;
45867ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
45877ee59b9bSJunchao Zhang   }
45883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45897ee59b9bSJunchao Zhang }
45907ee59b9bSJunchao Zhang 
45917ee59b9bSJunchao Zhang /*@C
459221e72a00SBarry Smith   MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
459321e72a00SBarry Smith 
459421e72a00SBarry Smith   Not Collective
459521e72a00SBarry Smith 
459621e72a00SBarry Smith   Input Parameter:
4597fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
459821e72a00SBarry Smith 
459921e72a00SBarry Smith   Output Parameter:
460021e72a00SBarry Smith . nz - the maximum number of nonzeros in any row
460121e72a00SBarry Smith 
460221e72a00SBarry Smith   Level: intermediate
460321e72a00SBarry Smith 
46041cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
460521e72a00SBarry Smith @*/
4606d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4607d71ae5a4SJacob Faibussowitsch {
460821e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
460921e72a00SBarry Smith 
461021e72a00SBarry Smith   PetscFunctionBegin;
461121e72a00SBarry Smith   *nz = aij->rmax;
46123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
461321e72a00SBarry Smith }
461421e72a00SBarry Smith 
46152c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data)
46162c4ab24aSJunchao Zhang {
46172c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data;
46182c4ab24aSJunchao Zhang   PetscFunctionBegin;
46192c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->perm));
46202c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->jmap));
46212c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo));
46222c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
46232c4ab24aSJunchao Zhang }
46242c4ab24aSJunchao Zhang 
4625d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4626d71ae5a4SJacob Faibussowitsch {
4627394ed5ebSJunchao Zhang   MPI_Comm             comm;
4628394ed5ebSJunchao Zhang   PetscInt            *i, *j;
4629394ed5ebSJunchao Zhang   PetscInt             M, N, row;
4630394ed5ebSJunchao Zhang   PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4631394ed5ebSJunchao Zhang   PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
4632394ed5ebSJunchao Zhang   PetscInt            *Aj;
4633394ed5ebSJunchao Zhang   PetscScalar         *Aa;
4634cbc6b225SStefano Zampini   Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)(mat->data);
4635cbc6b225SStefano Zampini   MatType              rtype;
4636394ed5ebSJunchao Zhang   PetscCount          *perm, *jmap;
46372c4ab24aSJunchao Zhang   PetscContainer       container;
46382c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4639394ed5ebSJunchao Zhang 
4640394ed5ebSJunchao Zhang   PetscFunctionBegin;
46419566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
46429566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4643e8729f6fSJunchao Zhang   i = coo_i;
4644e8729f6fSJunchao Zhang   j = coo_j;
46459566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
4646394ed5ebSJunchao Zhang   for (k = 0; k < coo_n; k++) { /* Ignore entries with negative row or col indices */
4647394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
4648394ed5ebSJunchao Zhang     perm[k] = k;
4649394ed5ebSJunchao Zhang   }
4650394ed5ebSJunchao Zhang 
4651394ed5ebSJunchao Zhang   /* Sort by row */
46529566063dSJacob Faibussowitsch   PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
4653651b1cf9SStefano Zampini 
4654651b1cf9SStefano Zampini   /* Advance k to the first row with a non-negative index */
4655651b1cf9SStefano Zampini   for (k = 0; k < coo_n; k++)
46569371c9d4SSatish Balay     if (i[k] >= 0) break;
4657394ed5ebSJunchao Zhang   nneg = k;
46589566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4659394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
466035cb6cd3SPierre Jolivet   jmap++;                                           /* Inc jmap by 1 for convenience */
4661394ed5ebSJunchao Zhang 
46629566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(M + 1, &Ai));        /* CSR of A */
46639566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */
4664394ed5ebSJunchao Zhang 
4665651b1cf9SStefano Zampini   /* Support for HYPRE */
4666651b1cf9SStefano Zampini   PetscBool   hypre;
4667651b1cf9SStefano Zampini   const char *name;
4668651b1cf9SStefano Zampini   PetscCall(PetscObjectGetName((PetscObject)mat, &name));
4669651b1cf9SStefano Zampini   PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre));
4670651b1cf9SStefano Zampini 
4671394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
467235cb6cd3SPierre Jolivet   Ai++;  /* Inc by 1 for convenience */
4673394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4674394ed5ebSJunchao Zhang   while (k < coo_n) {
4675394ed5ebSJunchao Zhang     row   = i[k];
4676394ed5ebSJunchao Zhang     start = k; /* [start,end) indices for this row */
4677394ed5ebSJunchao Zhang     while (k < coo_n && i[k] == row) k++;
4678394ed5ebSJunchao Zhang     end = k;
4679651b1cf9SStefano Zampini     /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
4680651b1cf9SStefano Zampini     if (hypre) {
4681651b1cf9SStefano Zampini       PetscInt  minj    = PETSC_MAX_INT;
4682651b1cf9SStefano Zampini       PetscBool hasdiag = PETSC_FALSE;
4683651b1cf9SStefano Zampini       for (p = start; p < end; p++) {
4684651b1cf9SStefano Zampini         hasdiag = (PetscBool)(hasdiag || (j[p] == row));
4685651b1cf9SStefano Zampini         minj    = PetscMin(minj, j[p]);
4686651b1cf9SStefano Zampini       }
4687651b1cf9SStefano Zampini       if (hasdiag) {
4688651b1cf9SStefano Zampini         for (p = start; p < end; p++) {
4689651b1cf9SStefano Zampini           if (j[p] == minj) j[p] = row;
4690651b1cf9SStefano Zampini           else if (j[p] == row) j[p] = minj;
4691651b1cf9SStefano Zampini         }
4692651b1cf9SStefano Zampini       }
4693651b1cf9SStefano Zampini     }
46949566063dSJacob Faibussowitsch     PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
4695651b1cf9SStefano Zampini 
4696394ed5ebSJunchao Zhang     /* Find number of unique col entries in this row */
4697394ed5ebSJunchao Zhang     Aj[q]   = j[start]; /* Log the first nonzero in this row */
4698651b1cf9SStefano Zampini     jmap[q] = 1;        /* Number of repeats of this nonzero entry */
4699394ed5ebSJunchao Zhang     Ai[row] = 1;
4700394ed5ebSJunchao Zhang     nnz++;
4701394ed5ebSJunchao Zhang 
4702394ed5ebSJunchao Zhang     for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4703394ed5ebSJunchao Zhang       if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4704394ed5ebSJunchao Zhang         q++;
4705394ed5ebSJunchao Zhang         jmap[q] = 1;
4706394ed5ebSJunchao Zhang         Aj[q]   = j[p];
4707394ed5ebSJunchao Zhang         Ai[row]++;
4708394ed5ebSJunchao Zhang         nnz++;
4709394ed5ebSJunchao Zhang       } else {
4710394ed5ebSJunchao Zhang         jmap[q]++;
4711394ed5ebSJunchao Zhang       }
4712394ed5ebSJunchao Zhang     }
4713394ed5ebSJunchao Zhang     q++; /* Move to next row and thus next unique nonzero */
4714394ed5ebSJunchao Zhang   }
4715394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4716394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
4717394ed5ebSJunchao Zhang   jmap--; /* Back to the beginning of jmap[] */
4718394ed5ebSJunchao Zhang   jmap[0] = 0;
4719394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
4720394ed5ebSJunchao Zhang   if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */
4721394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4722394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4723394ed5ebSJunchao Zhang 
47249566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
47259566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
47269566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4727394ed5ebSJunchao Zhang     jmap = jmap_new;
4728394ed5ebSJunchao Zhang 
47299566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz, &Aj_new));
47309566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
47319566063dSJacob Faibussowitsch     PetscCall(PetscFree(Aj));
4732394ed5ebSJunchao Zhang     Aj = Aj_new;
4733394ed5ebSJunchao Zhang   }
4734394ed5ebSJunchao Zhang 
4735394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4736394ed5ebSJunchao Zhang     PetscCount *perm_new;
4737cbc6b225SStefano Zampini 
47389566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
47399566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
47409566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4741394ed5ebSJunchao Zhang     perm = perm_new;
4742394ed5ebSJunchao Zhang   }
4743394ed5ebSJunchao Zhang 
47449566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
47459566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */
47469566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4747394ed5ebSJunchao Zhang 
4748394ed5ebSJunchao Zhang   seqaij->singlemalloc = PETSC_FALSE;            /* Ai, Aj and Aa are not allocated in one big malloc */
4749394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
47502c4ab24aSJunchao Zhang 
47512c4ab24aSJunchao Zhang   // Put the COO struct in a container and then attach that to the matrix
47522c4ab24aSJunchao Zhang   PetscCall(PetscMalloc1(1, &coo));
47532c4ab24aSJunchao Zhang   coo->nz   = nnz;
47542c4ab24aSJunchao Zhang   coo->n    = coo_n;
47552c4ab24aSJunchao Zhang   coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
47562c4ab24aSJunchao Zhang   coo->jmap = jmap;         // of length nnz+1
47572c4ab24aSJunchao Zhang   coo->perm = perm;
47582c4ab24aSJunchao Zhang   PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container));
47592c4ab24aSJunchao Zhang   PetscCall(PetscContainerSetPointer(container, coo));
47602c4ab24aSJunchao Zhang   PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ));
47612c4ab24aSJunchao Zhang   PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container));
47622c4ab24aSJunchao Zhang   PetscCall(PetscContainerDestroy(&container));
47633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4764394ed5ebSJunchao Zhang }
4765394ed5ebSJunchao Zhang 
4766d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4767d71ae5a4SJacob Faibussowitsch {
4768394ed5ebSJunchao Zhang   Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
4769394ed5ebSJunchao Zhang   PetscCount           i, j, Annz = aseq->nz;
47702c4ab24aSJunchao Zhang   PetscCount          *perm, *jmap;
4771394ed5ebSJunchao Zhang   PetscScalar         *Aa;
47722c4ab24aSJunchao Zhang   PetscContainer       container;
47732c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4774394ed5ebSJunchao Zhang 
4775394ed5ebSJunchao Zhang   PetscFunctionBegin;
47762c4ab24aSJunchao Zhang   PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
47772c4ab24aSJunchao Zhang   PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
47782c4ab24aSJunchao Zhang   PetscCall(PetscContainerGetPointer(container, (void **)&coo));
47792c4ab24aSJunchao Zhang   perm = coo->perm;
47802c4ab24aSJunchao Zhang   jmap = coo->jmap;
47819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4782394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4783b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4784b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4785b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4786394ed5ebSJunchao Zhang   }
47879566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
47883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4789394ed5ebSJunchao Zhang }
4790394ed5ebSJunchao Zhang 
/* Forward declarations of conversion routines registered in MatCreate_SeqAIJ(); each is visible only when the matching package is configured */
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat A, MatType newtype, MatReuse reuse, Mat *newmat);
#endif
#if defined(PETSC_HAVE_HIP)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat A, MatType newtype, MatReuse reuse, Mat *newmat);
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat A, MatType newtype, MatReuse reuse, Mat *newmat);
#endif
480002fe1965SBarry Smith 
4801d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4802d71ae5a4SJacob Faibussowitsch {
4803273d9f13SBarry Smith   Mat_SeqAIJ *b;
480438baddfdSBarry Smith   PetscMPIInt size;
4805273d9f13SBarry Smith 
4806273d9f13SBarry Smith   PetscFunctionBegin;
48079566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
480808401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4809273d9f13SBarry Smith 
48104dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
48112205254eSKarl Rupp 
4812b0a32e0cSBarry Smith   B->data   = (void *)b;
4813aea10558SJacob Faibussowitsch   B->ops[0] = MatOps_Values;
4814071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
48152205254eSKarl Rupp 
4816f4259b30SLisandro Dalcin   b->row                = NULL;
4817f4259b30SLisandro Dalcin   b->col                = NULL;
4818f4259b30SLisandro Dalcin   b->icol               = NULL;
4819b810aeb4SBarry Smith   b->reallocs           = 0;
482036db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4821f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4822416022c9SBarry Smith   b->nonew              = 0;
4823f4259b30SLisandro Dalcin   b->diag               = NULL;
4824f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4825f4259b30SLisandro Dalcin   B->spptr              = NULL;
4826f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4827f4259b30SLisandro Dalcin   b->idiag              = NULL;
4828f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4829f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
483071f1c65dSBarry Smith   b->omega              = 1.0;
483171f1c65dSBarry Smith   b->fshift             = 0.0;
483271f1c65dSBarry Smith   b->idiagvalid         = PETSC_FALSE;
4833bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4834a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
483517ab2063SBarry Smith 
48369566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4837d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
48389566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
48399566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4840b3866ffcSBarry Smith #endif
48419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
48429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
48439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
48449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
48459566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
48469566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
48479566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
48489779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
48499566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4850191b95cbSRichard Tran Mills #endif
485134b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
48529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
48539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
48549566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
485502fe1965SBarry Smith #endif
4856d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4857d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
4858d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
4859d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
4860d5e393b6SSuyash Tandon #endif
48613d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
48629566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
48633d0639e7SStefano Zampini #endif
48649566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4865af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
48669566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4867af8000cdSHong Zhang #endif
4868d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
48699566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4870d24d4204SJose E. Roman #endif
487163c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
48729566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
48739566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
487463c07aadSStefano Zampini #endif
48759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
48769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
48779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
48789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
48799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ));
48809566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
48819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
48829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
48839566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
48849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
48859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
48869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
48879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
48889566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
48899566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
48909566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
48919566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
48929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
48933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
489417ab2063SBarry Smith }
489517ab2063SBarry Smith 
4896b24902e0SBarry Smith /*
48973893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4898b24902e0SBarry Smith */
4899d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4900d71ae5a4SJacob Faibussowitsch {
49012a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4902071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
490317ab2063SBarry Smith 
49043a40ed3dSBarry Smith   PetscFunctionBegin;
4905aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4906273d9f13SBarry Smith 
4907d5f3da31SBarry Smith   C->factortype = A->factortype;
4908f4259b30SLisandro Dalcin   c->row        = NULL;
4909f4259b30SLisandro Dalcin   c->col        = NULL;
4910f4259b30SLisandro Dalcin   c->icol       = NULL;
49116ad4291fSHong Zhang   c->reallocs   = 0;
491217ab2063SBarry Smith 
491369272f91SPierre Jolivet   C->assembled = A->assembled;
491417ab2063SBarry Smith 
491569272f91SPierre Jolivet   if (A->preallocated) {
49169566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
49179566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4918eec197d1SBarry Smith 
491931fe6a7dSBarry Smith     if (!A->hash_active) {
49209566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->imax));
49219566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
49229566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->ilen));
49239566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));
492417ab2063SBarry Smith 
492517ab2063SBarry Smith       /* allocate the matrix space */
4926f77e22a1SHong Zhang       if (mallocmatspace) {
49279566063dSJacob Faibussowitsch         PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i));
49282205254eSKarl Rupp 
4929f1e2ffcdSBarry Smith         c->singlemalloc = PETSC_TRUE;
49302205254eSKarl Rupp 
49319566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->i, a->i, m + 1));
493217ab2063SBarry Smith         if (m > 0) {
49339566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
4934be6bf707SBarry Smith           if (cpvalues == MAT_COPY_VALUES) {
49352e5835c6SStefano Zampini             const PetscScalar *aa;
49362e5835c6SStefano Zampini 
49379566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
49389566063dSJacob Faibussowitsch             PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
49399566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
4940be6bf707SBarry Smith           } else {
49419566063dSJacob Faibussowitsch             PetscCall(PetscArrayzero(c->a, a->i[m]));
494217ab2063SBarry Smith           }
494308480c60SBarry Smith         }
4944f77e22a1SHong Zhang       }
494531fe6a7dSBarry Smith       C->preallocated = PETSC_TRUE;
494631fe6a7dSBarry Smith     } else {
494731fe6a7dSBarry Smith       PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix");
494831fe6a7dSBarry Smith       PetscCall(MatSetUp(C));
494931fe6a7dSBarry Smith     }
495017ab2063SBarry Smith 
49516ad4291fSHong Zhang     c->ignorezeroentries = a->ignorezeroentries;
4952416022c9SBarry Smith     c->roworiented       = a->roworiented;
4953416022c9SBarry Smith     c->nonew             = a->nonew;
4954416022c9SBarry Smith     if (a->diag) {
49559566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &c->diag));
49569566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt)));
4957071fcb05SBarry Smith     } else c->diag = NULL;
49582205254eSKarl Rupp 
4959f4259b30SLisandro Dalcin     c->solve_work         = NULL;
4960f4259b30SLisandro Dalcin     c->saved_values       = NULL;
4961f4259b30SLisandro Dalcin     c->idiag              = NULL;
4962f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
4963a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
4964e6b907acSBarry Smith     c->free_a             = PETSC_TRUE;
4965e6b907acSBarry Smith     c->free_ij            = PETSC_TRUE;
49666ad4291fSHong Zhang 
4967893ad86cSHong Zhang     c->rmax  = a->rmax;
4968416022c9SBarry Smith     c->nz    = a->nz;
49698ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
4970754ec7b1SSatish Balay 
49716ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
49726ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
4973cd6b891eSBarry Smith     if (a->compressedrow.use) {
49746ad4291fSHong Zhang       i = a->compressedrow.nrows;
49759566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
49769566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
49779566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
497827ea64f8SHong Zhang     } else {
497927ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
49800298fd71SBarry Smith       c->compressedrow.i      = NULL;
49810298fd71SBarry Smith       c->compressedrow.rindex = NULL;
49826ad4291fSHong Zhang     }
4983ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
4984e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
49854846f1f5SKris Buschelman 
49869566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
498769272f91SPierre Jolivet   }
49889566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
49893ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
499017ab2063SBarry Smith }
499117ab2063SBarry Smith 
4992d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
4993d71ae5a4SJacob Faibussowitsch {
4994b24902e0SBarry Smith   PetscFunctionBegin;
49959566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
49969566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
499748a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
49989566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
49999566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
50003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5001b24902e0SBarry Smith }
5002b24902e0SBarry Smith 
5003d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
5004d71ae5a4SJacob Faibussowitsch {
500552f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
500652f91c60SVaclav Hapla 
500752f91c60SVaclav Hapla   PetscFunctionBegin;
500852f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
500952f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
5010c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
50119566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
50129566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
50139566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
501452f91c60SVaclav Hapla   if (isbinary) {
50159566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
501652f91c60SVaclav Hapla   } else if (ishdf5) {
501752f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
50189566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
501952f91c60SVaclav Hapla #else
502052f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
502152f91c60SVaclav Hapla #endif
502252f91c60SVaclav Hapla   } else {
502398921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
502452f91c60SVaclav Hapla   }
50253ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
502652f91c60SVaclav Hapla }
502752f91c60SVaclav Hapla 
5028d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
5029d71ae5a4SJacob Faibussowitsch {
50303ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
50313ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
5032fbdbba38SShri Abhyankar 
5033fbdbba38SShri Abhyankar   PetscFunctionBegin;
50349566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
5035bbead8a2SBarry Smith 
50363ea6fe3dSLisandro Dalcin   /* read in matrix header */
50379566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
503808401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
50399371c9d4SSatish Balay   M  = header[1];
50409371c9d4SSatish Balay   N  = header[2];
50419371c9d4SSatish Balay   nz = header[3];
504208401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
504308401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
504408401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
5045fbdbba38SShri Abhyankar 
50463ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
50479566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
50483ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
50493ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
50503ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
50513ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
50523ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
50539566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
50549566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
50553ea6fe3dSLisandro Dalcin 
50563ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
50579566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5058aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
50593ea6fe3dSLisandro Dalcin 
5060fbdbba38SShri Abhyankar   /* read in row lengths */
50619566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
50629566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
50633ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
50649371c9d4SSatish Balay   sum = 0;
50659371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
506608401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
50673ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
50689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
50699566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5070aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
50713ea6fe3dSLisandro Dalcin   /* store row lengths */
50729566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
50739566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
5074fbdbba38SShri Abhyankar 
50753ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
50769371c9d4SSatish Balay   a->i[0] = 0;
50779371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
50783ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
50799566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
50803ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
50819566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
5082fbdbba38SShri Abhyankar 
50839566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
50849566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
50853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5086fbdbba38SShri Abhyankar }
5087fbdbba38SShri Abhyankar 
5088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
5089d71ae5a4SJacob Faibussowitsch {
50907264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
5091fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
5092eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5093eeffb40dSHong Zhang   PetscInt k;
5094eeffb40dSHong Zhang #endif
50957264ac53SSatish Balay 
50963a40ed3dSBarry Smith   PetscFunctionBegin;
5097bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
5098d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
5099ca44d042SBarry Smith     *flg = PETSC_FALSE;
51003ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
5101bcd2baecSBarry Smith   }
51027264ac53SSatish Balay 
51037264ac53SSatish Balay   /* if the a->i are the same */
51049566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
51053ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
51067264ac53SSatish Balay 
51077264ac53SSatish Balay   /* if a->j are the same */
51089566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
51093ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
5110bcd2baecSBarry Smith 
51119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
51129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5113bcd2baecSBarry Smith   /* if a->a are the same */
5114eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5115eeffb40dSHong Zhang   for (k = 0; k < a->nz; k++) {
5116fff043a9SJunchao Zhang     if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) {
5117eeffb40dSHong Zhang       *flg = PETSC_FALSE;
51183ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
5119eeffb40dSHong Zhang     }
5120eeffb40dSHong Zhang   }
5121eeffb40dSHong Zhang #else
51229566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
5123eeffb40dSHong Zhang #endif
51249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
51259566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
51263ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51277264ac53SSatish Balay }
512836db0b34SBarry Smith 
512905869f15SSatish Balay /*@
513011a5261eSBarry Smith   MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
513136db0b34SBarry Smith   provided by the user.
513236db0b34SBarry Smith 
5133d083f849SBarry Smith   Collective
513436db0b34SBarry Smith 
513536db0b34SBarry Smith   Input Parameters:
513636db0b34SBarry Smith + comm - must be an MPI communicator of size 1
513736db0b34SBarry Smith . m    - number of rows
513836db0b34SBarry Smith . n    - number of columns
5139483a2f95SBarry Smith . i    - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
514036db0b34SBarry Smith . j    - column indices
514136db0b34SBarry Smith - a    - matrix values
514236db0b34SBarry Smith 
514336db0b34SBarry Smith   Output Parameter:
514436db0b34SBarry Smith . mat - the matrix
514536db0b34SBarry Smith 
514636db0b34SBarry Smith   Level: intermediate
514736db0b34SBarry Smith 
514836db0b34SBarry Smith   Notes:
51492ef1f0ffSBarry Smith   The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
5150292fb18eSBarry Smith   once the matrix is destroyed and not before
515136db0b34SBarry Smith 
515236db0b34SBarry Smith   You cannot set new nonzero locations into this matrix, that will generate an error.
515336db0b34SBarry Smith 
51542ef1f0ffSBarry Smith   The `i` and `j` indices are 0 based
515536db0b34SBarry Smith 
5156a4552177SSatish Balay   The format which is used for the sparse matrix input, is equivalent to a
5157a4552177SSatish Balay   row-major ordering.. i.e for the following matrix, the input data expected is
51588eef79e4SBarry Smith   as shown
51592ef1f0ffSBarry Smith .vb
51602ef1f0ffSBarry Smith         1 0 0
51612ef1f0ffSBarry Smith         2 0 3
51622ef1f0ffSBarry Smith         4 5 6
5163a4552177SSatish Balay 
51642ef1f0ffSBarry Smith         i =  {0,1,3,6}  [size = nrow+1  = 3+1]
51652ef1f0ffSBarry Smith         j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
51662ef1f0ffSBarry Smith         v =  {1,2,3,4,5,6}  [size = 6]
51672ef1f0ffSBarry Smith .ve
5168a4552177SSatish Balay 
51691cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
517036db0b34SBarry Smith @*/
5171d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5172d71ae5a4SJacob Faibussowitsch {
5173cbcfb4deSHong Zhang   PetscInt    ii;
517436db0b34SBarry Smith   Mat_SeqAIJ *aij;
5175cbcfb4deSHong Zhang   PetscInt    jj;
517636db0b34SBarry Smith 
517736db0b34SBarry Smith   PetscFunctionBegin;
5178aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
51799566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
51809566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
51819566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
51829566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
51839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5184ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
51859566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
51869566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5187ab93d7beSBarry Smith 
518836db0b34SBarry Smith   aij->i            = i;
518936db0b34SBarry Smith   aij->j            = j;
519036db0b34SBarry Smith   aij->a            = a;
519136db0b34SBarry Smith   aij->singlemalloc = PETSC_FALSE;
519236db0b34SBarry Smith   aij->nonew        = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5193e6b907acSBarry Smith   aij->free_a       = PETSC_FALSE;
5194e6b907acSBarry Smith   aij->free_ij      = PETSC_FALSE;
519536db0b34SBarry Smith 
5196cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
519736db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
519876bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5199aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
52009985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
520108401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
520208401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
52039985e31cSBarry Smith       }
520436db0b34SBarry Smith     }
520576bd3646SJed Brown   }
520676bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
520736db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
520808401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5209aed4548fSBarry Smith       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
521036db0b34SBarry Smith     }
521176bd3646SJed Brown   }
521236db0b34SBarry Smith 
52139566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52149566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
521636db0b34SBarry Smith }
5217cbc6b225SStefano Zampini 
5218f62e3866SBarry Smith /*@
521911a5261eSBarry Smith   MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
52208a0b0e6bSVictor Minden   provided by the user.
52218a0b0e6bSVictor Minden 
5222d083f849SBarry Smith   Collective
52238a0b0e6bSVictor Minden 
52248a0b0e6bSVictor Minden   Input Parameters:
52258a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1
52268a0b0e6bSVictor Minden . m    - number of rows
52278a0b0e6bSVictor Minden . n    - number of columns
52288a0b0e6bSVictor Minden . i    - row indices
52298a0b0e6bSVictor Minden . j    - column indices
52301230e6d1SVictor Minden . a    - matrix values
52311230e6d1SVictor Minden . nz   - number of nonzeros
52322ef1f0ffSBarry Smith - idx  - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
52338a0b0e6bSVictor Minden 
52348a0b0e6bSVictor Minden   Output Parameter:
52358a0b0e6bSVictor Minden . mat - the matrix
52368a0b0e6bSVictor Minden 
52378a0b0e6bSVictor Minden   Level: intermediate
52388a0b0e6bSVictor Minden 
5239f62e3866SBarry Smith   Example:
5240f62e3866SBarry Smith   For the following matrix, the input data expected is as shown (using 0 based indexing)
52419e99939fSJunchao Zhang .vb
52428a0b0e6bSVictor Minden         1 0 0
52438a0b0e6bSVictor Minden         2 0 3
52448a0b0e6bSVictor Minden         4 5 6
52458a0b0e6bSVictor Minden 
52468a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
52478a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
52488a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
52499e99939fSJunchao Zhang .ve
5250fe59aa6dSJacob Faibussowitsch 
52512ef1f0ffSBarry Smith   Note:
5252d7547e51SJunchao Zhang   Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5253d7547e51SJunchao Zhang   and are particularly useful in iterative applications.
52548a0b0e6bSVictor Minden 
52551cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
52568a0b0e6bSVictor Minden @*/
5257d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx)
5258d71ae5a4SJacob Faibussowitsch {
5259d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
52608a0b0e6bSVictor Minden 
52618a0b0e6bSVictor Minden   PetscFunctionBegin;
52629566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5263ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
52649566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52659566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52669566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
52681230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
52691230e6d1SVictor Minden     if (idx) {
52701230e6d1SVictor Minden       row = i[ii] - 1;
52711230e6d1SVictor Minden       col = j[ii] - 1;
52721230e6d1SVictor Minden     } else {
52731230e6d1SVictor Minden       row = i[ii];
52741230e6d1SVictor Minden       col = j[ii];
52758a0b0e6bSVictor Minden     }
52769566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
52778a0b0e6bSVictor Minden   }
52789566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52799566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52809566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
52813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
52828a0b0e6bSVictor Minden }
528336db0b34SBarry Smith 
5284d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A)
5285d71ae5a4SJacob Faibussowitsch {
5286acf2f550SJed Brown   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
5287acf2f550SJed Brown 
5288acf2f550SJed Brown   PetscFunctionBegin;
5289acf2f550SJed Brown   a->idiagvalid  = PETSC_FALSE;
5290acf2f550SJed Brown   a->ibdiagvalid = PETSC_FALSE;
52912205254eSKarl Rupp 
52929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A));
52933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5294acf2f550SJed Brown }
5295acf2f550SJed Brown 
5296d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
5297d71ae5a4SJacob Faibussowitsch {
52989c8f2541SHong Zhang   PetscFunctionBegin;
52999566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
53003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53019c8f2541SHong Zhang }
53029c8f2541SHong Zhang 
530381824310SBarry Smith /*
530453dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
530553dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
530653dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
530753dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
530853dd7562SDmitry Karpeev  */
5309d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5310d71ae5a4SJacob Faibussowitsch {
531153dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
531253dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
531353dd7562SDmitry Karpeev   PetscBool       seqaij;
531453dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
531553dd7562SDmitry Karpeev   PetscScalar     v;
531653dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
531753dd7562SDmitry Karpeev 
531853dd7562SDmitry Karpeev   PetscFunctionBegin;
53193ba16761SJacob Faibussowitsch   if (!B) PetscFunctionReturn(PETSC_SUCCESS);
532053dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
53219566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
532228b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
532353dd7562SDmitry Karpeev   if (rowemb) {
53249566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
532508401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
532653dd7562SDmitry Karpeev   } else {
532708401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
532853dd7562SDmitry Karpeev   }
532953dd7562SDmitry Karpeev   if (colemb) {
53309566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
533108401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
533253dd7562SDmitry Karpeev   } else {
533308401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
533453dd7562SDmitry Karpeev   }
533553dd7562SDmitry Karpeev 
533653dd7562SDmitry Karpeev   Baij = (Mat_SeqAIJ *)(B->data);
533753dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
53389566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5339ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
53409566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
53419566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
534253dd7562SDmitry Karpeev   }
534348a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
534453dd7562SDmitry Karpeev   count      = 0;
534553dd7562SDmitry Karpeev   rowindices = NULL;
534653dd7562SDmitry Karpeev   colindices = NULL;
534748a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
534848a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
534953dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
535053dd7562SDmitry Karpeev     PetscInt row;
535153dd7562SDmitry Karpeev     row = i;
535253dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
535353dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
535453dd7562SDmitry Karpeev       PetscInt col;
535553dd7562SDmitry Karpeev       col = Baij->j[count];
535653dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
535753dd7562SDmitry Karpeev       v = Baij->a[count];
53589566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
535953dd7562SDmitry Karpeev       ++count;
536053dd7562SDmitry Karpeev     }
536153dd7562SDmitry Karpeev   }
536253dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
536353dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
536453dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
536553dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
536653dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
53673ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
536853dd7562SDmitry Karpeev }
536953dd7562SDmitry Karpeev 
537058c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep)
5371dec0b466SHong Zhang {
5372dec0b466SHong Zhang   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
5373dec0b466SHong Zhang   MatScalar  *aa = a->a;
5374dec0b466SHong Zhang   PetscInt    m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k;
5375dec0b466SHong Zhang   PetscInt   *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0;
5376dec0b466SHong Zhang 
5377dec0b466SHong Zhang   PetscFunctionBegin;
5378dec0b466SHong Zhang   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix");
5379dec0b466SHong Zhang   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
5380dec0b466SHong Zhang   for (i = 1; i <= m; i++) {
5381dec0b466SHong Zhang     /* move each nonzero entry back by the amount of zero slots (fshift) before it*/
5382dec0b466SHong Zhang     for (k = ai[i - 1]; k < ai[i]; k++) {
538358c11ad4SPierre Jolivet       if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++;
5384dec0b466SHong Zhang       else {
5385dec0b466SHong Zhang         if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1));
5386dec0b466SHong Zhang         aa[k - fshift] = aa[k];
5387dec0b466SHong Zhang         aj[k - fshift] = aj[k];
5388dec0b466SHong Zhang       }
5389dec0b466SHong Zhang     }
5390dec0b466SHong Zhang     ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration
5391dec0b466SHong Zhang     fshift_prev = fshift;
5392dec0b466SHong Zhang     /* reset ilen and imax for each row */
5393dec0b466SHong Zhang     ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1];
5394dec0b466SHong Zhang     a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0);
5395dec0b466SHong Zhang     rmax = PetscMax(rmax, ailen[i - 1]);
5396dec0b466SHong Zhang   }
5397312eded4SPierre Jolivet   if (fshift) {
5398dec0b466SHong Zhang     if (m) {
5399dec0b466SHong Zhang       ai[m] -= fshift;
5400dec0b466SHong Zhang       a->nz = ai[m];
5401dec0b466SHong Zhang     }
5402dec0b466SHong Zhang     PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz));
5403312eded4SPierre Jolivet     A->nonzerostate++;
5404dec0b466SHong Zhang     A->info.nz_unneeded += (PetscReal)fshift;
5405dec0b466SHong Zhang     a->rmax = rmax;
5406dec0b466SHong Zhang     if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A));
5407dec0b466SHong Zhang     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
5408dec0b466SHong Zhang     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
5409312eded4SPierre Jolivet   }
54103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5411dec0b466SHong Zhang }
5412dec0b466SHong Zhang 
/* List of the registered SeqAIJ subtype conversion routines: MatSeqAIJRegister() adds entries to it
   and MatSeqAIJSetType() looks a routine up in it by type name. Starts out empty. */
54134099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
54144099cc6bSBarry Smith 
54154099cc6bSBarry Smith /*@C
541611a5261eSBarry Smith   MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
54174099cc6bSBarry Smith 
5418c3339decSBarry Smith   Collective
54194099cc6bSBarry Smith 
54204099cc6bSBarry Smith   Input Parameters:
54214099cc6bSBarry Smith + mat    - the matrix object
54224099cc6bSBarry Smith - matype - matrix type
54234099cc6bSBarry Smith 
54244099cc6bSBarry Smith   Options Database Key:
54254e187271SRichard Tran Mills . -mat_seqaij_type  <method> - for example seqaijcrl
54264099cc6bSBarry Smith 
54274099cc6bSBarry Smith   Level: intermediate
54284099cc6bSBarry Smith 
5429fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`
54304099cc6bSBarry Smith @*/
5431d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5432d71ae5a4SJacob Faibussowitsch {
54334099cc6bSBarry Smith   PetscBool sametype;
54345f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
54354099cc6bSBarry Smith 
54364099cc6bSBarry Smith   PetscFunctionBegin;
54374099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
54389566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
54393ba16761SJacob Faibussowitsch   if (sametype) PetscFunctionReturn(PETSC_SUCCESS);
54404099cc6bSBarry Smith 
54419566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
54426adde796SStefano Zampini   PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
54439566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
54443ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
54454099cc6bSBarry Smith }
54464099cc6bSBarry Smith 
54474099cc6bSBarry Smith /*@C
544811a5261eSBarry Smith   MatSeqAIJRegister -  - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices
54494099cc6bSBarry Smith 
54504099cc6bSBarry Smith   Not Collective
54514099cc6bSBarry Smith 
54524099cc6bSBarry Smith   Input Parameters:
5453fe59aa6dSJacob Faibussowitsch + sname    - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
54544099cc6bSBarry Smith - function - routine to convert to subtype
54554099cc6bSBarry Smith 
54562ef1f0ffSBarry Smith   Level: advanced
54572ef1f0ffSBarry Smith 
54584099cc6bSBarry Smith   Notes:
545911a5261eSBarry Smith   `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers.
54604099cc6bSBarry Smith 
54614099cc6bSBarry Smith   Then, your matrix can be chosen with the procedural interface at runtime via the option
54624099cc6bSBarry Smith $     -mat_seqaij_type my_mat
54634099cc6bSBarry Smith 
54641cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()`
54654099cc6bSBarry Smith @*/
5466d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
5467d71ae5a4SJacob Faibussowitsch {
54684099cc6bSBarry Smith   PetscFunctionBegin;
54699566063dSJacob Faibussowitsch   PetscCall(MatInitializePackage());
54709566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
54713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
54724099cc6bSBarry Smith }
54734099cc6bSBarry Smith 
54744099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
54754099cc6bSBarry Smith 
54764099cc6bSBarry Smith /*@C
547711a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
54784099cc6bSBarry Smith 
54794099cc6bSBarry Smith   Not Collective
54804099cc6bSBarry Smith 
54814099cc6bSBarry Smith   Level: advanced
54824099cc6bSBarry Smith 
54832ef1f0ffSBarry Smith   Note:
54842ef1f0ffSBarry Smith   This registers the versions of `MATSEQAIJ` for GPUs
54852ef1f0ffSBarry Smith 
54861cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()`
54874099cc6bSBarry Smith @*/
5488d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5489d71ae5a4SJacob Faibussowitsch {
54904099cc6bSBarry Smith   PetscFunctionBegin;
54913ba16761SJacob Faibussowitsch   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS);
54924099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
54934099cc6bSBarry Smith 
54949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
54959566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
54969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
54979779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
54989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5499485f9817SRichard Tran Mills #endif
55005063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
55019566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
55025063d097SStefano Zampini #endif
5503d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
5504d5e393b6SSuyash Tandon   PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
5505d5e393b6SSuyash Tandon #endif
55065063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
55079566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
55085063d097SStefano Zampini #endif
55094099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
55109566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
55114099cc6bSBarry Smith #endif
55123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55134099cc6bSBarry Smith }
551453dd7562SDmitry Karpeev 
551553dd7562SDmitry Karpeev /*
551681824310SBarry Smith     Special version for direct calls from Fortran
551781824310SBarry Smith */
5518af0996ceSBarry Smith #include <petsc/private/fortranimpl.h>
551981824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS)
552081824310SBarry Smith   #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
552181824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
552281824310SBarry Smith   #define matsetvaluesseqaij_ matsetvaluesseqaij
552381824310SBarry Smith #endif
552481824310SBarry Smith 
552581824310SBarry Smith /* Change these macros so can be used in void function */
552698921bdaSJacob Faibussowitsch 
552798921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */
55289566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */
55299566063dSJacob Faibussowitsch #undef PetscCall
55309371c9d4SSatish Balay #define PetscCall(...) \
55319371c9d4SSatish Balay   do { \
55325f80ce2aSJacob Faibussowitsch     PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \
553398921bdaSJacob Faibussowitsch     if (PetscUnlikely(ierr_msv_mpiaij)) { \
553498921bdaSJacob Faibussowitsch       *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \
553598921bdaSJacob Faibussowitsch       return; \
553698921bdaSJacob Faibussowitsch     } \
553798921bdaSJacob Faibussowitsch   } while (0)
553898921bdaSJacob Faibussowitsch 
553998921bdaSJacob Faibussowitsch #undef SETERRQ
55409371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \
55419371c9d4SSatish Balay   do { \
554298921bdaSJacob Faibussowitsch     *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
554398921bdaSJacob Faibussowitsch     return; \
554498921bdaSJacob Faibussowitsch   } while (0)
554581824310SBarry Smith 
5546d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5547d71ae5a4SJacob Faibussowitsch {
554881824310SBarry Smith   Mat         A = *AA;
554981824310SBarry Smith   PetscInt    m = *mm, n = *nn;
555081824310SBarry Smith   InsertMode  is = *isis;
555181824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
555281824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
555381824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
555481824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
555554f21887SBarry Smith   MatScalar  *ap, value, *aa;
5556ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5557ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
555881824310SBarry Smith 
555981824310SBarry Smith   PetscFunctionBegin;
55604994cf47SJed Brown   MatCheckPreallocated(A, 1);
556181824310SBarry Smith   imax  = a->imax;
556281824310SBarry Smith   ai    = a->i;
556381824310SBarry Smith   ailen = a->ilen;
556481824310SBarry Smith   aj    = a->j;
556581824310SBarry Smith   aa    = a->a;
556681824310SBarry Smith 
556781824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
556881824310SBarry Smith     row = im[k];
556981824310SBarry Smith     if (row < 0) continue;
55705f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
55719371c9d4SSatish Balay     rp   = aj + ai[row];
55729371c9d4SSatish Balay     ap   = aa + ai[row];
55739371c9d4SSatish Balay     rmax = imax[row];
55749371c9d4SSatish Balay     nrow = ailen[row];
557581824310SBarry Smith     low  = 0;
557681824310SBarry Smith     high = nrow;
557781824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
557881824310SBarry Smith       if (in[l] < 0) continue;
55795f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
558081824310SBarry Smith       col = in[l];
55812205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
55822205254eSKarl Rupp       else value = v[k + l * m];
55832205254eSKarl Rupp 
558481824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
558581824310SBarry Smith 
55862205254eSKarl Rupp       if (col <= lastcol) low = 0;
55872205254eSKarl Rupp       else high = nrow;
558881824310SBarry Smith       lastcol = col;
558981824310SBarry Smith       while (high - low > 5) {
559081824310SBarry Smith         t = (low + high) / 2;
559181824310SBarry Smith         if (rp[t] > col) high = t;
559281824310SBarry Smith         else low = t;
559381824310SBarry Smith       }
559481824310SBarry Smith       for (i = low; i < high; i++) {
559581824310SBarry Smith         if (rp[i] > col) break;
559681824310SBarry Smith         if (rp[i] == col) {
559781824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
559881824310SBarry Smith           else ap[i] = value;
559981824310SBarry Smith           goto noinsert;
560081824310SBarry Smith         }
560181824310SBarry Smith       }
560281824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
560381824310SBarry Smith       if (nonew == 1) goto noinsert;
56045f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5605fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
56069371c9d4SSatish Balay       N = nrow++ - 1;
56079371c9d4SSatish Balay       a->nz++;
56089371c9d4SSatish Balay       high++;
560981824310SBarry Smith       /* shift up all the later entries in this row */
561081824310SBarry Smith       for (ii = N; ii >= i; ii--) {
561181824310SBarry Smith         rp[ii + 1] = rp[ii];
561281824310SBarry Smith         ap[ii + 1] = ap[ii];
561381824310SBarry Smith       }
561481824310SBarry Smith       rp[i] = col;
561581824310SBarry Smith       ap[i] = value;
5616e56f5c9eSBarry Smith       A->nonzerostate++;
561781824310SBarry Smith     noinsert:;
561881824310SBarry Smith       low = i + 1;
561981824310SBarry Smith     }
562081824310SBarry Smith     ailen[row] = nrow;
562181824310SBarry Smith   }
562281824310SBarry Smith   PetscFunctionReturnVoid();
562381824310SBarry Smith }
562498921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No
562598921bdaSJacob Faibussowitsch  * other PETSc functions should be defined past this point, as it is impossible to recover the
562698921bdaSJacob Faibussowitsch  * original definitions */
56279566063dSJacob Faibussowitsch #undef PetscCall
562898921bdaSJacob Faibussowitsch #undef SETERRQ
5629