xref: /petsc/src/mat/impls/aij/seq/aij.c (revision 9f0612e409f6220a780be6348417bea34ef34962)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
1226cec326SBarry Smith #define TYPE AIJ
1326cec326SBarry Smith #define TYPE_BS
1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
1626cec326SBarry Smith #undef TYPE
1726cec326SBarry Smith #undef TYPE_BS
1826cec326SBarry Smith 
19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
20d71ae5a4SJacob Faibussowitsch {
214099cc6bSBarry Smith   PetscBool flg;
224099cc6bSBarry Smith   char      type[256];
234099cc6bSBarry Smith 
244099cc6bSBarry Smith   PetscFunctionBegin;
25d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
269566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
279566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
28d0609cedSBarry Smith   PetscOptionsEnd();
293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
304099cc6bSBarry Smith }
314099cc6bSBarry Smith 
32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
33d71ae5a4SJacob Faibussowitsch {
340716a85fSBarry Smith   PetscInt    i, m, n;
350716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
360716a85fSBarry Smith 
370716a85fSBarry Smith   PetscFunctionBegin;
389566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
399566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
400716a85fSBarry Smith   if (type == NORM_2) {
41ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
420716a85fSBarry Smith   } else if (type == NORM_1) {
43ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
440716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
45ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
46857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
47ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
48857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
49ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
506adde796SStefano Zampini   } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type");
510716a85fSBarry Smith 
520716a85fSBarry Smith   if (type == NORM_2) {
53a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
54857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
55a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
560716a85fSBarry Smith   }
573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
580716a85fSBarry Smith }
590716a85fSBarry Smith 
60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
61d71ae5a4SJacob Faibussowitsch {
623a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
633a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
643a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
653a062f41SBarry Smith   PetscInt       *rows;
663a062f41SBarry Smith 
673a062f41SBarry Smith   PetscFunctionBegin;
683a062f41SBarry Smith   for (i = 0; i < m; i++) {
69ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
703a062f41SBarry Smith   }
719566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
723a062f41SBarry Smith   cnt = 0;
733a062f41SBarry Smith   for (i = 0; i < m; i++) {
743a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
753a062f41SBarry Smith       rows[cnt] = i;
763a062f41SBarry Smith       cnt++;
773a062f41SBarry Smith     }
783a062f41SBarry Smith   }
799566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
813a062f41SBarry Smith }
823a062f41SBarry Smith 
83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
84d71ae5a4SJacob Faibussowitsch {
856ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
86fff043a9SJunchao Zhang   const MatScalar *aa;
876ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
88b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
896ce1633cSBarry Smith   PetscInt        *rows;
906ce1633cSBarry Smith 
916ce1633cSBarry Smith   PetscFunctionBegin;
929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
939566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
946ce1633cSBarry Smith   diag = a->diag;
956ce1633cSBarry Smith   for (i = 0; i < m; i++) {
96ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
976ce1633cSBarry Smith   }
989566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
996ce1633cSBarry Smith   cnt = 0;
1006ce1633cSBarry Smith   for (i = 0; i < m; i++) {
101ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
1026ce1633cSBarry Smith   }
103f1f41ecbSJed Brown   *nrows = cnt;
104f1f41ecbSJed Brown   *zrows = rows;
1059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
107f1f41ecbSJed Brown }
108f1f41ecbSJed Brown 
109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
110d71ae5a4SJacob Faibussowitsch {
111f1f41ecbSJed Brown   PetscInt nrows, *rows;
112f1f41ecbSJed Brown 
113f1f41ecbSJed Brown   PetscFunctionBegin;
1140298fd71SBarry Smith   *zrows = NULL;
1159566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1169566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1186ce1633cSBarry Smith }
1196ce1633cSBarry Smith 
120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
121d71ae5a4SJacob Faibussowitsch {
122b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
123b3a44c85SBarry Smith   const MatScalar *aa;
124b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
125b3a44c85SBarry Smith   const PetscInt  *ii;
126b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
127b3a44c85SBarry Smith 
128b3a44c85SBarry Smith   PetscFunctionBegin;
1299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
130f4259b30SLisandro Dalcin   *keptrows = NULL;
131b3a44c85SBarry Smith   ii        = a->i;
132b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
133b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
134b3a44c85SBarry Smith     if (!n) {
135b3a44c85SBarry Smith       cnt++;
136b3a44c85SBarry Smith       goto ok1;
137b3a44c85SBarry Smith     }
1382e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
139b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
140b3a44c85SBarry Smith     }
141b3a44c85SBarry Smith     cnt++;
142b3a44c85SBarry Smith   ok1:;
143b3a44c85SBarry Smith   }
1442e5835c6SStefano Zampini   if (!cnt) {
1459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1463ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1472e5835c6SStefano Zampini   }
1489566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
149b3a44c85SBarry Smith   cnt = 0;
150b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
151b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
152b3a44c85SBarry Smith     if (!n) continue;
1532e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
154b3a44c85SBarry Smith       if (aa[j] != 0.0) {
155b3a44c85SBarry Smith         rows[cnt++] = i;
156b3a44c85SBarry Smith         break;
157b3a44c85SBarry Smith       }
158b3a44c85SBarry Smith     }
159b3a44c85SBarry Smith   }
1609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1619566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
1623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
163b3a44c85SBarry Smith }
164b3a44c85SBarry Smith 
165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
166d71ae5a4SJacob Faibussowitsch {
16779299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)Y->data;
16899e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16999e65526SBarry Smith   const PetscInt    *diag;
1702e5835c6SStefano Zampini   MatScalar         *aa;
17199e65526SBarry Smith   const PetscScalar *v;
172ace3abfcSBarry Smith   PetscBool          missing;
17379299369SBarry Smith 
17479299369SBarry Smith   PetscFunctionBegin;
17509f38230SBarry Smith   if (Y->assembled) {
1769566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL));
17709f38230SBarry Smith     if (!missing) {
17879299369SBarry Smith       diag = aij->diag;
1799566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1809566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
18179299369SBarry Smith       if (is == INSERT_VALUES) {
182ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
18379299369SBarry Smith       } else {
184ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
18579299369SBarry Smith       }
1869566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1879566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
1883ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
18979299369SBarry Smith     }
1909566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
19109f38230SBarry Smith   }
1929566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
1933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
19409f38230SBarry Smith }
19579299369SBarry Smith 
196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
197d71ae5a4SJacob Faibussowitsch {
198416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19997f1f81fSBarry Smith   PetscInt    i, ishift;
20017ab2063SBarry Smith 
2013a40ed3dSBarry Smith   PetscFunctionBegin;
202f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
2033ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
204bfeeae90SHong Zhang   ishift = 0;
205b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
2069566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
207bfeeae90SHong Zhang   } else if (oshift == 1) {
2081a83f524SJed Brown     PetscInt *tia;
209d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2103b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2119566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2121a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2131a83f524SJed Brown     *ia = tia;
214ecc77c7aSBarry Smith     if (ja) {
2151a83f524SJed Brown       PetscInt *tja;
2169566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2171a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2181a83f524SJed Brown       *ja = tja;
219ecc77c7aSBarry Smith     }
2206945ee14SBarry Smith   } else {
221ecc77c7aSBarry Smith     *ia = a->i;
222ecc77c7aSBarry Smith     if (ja) *ja = a->j;
223a2ce50c7SBarry Smith   }
2243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225a2744918SBarry Smith }
226a2744918SBarry Smith 
227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
228d71ae5a4SJacob Faibussowitsch {
2293a40ed3dSBarry Smith   PetscFunctionBegin;
2303ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
231b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2329566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2339566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
234bcd2baecSBarry Smith   }
2353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23617ab2063SBarry Smith }
23717ab2063SBarry Smith 
238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
239d71ae5a4SJacob Faibussowitsch {
2403b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
241d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
24297f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2433b2fbd54SBarry Smith 
2443a40ed3dSBarry Smith   PetscFunctionBegin;
245899cda47SBarry Smith   *nn = n;
2463ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2473b2fbd54SBarry Smith   if (symmetric) {
2489566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2493b2fbd54SBarry Smith   } else {
2509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2533b2fbd54SBarry Smith     jj = a->j;
254ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2553b2fbd54SBarry Smith     cia[0] = oshift;
256ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2579566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2583b2fbd54SBarry Smith     jj = a->j;
259a93ec695SBarry Smith     for (row = 0; row < m; row++) {
260a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
261a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
262bfeeae90SHong Zhang         col = *jj++;
2632205254eSKarl Rupp 
2643b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2653b2fbd54SBarry Smith       }
2663b2fbd54SBarry Smith     }
2679566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2689371c9d4SSatish Balay     *ia = cia;
2699371c9d4SSatish Balay     *ja = cja;
2703b2fbd54SBarry Smith   }
2713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2723b2fbd54SBarry Smith }
2733b2fbd54SBarry Smith 
274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
275d71ae5a4SJacob Faibussowitsch {
2763a40ed3dSBarry Smith   PetscFunctionBegin;
2773ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2783b2fbd54SBarry Smith 
2799566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2809566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2823b2fbd54SBarry Smith }
2833b2fbd54SBarry Smith 
2847cee066cSHong Zhang /*
2857cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2867cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
287040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2887cee066cSHong Zhang */
289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
290d71ae5a4SJacob Faibussowitsch {
2917cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2927cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
293071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2947cee066cSHong Zhang   PetscInt       *cspidx;
295071fcb05SBarry Smith   const PetscInt *jj;
2967cee066cSHong Zhang 
2977cee066cSHong Zhang   PetscFunctionBegin;
2987cee066cSHong Zhang   *nn = n;
2993ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
300625f6d37SHong Zhang 
3019566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
3029566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
3039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
3049566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
3057cee066cSHong Zhang   jj = a->j;
306ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
3077cee066cSHong Zhang   cia[0] = oshift;
308ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3099566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3107cee066cSHong Zhang   jj = a->j;
3117cee066cSHong Zhang   for (row = 0; row < m; row++) {
3127cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3137cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3147cee066cSHong Zhang       col         = *jj++;
315071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
316071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
317071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3187cee066cSHong Zhang     }
3197cee066cSHong Zhang   }
3209566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
321071fcb05SBarry Smith   *ia    = cia;
322071fcb05SBarry Smith   *ja    = cja;
3237cee066cSHong Zhang   *spidx = cspidx;
3243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3257cee066cSHong Zhang }
3267cee066cSHong Zhang 
327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
328d71ae5a4SJacob Faibussowitsch {
3297cee066cSHong Zhang   PetscFunctionBegin;
3309566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3319566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3337cee066cSHong Zhang }
3347cee066cSHong Zhang 
335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
336d71ae5a4SJacob Faibussowitsch {
33787d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33887d4246cSBarry Smith   PetscInt    *ai = a->i;
339fff043a9SJunchao Zhang   PetscScalar *aa;
34087d4246cSBarry Smith 
34187d4246cSBarry Smith   PetscFunctionBegin;
3429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3439566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34687d4246cSBarry Smith }
34787d4246cSBarry Smith 
348bd04181cSBarry Smith /*
349bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
350bd04181cSBarry Smith 
351bd04181cSBarry Smith       -   a single row of values is set with each call
352bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
353bd04181cSBarry Smith       -   the values are always added to the matrix, not set
354bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
355bd04181cSBarry Smith 
3561f763a69SBarry Smith      This does NOT assume the global column indices are sorted
357bd04181cSBarry Smith 
3581f763a69SBarry Smith */
359bd04181cSBarry Smith 
360af0996ceSBarry Smith #include <petsc/private/isimpl.h>
361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
362d71ae5a4SJacob Faibussowitsch {
363189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3641f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3651f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3661f763a69SBarry Smith   PetscInt        lastcol = -1;
367fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
368189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
369189e4007SBarry Smith 
370fff043a9SJunchao Zhang   PetscFunctionBegin;
3719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
372f38dd0b8SBarry Smith   row  = ridx[im[0]];
3731f763a69SBarry Smith   rp   = aj + ai[row];
3741f763a69SBarry Smith   ap   = aa + ai[row];
3751f763a69SBarry Smith   nrow = ailen[row];
376189e4007SBarry Smith   low  = 0;
377189e4007SBarry Smith   high = nrow;
378189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
379189e4007SBarry Smith     col   = cidx[in[l]];
380f38dd0b8SBarry Smith     value = v[l];
381189e4007SBarry Smith 
382189e4007SBarry Smith     if (col <= lastcol) low = 0;
383189e4007SBarry Smith     else high = nrow;
384189e4007SBarry Smith     lastcol = col;
385189e4007SBarry Smith     while (high - low > 5) {
386189e4007SBarry Smith       t = (low + high) / 2;
387189e4007SBarry Smith       if (rp[t] > col) high = t;
388189e4007SBarry Smith       else low = t;
389189e4007SBarry Smith     }
390189e4007SBarry Smith     for (i = low; i < high; i++) {
391189e4007SBarry Smith       if (rp[i] == col) {
3921f763a69SBarry Smith         ap[i] += value;
393189e4007SBarry Smith         low = i + 1;
3941f763a69SBarry Smith         break;
395189e4007SBarry Smith       }
396189e4007SBarry Smith     }
397189e4007SBarry Smith   }
3989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3993ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
400189e4007SBarry Smith }
401189e4007SBarry Smith 
402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
403d71ae5a4SJacob Faibussowitsch {
404416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
405e2ee6c50SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
40697f1f81fSBarry Smith   PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
407e2ee6c50SBarry Smith   PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1;
408ce496241SStefano Zampini   MatScalar  *ap = NULL, value = 0.0, *aa;
409ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
410ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
41117ab2063SBarry Smith 
4123a40ed3dSBarry Smith   PetscFunctionBegin;
4139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
41417ab2063SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
415416022c9SBarry Smith     row = im[k];
4165ef9f2a5SBarry Smith     if (row < 0) continue;
4176bdcaf15SBarry Smith     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
4188e3a54c0SPierre Jolivet     rp = PetscSafePointerPlusOffset(aj, ai[row]);
4198e3a54c0SPierre Jolivet     if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]);
4209371c9d4SSatish Balay     rmax = imax[row];
4219371c9d4SSatish Balay     nrow = ailen[row];
422416022c9SBarry Smith     low  = 0;
423c71e6ed7SBarry Smith     high = nrow;
42417ab2063SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
4255ef9f2a5SBarry Smith       if (in[l] < 0) continue;
4266bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
427bfeeae90SHong Zhang       col = in[l];
428071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
429071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
43036db0b34SBarry Smith 
4312205254eSKarl Rupp       if (col <= lastcol) low = 0;
4322205254eSKarl Rupp       else high = nrow;
433e2ee6c50SBarry Smith       lastcol = col;
434416022c9SBarry Smith       while (high - low > 5) {
435416022c9SBarry Smith         t = (low + high) / 2;
436416022c9SBarry Smith         if (rp[t] > col) high = t;
437416022c9SBarry Smith         else low = t;
43817ab2063SBarry Smith       }
439416022c9SBarry Smith       for (i = low; i < high; i++) {
44017ab2063SBarry Smith         if (rp[i] > col) break;
44117ab2063SBarry Smith         if (rp[i] == col) {
442876c6284SHong Zhang           if (!A->structure_only) {
4430c0d7e18SFande Kong             if (is == ADD_VALUES) {
4440c0d7e18SFande Kong               ap[i] += value;
4450c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4469371c9d4SSatish Balay             } else ap[i] = value;
447720833daSHong Zhang           }
448e44c0bd4SBarry Smith           low = i + 1;
44917ab2063SBarry Smith           goto noinsert;
45017ab2063SBarry Smith         }
45117ab2063SBarry Smith       }
452dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
453c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
45408401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
455720833daSHong Zhang       if (A->structure_only) {
456876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
457720833daSHong Zhang       } else {
458fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
459720833daSHong Zhang       }
4609371c9d4SSatish Balay       N = nrow++ - 1;
4619371c9d4SSatish Balay       a->nz++;
4629371c9d4SSatish Balay       high++;
463416022c9SBarry Smith       /* shift up all the later entries in this row */
4649566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
46517ab2063SBarry Smith       rp[i] = col;
466580bdb30SBarry Smith       if (!A->structure_only) {
4679566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
468580bdb30SBarry Smith         ap[i] = value;
469580bdb30SBarry Smith       }
470416022c9SBarry Smith       low = i + 1;
471e44c0bd4SBarry Smith     noinsert:;
47217ab2063SBarry Smith     }
47317ab2063SBarry Smith     ailen[row] = nrow;
47417ab2063SBarry Smith   }
4759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
4763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
47717ab2063SBarry Smith }
47817ab2063SBarry Smith 
479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
480d71ae5a4SJacob Faibussowitsch {
48119b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
48219b08ed1SBarry Smith   PetscInt   *rp, k, row;
48319b08ed1SBarry Smith   PetscInt   *ai = a->i;
48419b08ed1SBarry Smith   PetscInt   *aj = a->j;
485fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
48619b08ed1SBarry Smith 
48719b08ed1SBarry Smith   PetscFunctionBegin;
48828b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
48908401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
490fff043a9SJunchao Zhang 
4919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
49219b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
49319b08ed1SBarry Smith     row = im[k];
49419b08ed1SBarry Smith     rp  = aj + ai[row];
4958e3a54c0SPierre Jolivet     ap  = PetscSafePointerPlusOffset(aa, ai[row]);
49619b08ed1SBarry Smith 
4979566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
49819b08ed1SBarry Smith     if (!A->structure_only) {
49919b08ed1SBarry Smith       if (v) {
5009566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
50119b08ed1SBarry Smith         v += n;
50219b08ed1SBarry Smith       } else {
5039566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
50419b08ed1SBarry Smith       }
50519b08ed1SBarry Smith     }
50619b08ed1SBarry Smith     a->ilen[row]  = n;
50719b08ed1SBarry Smith     a->imax[row]  = n;
50819b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
50919b08ed1SBarry Smith     a->nz += n;
51019b08ed1SBarry Smith   }
5119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51319b08ed1SBarry Smith }
51419b08ed1SBarry Smith 
51519b08ed1SBarry Smith /*@
51619b08ed1SBarry Smith   MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51719b08ed1SBarry Smith 
51819b08ed1SBarry Smith   Input Parameters:
51911a5261eSBarry Smith + A       - the `MATSEQAIJ` matrix
52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros
52119b08ed1SBarry Smith 
52219b08ed1SBarry Smith   Level: advanced
52319b08ed1SBarry Smith 
52419b08ed1SBarry Smith   Notes:
52519b08ed1SBarry Smith   This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
52611a5261eSBarry Smith   Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52719b08ed1SBarry Smith   as always with multiple matrix assemblies.
52819b08ed1SBarry Smith 
5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
53019b08ed1SBarry Smith @*/
531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
532d71ae5a4SJacob Faibussowitsch {
53319b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
53419b08ed1SBarry Smith 
53519b08ed1SBarry Smith   PetscFunctionBegin;
5369566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5379566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
53819b08ed1SBarry Smith   a->maxnz = nztotal;
5394dfa11a4SJacob Faibussowitsch   if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); }
54019b08ed1SBarry Smith   if (!a->ilen) {
5419566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
54219b08ed1SBarry Smith   } else {
5439566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
54419b08ed1SBarry Smith   }
54519b08ed1SBarry Smith 
54619b08ed1SBarry Smith   /* allocate the matrix space */
547*9f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i));
548*9f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j));
549*9f0612e4SBarry Smith   a->free_ij = PETSC_TRUE;
55019b08ed1SBarry Smith   if (A->structure_only) {
55119b08ed1SBarry Smith     a->free_a = PETSC_FALSE;
55219b08ed1SBarry Smith   } else {
553*9f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a));
55419b08ed1SBarry Smith     a->free_a = PETSC_TRUE;
55519b08ed1SBarry Smith   }
556*9f0612e4SBarry Smith   a->i[0]           = 0;
55719b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
55819b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
5593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
56019b08ed1SBarry Smith }
56119b08ed1SBarry Smith 
562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
563d71ae5a4SJacob Faibussowitsch {
564071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
565071fcb05SBarry Smith   PetscInt   *rp, k, row;
566071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
567071fcb05SBarry Smith   PetscInt   *aj = a->j;
568fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
569071fcb05SBarry Smith 
570071fcb05SBarry Smith   PetscFunctionBegin;
5719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
572071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
573071fcb05SBarry Smith     row = im[k];
5746bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
575071fcb05SBarry Smith     rp = aj + ai[row];
576071fcb05SBarry Smith     ap = aa + ai[row];
57748a46eb9SPierre Jolivet     if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
578071fcb05SBarry Smith     if (!A->structure_only) {
579071fcb05SBarry Smith       if (v) {
5809566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
581071fcb05SBarry Smith         v += n;
582071fcb05SBarry Smith       } else {
5839566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
584071fcb05SBarry Smith       }
585071fcb05SBarry Smith     }
586071fcb05SBarry Smith     ailen[row] = n;
587071fcb05SBarry Smith     a->nz += n;
588071fcb05SBarry Smith   }
5899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
591071fcb05SBarry Smith }
592071fcb05SBarry Smith 
593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
594d71ae5a4SJacob Faibussowitsch {
5957eb43aa7SLois Curfman McInnes   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
59697f1f81fSBarry Smith   PetscInt        *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
59797f1f81fSBarry Smith   PetscInt        *ai = a->i, *ailen = a->ilen;
5984e208921SJed Brown   const MatScalar *ap, *aa;
5997eb43aa7SLois Curfman McInnes 
6003a40ed3dSBarry Smith   PetscFunctionBegin;
6014e208921SJed Brown   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
6027eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6037eb43aa7SLois Curfman McInnes     row = im[k];
6049371c9d4SSatish Balay     if (row < 0) {
6059371c9d4SSatish Balay       v += n;
6069371c9d4SSatish Balay       continue;
6079371c9d4SSatish Balay     } /* negative row */
60854c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6098e3a54c0SPierre Jolivet     rp   = PetscSafePointerPlusOffset(aj, ai[row]);
6108e3a54c0SPierre Jolivet     ap   = PetscSafePointerPlusOffset(aa, ai[row]);
6117eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6127eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6139371c9d4SSatish Balay       if (in[l] < 0) {
6149371c9d4SSatish Balay         v++;
6159371c9d4SSatish Balay         continue;
6169371c9d4SSatish Balay       } /* negative column */
61754c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
618bfeeae90SHong Zhang       col  = in[l];
6199371c9d4SSatish Balay       high = nrow;
6209371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6217eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6227eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6237eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6247eb43aa7SLois Curfman McInnes         else low = t;
6257eb43aa7SLois Curfman McInnes       }
6267eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6277eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6287eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
629b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6307eb43aa7SLois Curfman McInnes           goto finished;
6317eb43aa7SLois Curfman McInnes         }
6327eb43aa7SLois Curfman McInnes       }
63397e567efSBarry Smith       *v++ = 0.0;
6347eb43aa7SLois Curfman McInnes     finished:;
6357eb43aa7SLois Curfman McInnes     }
6367eb43aa7SLois Curfman McInnes   }
6374e208921SJed Brown   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
6383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6397eb43aa7SLois Curfman McInnes }
6407eb43aa7SLois Curfman McInnes 
641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
642d71ae5a4SJacob Faibussowitsch {
6433ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
644c898d852SStefano Zampini   const PetscScalar *av;
6453ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6463ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
64717ab2063SBarry Smith 
6483a40ed3dSBarry Smith   PetscFunctionBegin;
6499566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6502205254eSKarl Rupp 
6513ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6523ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6533ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6543ea6fe3dSLisandro Dalcin   nz = A->nz;
655416022c9SBarry Smith 
6563ea6fe3dSLisandro Dalcin   /* write matrix header */
6573ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6589371c9d4SSatish Balay   header[1] = M;
6599371c9d4SSatish Balay   header[2] = N;
6609371c9d4SSatish Balay   header[3] = nz;
6619566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
662416022c9SBarry Smith 
6633ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6649566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6653ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
6669566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6679566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6683ea6fe3dSLisandro Dalcin   /* store column indices */
6699566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
670416022c9SBarry Smith   /* store nonzero values */
6719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6729566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6739566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
674b37d52dbSMark F. Adams 
6753ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6769566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
67817ab2063SBarry Smith }
679416022c9SBarry Smith 
680d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
681d71ae5a4SJacob Faibussowitsch {
6827dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6837dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6847dc0baabSHong Zhang 
6857dc0baabSHong Zhang   PetscFunctionBegin;
6869566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6877dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6889566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
68948a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6909566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6917dc0baabSHong Zhang   }
6929566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
6933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6947dc0baabSHong Zhang }
6957dc0baabSHong Zhang 
/* Prototype only: the definition of this routine is not part of the code shown here */
69609573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer);
697cd155464SBarry Smith 
/*
  MatView_SeqAIJ_ASCII - Prints the matrix to an ASCII viewer in the format currently set on the viewer

  A structure-only matrix is handed to MatView_SeqAIJ_ASCII_structonly(). Nothing is printed for the formats
  PETSC_VIEWER_ASCII_FACTOR_INFO, PETSC_VIEWER_ASCII_INFO and PETSC_VIEWER_ASCII_INFO_DETAIL. The formats MATLAB,
  COMMON, SYMMODU, DENSE and MATRIXMARKET each have their own branch; every other format prints one line per row
  holding (column, value) pairs. Tabbing of the viewer is switched off while a branch prints and restored afterwards.
*/
698ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
699d71ae5a4SJacob Faibussowitsch {
700416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
701c898d852SStefano Zampini   const PetscScalar *av;
70260e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
703e060cb09SBarry Smith   const char        *name;
704f3ef73ceSBarry Smith   PetscViewerFormat  format;
70517ab2063SBarry Smith 
7063a40ed3dSBarry Smith   PetscFunctionBegin;
7077dc0baabSHong Zhang   if (A->structure_only) {
7089566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7093ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
7107dc0baabSHong Zhang   }
71143e49210SHong Zhang 
7129566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
  /* these formats produce no output from this routine */
7133ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
7142e5835c6SStefano Zampini 
715c898d852SStefano Zampini   /* trigger copy to CPU if needed */
  /* av itself is not used afterwards; the values are read through a->a below */
7169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7179566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
71871c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
    /* MATLAB: a list of (row, column, value) triplets with indices shifted by one, passed to spconvert() */
71997f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
    /* true when the last row is empty or the last stored column index is not the last column */
72060e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
721c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
722d00d2cf4SBarry Smith       nofinalvalue = 1;
723d00d2cf4SBarry Smith     }
7249566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7259566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7269566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
727fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7289566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
729fbfe6fa7SJed Brown #else
7309566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
731fbfe6fa7SJed Brown #endif
7329566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
73317ab2063SBarry Smith 
73417ab2063SBarry Smith     for (i = 0; i < m; i++) {
73560e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
736aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7379566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
73817ab2063SBarry Smith #else
7399566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
74017ab2063SBarry Smith #endif
74117ab2063SBarry Smith       }
74217ab2063SBarry Smith     }
743d00d2cf4SBarry Smith     if (nofinalvalue) {
      /* explicit zero at position (m, number of columns) */
744c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7459566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
746c337ccceSJed Brown #else
7479566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
748c337ccceSJed Brown #endif
749d00d2cf4SBarry Smith     }
7509566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7519566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7529566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
753fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
    /* COMMON: one line per row, stored entries that are zero are left out */
    /* NOTE(review): in complex builds every branch below requires a nonzero real part, so an entry with zero real part and nonzero imaginary part is not printed; confirm this is intended */
7549566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
75544cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7569566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
75760e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
758aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
75936db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7609566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76136db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7629566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
76336db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7649566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7656831982aSBarry Smith         }
76644cd7ae7SLois Curfman McInnes #else
7679566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
76844cd7ae7SLois Curfman McInnes #endif
76944cd7ae7SLois Curfman McInnes       }
7709566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77144cd7ae7SLois Curfman McInnes     }
7729566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
773fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
    /* SYMMODU: only entries with column >= row are written; first the row pointers, then the column indices, then the values */
77497f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7759566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7769566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
    /* sptr[i] is one plus the number of nonzero entries with column >= row counted in the rows before row i */
777496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
778496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
77960e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
780496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
781aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78236db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
783496be53dSLois Curfman McInnes #else
784496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
785496be53dSLois Curfman McInnes #endif
786496be53dSLois Curfman McInnes         }
787496be53dSLois Curfman McInnes       }
788496be53dSLois Curfman McInnes     }
7892e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7909566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
    /* print the m + 1 row pointers, at most six per line; the branches handle the shorter final line */
7912e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7922205254eSKarl Rupp       if (i + 4 < m) {
7939566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
7942205254eSKarl Rupp       } else if (i + 3 < m) {
7959566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
7962205254eSKarl Rupp       } else if (i + 2 < m) {
7979566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
7982205254eSKarl Rupp       } else if (i + 1 < m) {
7999566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
8002205254eSKarl Rupp       } else if (i < m) {
8019566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8022205254eSKarl Rupp       } else {
8039566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8042205254eSKarl Rupp       }
805496be53dSLois Curfman McInnes     }
8069566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8079566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
    /* column indices of the entries with column >= row, shifted by fshift */
    /* NOTE(review): unlike the counting loop above, this loop does not skip stored zeros; confirm the index list is meant to include them */
808496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
80960e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8109566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
811496be53dSLois Curfman McInnes       }
8129566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
813496be53dSLois Curfman McInnes     }
8149566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
    /* nonzero values of the entries with column >= row */
815496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
817496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
818aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
81948a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
820496be53dSLois Curfman McInnes #else
8219566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
822496be53dSLois Curfman McInnes #endif
823496be53dSLois Curfman McInnes         }
824496be53dSLois Curfman McInnes       }
8259566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
826496be53dSLois Curfman McInnes     }
8279566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
828fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
    /* DENSE: every location of every row is printed, with 0.0 for locations that are not stored */
    /* cnt walks through all stored entries in order, jcnt counts the entries already used in the current row */
82997f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
83087828ca2SBarry Smith     PetscScalar value;
83168f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83268f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
83368f1ed48SBarry Smith 
    /* the imaginary parts are only printed when at least one stored entry has a nonzero imaginary part */
83468f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
83568f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
83668f1ed48SBarry Smith         realonly = PETSC_FALSE;
83768f1ed48SBarry Smith         break;
83868f1ed48SBarry Smith       }
83968f1ed48SBarry Smith     }
84068f1ed48SBarry Smith #endif
84102594712SBarry Smith 
8429566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
84302594712SBarry Smith     for (i = 0; i < m; i++) {
84402594712SBarry Smith       jcnt = 0;
845d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
        /* NOTE(review): matching j against a->j[cnt] presumably relies on the column indices of each row being sorted in increasing order; confirm */
846e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
84702594712SBarry Smith           value = a->a[cnt++];
848e24b481bSBarry Smith           jcnt++;
84902594712SBarry Smith         } else {
85002594712SBarry Smith           value = 0.0;
85102594712SBarry Smith         }
852aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
85368f1ed48SBarry Smith         if (realonly) {
8549566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
85568f1ed48SBarry Smith         } else {
8569566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
85768f1ed48SBarry Smith         }
85802594712SBarry Smith #else
8599566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
86002594712SBarry Smith #endif
86102594712SBarry Smith       }
8629566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
86302594712SBarry Smith     }
8649566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8653c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
    /* MATRIXMARKET: banner line, a size line (rows, columns, nonzeros), then one line per stored entry with indices shifted by fshift */
866150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8679566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8683c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8699566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8703c215bfdSMatthew Knepley #else
8719566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8723c215bfdSMatthew Knepley #endif
8739566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8743c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
87560e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8763c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8779566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8783c215bfdSMatthew Knepley #else
8799566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8803c215bfdSMatthew Knepley #endif
8813c215bfdSMatthew Knepley       }
8823c215bfdSMatthew Knepley     }
8839566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8843a40ed3dSBarry Smith   } else {
    /* every other format: one line per row with (column, value) pairs, stored zeros included */
8859566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
886d5f3da31SBarry Smith     if (A->factortype) {
      /* factored matrix: each row is printed as its L part, then the diagonal, then its U part */
88716cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8889566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
88916cd7e1dSShri Abhyankar         /* L part */
89060e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89116cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
89216cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
8939566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
89416cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
8959566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
89616cd7e1dSShri Abhyankar           } else {
8979566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
89816cd7e1dSShri Abhyankar           }
89916cd7e1dSShri Abhyankar #else
9009566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90116cd7e1dSShri Abhyankar #endif
90216cd7e1dSShri Abhyankar         }
90316cd7e1dSShri Abhyankar         /* diagonal */
        /* the reciprocal of the stored value is printed; presumably the factorization stores the inverted diagonal -- TODO confirm */
90416cd7e1dSShri Abhyankar         j = a->diag[i];
90516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
90616cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
9079566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j])));
90816cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9099566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j]))));
91016cd7e1dSShri Abhyankar         } else {
9119566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j])));
91216cd7e1dSShri Abhyankar         }
91316cd7e1dSShri Abhyankar #else
9149566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j])));
91516cd7e1dSShri Abhyankar #endif
91616cd7e1dSShri Abhyankar 
91716cd7e1dSShri Abhyankar         /* U part */
        /* the U entries of row i lie strictly between a->diag[i + 1] and a->diag[i] */
91860e0710aSBarry Smith         for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
91916cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
92016cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9219566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
92216cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9239566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
92416cd7e1dSShri Abhyankar           } else {
9259566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
92616cd7e1dSShri Abhyankar           }
92716cd7e1dSShri Abhyankar #else
9289566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
92916cd7e1dSShri Abhyankar #endif
93016cd7e1dSShri Abhyankar         }
9319566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
93216cd7e1dSShri Abhyankar       }
93316cd7e1dSShri Abhyankar     } else {
      /* unfactored matrix: print every stored entry of every row */
93417ab2063SBarry Smith       for (i = 0; i < m; i++) {
9359566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
93660e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
937aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
93836db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9399566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
94036db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9419566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9423a40ed3dSBarry Smith           } else {
9439566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
94417ab2063SBarry Smith           }
94517ab2063SBarry Smith #else
9469566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
94717ab2063SBarry Smith #endif
94817ab2063SBarry Smith         }
9499566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
95017ab2063SBarry Smith       }
95116cd7e1dSShri Abhyankar     }
9529566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
95317ab2063SBarry Smith   }
9549566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9553ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
956416022c9SBarry Smith }
957416022c9SBarry Smith 
9589804daf3SBarry Smith #include <petscdraw.h>
959ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
960d71ae5a4SJacob Faibussowitsch {
961480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
962416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
963383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
964383922c3SLisandro Dalcin   int                color;
965b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
966b0a32e0cSBarry Smith   PetscViewer        viewer;
967f3ef73ceSBarry Smith   PetscViewerFormat  format;
968fff043a9SJunchao Zhang   const PetscScalar *aa;
969cddf8d76SBarry Smith 
9703a40ed3dSBarry Smith   PetscFunctionBegin;
9719566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9729566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9739566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
974383922c3SLisandro Dalcin 
975416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
977fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
978d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9790513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
980b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
981416022c9SBarry Smith     for (i = 0; i < m; i++) {
9829371c9d4SSatish Balay       y_l = m - i - 1.0;
9839371c9d4SSatish Balay       y_r = y_l + 1.0;
984bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9859371c9d4SSatish Balay         x_l = a->j[j];
9869371c9d4SSatish Balay         x_r = x_l + 1.0;
987fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9889566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
989cddf8d76SBarry Smith       }
990cddf8d76SBarry Smith     }
991b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
992cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
9939371c9d4SSatish Balay       y_l = m - i - 1.0;
9949371c9d4SSatish Balay       y_r = y_l + 1.0;
995bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9969371c9d4SSatish Balay         x_l = a->j[j];
9979371c9d4SSatish Balay         x_r = x_l + 1.0;
998fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
9999566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1000cddf8d76SBarry Smith       }
1001cddf8d76SBarry Smith     }
1002b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1003cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10049371c9d4SSatish Balay       y_l = m - i - 1.0;
10059371c9d4SSatish Balay       y_r = y_l + 1.0;
1006bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10079371c9d4SSatish Balay         x_l = a->j[j];
10089371c9d4SSatish Balay         x_r = x_l + 1.0;
1009fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10109566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1011416022c9SBarry Smith       }
1012416022c9SBarry Smith     }
1013d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10140513a670SBarry Smith   } else {
10150513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10160513a670SBarry Smith     /* first determine max of all nonzero values */
1017b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1018383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1019b0a32e0cSBarry Smith     PetscDraw popup;
10200513a670SBarry Smith 
10210513a670SBarry Smith     for (i = 0; i < nz; i++) {
1022fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10230513a670SBarry Smith     }
1024383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10259566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10269566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1027383922c3SLisandro Dalcin 
1028d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10290513a670SBarry Smith     for (i = 0; i < m; i++) {
1030383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1031383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1032bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1033383922c3SLisandro Dalcin         x_l   = a->j[j];
1034383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1035fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10369566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10370513a670SBarry Smith         count++;
10380513a670SBarry Smith       }
10390513a670SBarry Smith     }
1040d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10410513a670SBarry Smith   }
10429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
10433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1044480ef9eaSBarry Smith }
1045cddf8d76SBarry Smith 
10469804daf3SBarry Smith #include <petscdraw.h>
1047ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1048d71ae5a4SJacob Faibussowitsch {
1049b0a32e0cSBarry Smith   PetscDraw draw;
105036db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1051ace3abfcSBarry Smith   PetscBool isnull;
1052480ef9eaSBarry Smith 
1053480ef9eaSBarry Smith   PetscFunctionBegin;
10549566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10559566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
10563ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
1057480ef9eaSBarry Smith 
10589371c9d4SSatish Balay   xr = A->cmap->n;
10599371c9d4SSatish Balay   yr = A->rmap->n;
10609371c9d4SSatish Balay   h  = yr / 10.0;
10619371c9d4SSatish Balay   w  = xr / 10.0;
10629371c9d4SSatish Balay   xr += w;
10639371c9d4SSatish Balay   yr += h;
10649371c9d4SSatish Balay   xl = -w;
10659371c9d4SSatish Balay   yl = -h;
10669566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10679566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10689566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10699566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10709566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1072416022c9SBarry Smith }
1073416022c9SBarry Smith 
1074d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1075d71ae5a4SJacob Faibussowitsch {
1076ace3abfcSBarry Smith   PetscBool iascii, isbinary, isdraw;
1077416022c9SBarry Smith 
10783a40ed3dSBarry Smith   PetscFunctionBegin;
10799566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii));
10809566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10819566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10821baa6e33SBarry Smith   if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10831baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10841baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10859566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10863ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
108717ab2063SBarry Smith }
108819bcc07fSBarry Smith 
1089d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1090d71ae5a4SJacob Faibussowitsch {
1091416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1092580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
1093bc43efbbSJunchao Zhang   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n;
109454f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
10953447b6efSHong Zhang   PetscReal   ratio = 0.6;
109617ab2063SBarry Smith 
10973a40ed3dSBarry Smith   PetscFunctionBegin;
10983ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
10999566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
1100b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
1101b215bc84SStefano Zampini     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */
11029566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11033ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1104b215bc84SStefano Zampini   }
110517ab2063SBarry Smith 
110643ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
110717ab2063SBarry Smith   for (i = 1; i < m; i++) {
1108416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
110917ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
111094a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111117ab2063SBarry Smith     if (fshift) {
1112bfeeae90SHong Zhang       ip = aj + ai[i];
1113bfeeae90SHong Zhang       ap = aa + ai[i];
111417ab2063SBarry Smith       N  = ailen[i];
11159566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
111648a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
111717ab2063SBarry Smith     }
111817ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
111917ab2063SBarry Smith   }
112017ab2063SBarry Smith   if (m) {
112117ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112217ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
112317ab2063SBarry Smith   }
112417ab2063SBarry Smith   /* reset ilen and imax for each row */
11257b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1126396832f4SHong Zhang   if (A->structure_only) {
11279566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11289566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1129396832f4SHong Zhang   } else { /* !A->structure_only */
113017ab2063SBarry Smith     for (i = 0; i < m; i++) {
113117ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11327b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
113317ab2063SBarry Smith     }
1134396832f4SHong Zhang   }
1135bfeeae90SHong Zhang   a->nz = ai[m];
1136aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
1137bc43efbbSJunchao Zhang   PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly
1138bc43efbbSJunchao Zhang   a->diagonaldense = PETSC_TRUE;
1139bc43efbbSJunchao Zhang   n                = PetscMin(A->rmap->n, A->cmap->n);
1140bc43efbbSJunchao Zhang   for (i = 0; i < n; i++) {
1141bc43efbbSJunchao Zhang     if (a->diag[i] >= ai[i + 1]) {
1142bc43efbbSJunchao Zhang       a->diagonaldense = PETSC_FALSE;
1143bc43efbbSJunchao Zhang       break;
1144bc43efbbSJunchao Zhang     }
1145bc43efbbSJunchao Zhang   }
11469566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11479566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11489566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11492205254eSKarl Rupp 
11508e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1151dd5f02e7SSatish Balay   a->reallocs         = 0;
11526712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
115336db0b34SBarry Smith   a->rmax             = rmax;
11544e220ebcSLois Curfman McInnes 
115548a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11569566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
115817ab2063SBarry Smith }
115917ab2063SBarry Smith 
1160ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1161d71ae5a4SJacob Faibussowitsch {
116299cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
116399cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11642e5835c6SStefano Zampini   MatScalar  *aa;
116599cafbc1SBarry Smith 
116699cafbc1SBarry Smith   PetscFunctionBegin;
11679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
116899cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
117299cafbc1SBarry Smith }
117399cafbc1SBarry Smith 
1174ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1175d71ae5a4SJacob Faibussowitsch {
117699cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
117799cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11782e5835c6SStefano Zampini   MatScalar  *aa;
117999cafbc1SBarry Smith 
118099cafbc1SBarry Smith   PetscFunctionBegin;
11819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
118299cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
118699cafbc1SBarry Smith }
118799cafbc1SBarry Smith 
1188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1189d71ae5a4SJacob Faibussowitsch {
1190fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1191fff043a9SJunchao Zhang   MatScalar  *aa;
11923a40ed3dSBarry Smith 
11933a40ed3dSBarry Smith   PetscFunctionBegin;
11949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
11959566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
11969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
11979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
119917ab2063SBarry Smith }
1200416022c9SBarry Smith 
1201d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1202d71ae5a4SJacob Faibussowitsch {
1203416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1204d5d45c9bSBarry Smith 
12053a40ed3dSBarry Smith   PetscFunctionBegin;
1206b4e2f619SBarry Smith   if (A->hash_active) {
1207e3c72094SPierre Jolivet     A->ops[0] = a->cops;
1208b4e2f619SBarry Smith     PetscCall(PetscHMapIJVDestroy(&a->ht));
1209b4e2f619SBarry Smith     PetscCall(PetscFree(a->dnz));
1210b4e2f619SBarry Smith     A->hash_active = PETSC_FALSE;
1211b4e2f619SBarry Smith   }
1212b4e2f619SBarry Smith 
12133ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz));
12149566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12159566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12169566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12179566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12189566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12199566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12209566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12219566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12229566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12239566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12249566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12259566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
12269566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12279566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
12289566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1229901853e0SKris Buschelman 
12306718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12316718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12326718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12336718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12346718818eSStefano Zampini      due to different matrix sizes */
12359566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12366718818eSStefano Zampini 
12379566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12382e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12392e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12459566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12462e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12472e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12482e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12492e956fe4SStefano Zampini #endif
12504222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12544222ddf1SHong Zhang #endif
1255d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
1256d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL));
1257d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL));
1258d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL));
1259d5e393b6SSuyash Tandon #endif
12603d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12619566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12623d0639e7SStefano Zampini #endif
12639566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1264af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12659566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1266af8000cdSHong Zhang #endif
1267d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
12689566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1269d24d4204SJose E. Roman #endif
127063c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12719566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12729566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
127363c07aadSStefano Zampini #endif
12749566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
12769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
12779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
12782e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
12799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
12809566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
12819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
12829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
12839566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
12849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
12859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
12869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
12879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
12889566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
12892e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
12902e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
12912e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
12922e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
12932e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
12942e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
12952e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
12963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
129717ab2063SBarry Smith }
129817ab2063SBarry Smith 
1299d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1300d71ae5a4SJacob Faibussowitsch {
1301416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
13023a40ed3dSBarry Smith 
13033a40ed3dSBarry Smith   PetscFunctionBegin;
1304a65d3064SKris Buschelman   switch (op) {
1305d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1306d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1307d71ae5a4SJacob Faibussowitsch     break;
1308d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1309d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1310d71ae5a4SJacob Faibussowitsch     break;
1311d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1312d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1313d71ae5a4SJacob Faibussowitsch     break;
1314d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1315d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1316d71ae5a4SJacob Faibussowitsch     break;
1317d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1318d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1319d71ae5a4SJacob Faibussowitsch     break;
1320d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1321d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1322d71ae5a4SJacob Faibussowitsch     break;
1323d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1324d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1325d71ae5a4SJacob Faibussowitsch     break;
13263d472b54SHong Zhang   case MAT_SPD:
1327b1646e73SJed Brown   case MAT_SYMMETRIC:
1328b1646e73SJed Brown   case MAT_STRUCTURALLY_SYMMETRIC:
1329b1646e73SJed Brown   case MAT_HERMITIAN:
1330b1646e73SJed Brown   case MAT_SYMMETRY_ETERNAL:
1331957cac9fSHong Zhang   case MAT_STRUCTURE_ONLY:
1332b94d7dedSBarry Smith   case MAT_STRUCTURAL_SYMMETRY_ETERNAL:
1333b94d7dedSBarry Smith   case MAT_SPD_ETERNAL:
1334b94d7dedSBarry Smith     /* if the diagonal matrix is square it inherits some of the properties above */
13355021d80fSJed Brown     break;
13368c78258cSHong Zhang   case MAT_FORCE_DIAGONAL_ENTRIES:
1337a65d3064SKris Buschelman   case MAT_IGNORE_OFF_PROC_ENTRIES:
1338d71ae5a4SJacob Faibussowitsch   case MAT_USE_HASH_TABLE:
1339d71ae5a4SJacob Faibussowitsch     PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op]));
1340d71ae5a4SJacob Faibussowitsch     break;
1341d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1342d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1343d71ae5a4SJacob Faibussowitsch     break;
1344d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1345d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1346d71ae5a4SJacob Faibussowitsch     break;
1347071fcb05SBarry Smith   case MAT_SORTED_FULL:
1348071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1349071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1350071fcb05SBarry Smith     break;
1351d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1352d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1353d71ae5a4SJacob Faibussowitsch     break;
1354d71ae5a4SJacob Faibussowitsch   default:
1355d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op);
1356a65d3064SKris Buschelman   }
13573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
135817ab2063SBarry Smith }
135917ab2063SBarry Smith 
1360ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1361d71ae5a4SJacob Faibussowitsch {
1362416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1363fdc842d1SBarry Smith   PetscInt           i, j, n, *ai = a->i, *aj = a->j;
1364c898d852SStefano Zampini   PetscScalar       *x;
1365c898d852SStefano Zampini   const PetscScalar *aa;
136617ab2063SBarry Smith 
13673a40ed3dSBarry Smith   PetscFunctionBegin;
13689566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
136908401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1371d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1372d3e70bfaSHong Zhang     PetscInt *diag = a->diag;
13739566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
13742c990fa1SHong Zhang     for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13759566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13769566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13773ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
137835e7444dSHong Zhang   }
137935e7444dSHong Zhang 
13809566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
138135e7444dSHong Zhang   for (i = 0; i < n; i++) {
1382fdc842d1SBarry Smith     x[i] = 0.0;
138335e7444dSHong Zhang     for (j = ai[i]; j < ai[i + 1]; j++) {
138435e7444dSHong Zhang       if (aj[j] == i) {
138535e7444dSHong Zhang         x[i] = aa[j];
138617ab2063SBarry Smith         break;
138717ab2063SBarry Smith       }
138817ab2063SBarry Smith     }
138917ab2063SBarry Smith   }
13909566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
13919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
139317ab2063SBarry Smith }
139417ab2063SBarry Smith 
1395c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1396d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1397d71ae5a4SJacob Faibussowitsch {
1398416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
13995f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1400d9ca1df4SBarry Smith   PetscScalar       *y;
1401d9ca1df4SBarry Smith   const PetscScalar *x;
1402d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
14035c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
14045f22a7b3SSebastian Grimberg   const MatScalar  *v;
1405a77337e4SBarry Smith   PetscScalar       alpha;
1406d9ca1df4SBarry Smith   PetscInt          n, i, j;
1407d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14083447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1409ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14105c897100SBarry Smith #endif
141117ab2063SBarry Smith 
14123a40ed3dSBarry Smith   PetscFunctionBegin;
14139566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14149566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14159566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14175c897100SBarry Smith 
14185c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1419fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14205c897100SBarry Smith #else
14213447b6efSHong Zhang   if (usecprow) {
14223447b6efSHong Zhang     m    = cprow.nrows;
14233447b6efSHong Zhang     ii   = cprow.i;
14247b2bb3b9SHong Zhang     ridx = cprow.rindex;
14253447b6efSHong Zhang   } else {
14263447b6efSHong Zhang     ii = a->i;
14273447b6efSHong Zhang   }
142817ab2063SBarry Smith   for (i = 0; i < m; i++) {
14293447b6efSHong Zhang     idx = a->j + ii[i];
1430fff043a9SJunchao Zhang     v   = aa + ii[i];
14313447b6efSHong Zhang     n   = ii[i + 1] - ii[i];
14323447b6efSHong Zhang     if (usecprow) {
14337b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14343447b6efSHong Zhang     } else {
143517ab2063SBarry Smith       alpha = x[i];
14363447b6efSHong Zhang     }
143704fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
143817ab2063SBarry Smith   }
14395c897100SBarry Smith #endif
14409566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14419566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14429566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14443ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
144517ab2063SBarry Smith }
144617ab2063SBarry Smith 
1447d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1448d71ae5a4SJacob Faibussowitsch {
14495c897100SBarry Smith   PetscFunctionBegin;
14509566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14519566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14535c897100SBarry Smith }
14545c897100SBarry Smith 
1455c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
145678b84d54SShri Abhyankar 
1457d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1458d71ae5a4SJacob Faibussowitsch {
1459416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1460d9fead3dSBarry Smith   PetscScalar       *y;
146154f21887SBarry Smith   const PetscScalar *x;
14625914357eSBarry Smith   const MatScalar   *a_a;
1463003131ecSBarry Smith   PetscInt           m = A->rmap->n;
14645914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
1465ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
146617ab2063SBarry Smith 
1467b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
146897952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1469fee21e36SBarry Smith #endif
1470fee21e36SBarry Smith 
14713a40ed3dSBarry Smith   PetscFunctionBegin;
1472b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14739566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
14743ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1475b215bc84SStefano Zampini   }
14769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14779566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14789566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1479416022c9SBarry Smith   ii = a->i;
14804eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14819566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
148297952fefSHong Zhang     m    = a->compressedrow.nrows;
148397952fefSHong Zhang     ii   = a->compressedrow.i;
148497952fefSHong Zhang     ridx = a->compressedrow.rindex;
14855914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
14865914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
14875914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
14885914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
14895914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
14905914357eSBarry Smith       PetscScalar        sum = 0.0;
1491003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1492003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
149397952fefSHong Zhang       y[*ridx++] = sum;
149497952fefSHong Zhang     }
149597952fefSHong Zhang   } else { /* do not use compressed row format */
1496b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
14975914357eSBarry Smith     fortranmultaij_(&m, x, ii, a->j, a_a, y);
1498b05257ddSBarry Smith #else
14995914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
15005914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
15015914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
15025914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
15035914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
15045914357eSBarry Smith       PetscScalar        sum = 0.0;
1505003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
150617ab2063SBarry Smith       y[i] = sum;
150717ab2063SBarry Smith     }
15088d195f9aSBarry Smith #endif
1509b05257ddSBarry Smith   }
15109566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15119566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15129566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15143ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
151517ab2063SBarry Smith }
151617ab2063SBarry Smith 
1517ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1518ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1519d71ae5a4SJacob Faibussowitsch {
1520b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1521b434eb95SMatthew G. Knepley   PetscScalar       *y;
1522b434eb95SMatthew G. Knepley   const PetscScalar *x;
1523fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1524b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1525b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1526b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1527b434eb95SMatthew G. Knepley   PetscScalar        sum;
1528b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1529b434eb95SMatthew G. Knepley 
1530b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1531b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1532b434eb95SMatthew G. Knepley #endif
1533b434eb95SMatthew G. Knepley 
1534b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15369566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15379566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1538b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1539b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1540b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1541b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1542b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1543b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1544b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1545fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1546b434eb95SMatthew G. Knepley       sum = 0.0;
1547b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1548b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1549b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1550b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1551b434eb95SMatthew G. Knepley     }
1552b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15533d3eaba7SBarry Smith     ii = a->i;
1554b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1555b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1556b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1557fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1558b434eb95SMatthew G. Knepley       sum = 0.0;
1559b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1560b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1561b434eb95SMatthew G. Knepley       y[i] = sum;
1562b434eb95SMatthew G. Knepley     }
1563b434eb95SMatthew G. Knepley   }
15649566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15659566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15669566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1569b434eb95SMatthew G. Knepley }
1570b434eb95SMatthew G. Knepley 
1571ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1572ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1573d71ae5a4SJacob Faibussowitsch {
1574b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1575b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1576b434eb95SMatthew G. Knepley   const PetscScalar *x;
1577fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1578b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1579b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1580b434eb95SMatthew G. Knepley   PetscScalar        sum;
1581b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1582b434eb95SMatthew G. Knepley 
1583b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15859566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15869566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1587b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
158848a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1589b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1590b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1591b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1592b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1593b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1594b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1595fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1596b434eb95SMatthew G. Knepley       sum = y[*ridx];
1597b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1598b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1599b434eb95SMatthew G. Knepley     }
1600b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
16013d3eaba7SBarry Smith     ii = a->i;
1602b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1603b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1604b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1605fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1606b434eb95SMatthew G. Knepley       sum = y[i];
1607b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1608b434eb95SMatthew G. Knepley       z[i] = sum;
1609b434eb95SMatthew G. Knepley     }
1610b434eb95SMatthew G. Knepley   }
16119566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16129566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16139566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1616b434eb95SMatthew G. Knepley }
1617b434eb95SMatthew G. Knepley 
1618c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1619d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1620d71ae5a4SJacob Faibussowitsch {
1621416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1622f15663dcSBarry Smith   PetscScalar       *y, *z;
1623f15663dcSBarry Smith   const PetscScalar *x;
16245914357eSBarry Smith   const MatScalar   *a_a;
16255914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
16265914357eSBarry Smith   PetscInt           m        = A->rmap->n;
1627ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16289ea0dfa2SSatish Balay 
16293a40ed3dSBarry Smith   PetscFunctionBegin;
1630b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16319566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
16323ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1633b215bc84SStefano Zampini   }
16349566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16359566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16369566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16374eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
163848a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
163997952fefSHong Zhang     m    = a->compressedrow.nrows;
164097952fefSHong Zhang     ii   = a->compressedrow.i;
164197952fefSHong Zhang     ridx = a->compressedrow.rindex;
16425914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16435914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16445914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16455914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16465914357eSBarry Smith       PetscScalar        sum = y[*ridx];
1647f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
164897952fefSHong Zhang       z[*ridx++] = sum;
164997952fefSHong Zhang     }
165097952fefSHong Zhang   } else { /* do not use compressed row format */
16513d3eaba7SBarry Smith     ii = a->i;
1652f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
16535914357eSBarry Smith     fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z);
1654f15663dcSBarry Smith #else
16555914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
16565914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16575914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16585914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16595914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16605914357eSBarry Smith       PetscScalar        sum = y[i];
1661f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
166217ab2063SBarry Smith       z[i] = sum;
166317ab2063SBarry Smith     }
166402ab625aSSatish Balay #endif
1665f15663dcSBarry Smith   }
16669566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16679566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16689566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
167117ab2063SBarry Smith }
167217ab2063SBarry Smith 
167317ab2063SBarry Smith /*
167417ab2063SBarry Smith      Adds diagonal pointers to sparse matrix structure.
167517ab2063SBarry Smith */
1676d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
1677d71ae5a4SJacob Faibussowitsch {
1678416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1679d0f46423SBarry Smith   PetscInt    i, j, m = A->rmap->n;
1680c0c07093SJunchao Zhang   PetscBool   alreadySet = PETSC_TRUE;
168117ab2063SBarry Smith 
16823a40ed3dSBarry Smith   PetscFunctionBegin;
168309f38230SBarry Smith   if (!a->diag) {
16849566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &a->diag));
1685c0c07093SJunchao Zhang     alreadySet = PETSC_FALSE;
168609f38230SBarry Smith   }
1687d0f46423SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
1688c0c07093SJunchao Zhang     /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */
1689c0c07093SJunchao Zhang     if (alreadySet) {
1690c0c07093SJunchao Zhang       PetscInt pos = a->diag[i];
1691c0c07093SJunchao Zhang       if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue;
1692c0c07093SJunchao Zhang     }
1693c0c07093SJunchao Zhang 
169409f38230SBarry Smith     a->diag[i] = a->i[i + 1];
1695bfeeae90SHong Zhang     for (j = a->i[i]; j < a->i[i + 1]; j++) {
1696bfeeae90SHong Zhang       if (a->j[j] == i) {
169709f38230SBarry Smith         a->diag[i] = j;
169817ab2063SBarry Smith         break;
169917ab2063SBarry Smith       }
170017ab2063SBarry Smith     }
170117ab2063SBarry Smith   }
17023ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
170317ab2063SBarry Smith }
170417ab2063SBarry Smith 
1705ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1706d71ae5a4SJacob Faibussowitsch {
170761ecd0c6SBarry Smith   Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
170861ecd0c6SBarry Smith   const PetscInt *diag = (const PetscInt *)a->diag;
170961ecd0c6SBarry Smith   const PetscInt *ii   = (const PetscInt *)a->i;
171061ecd0c6SBarry Smith   PetscInt        i, *mdiag = NULL;
171161ecd0c6SBarry Smith   PetscInt        cnt = 0; /* how many diagonals are missing */
171261ecd0c6SBarry Smith 
171361ecd0c6SBarry Smith   PetscFunctionBegin;
171461ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
17159566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
17169566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
17173ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
171861ecd0c6SBarry Smith   }
171961ecd0c6SBarry Smith 
172061ecd0c6SBarry Smith   if (a->diagonaldense) {
172161ecd0c6SBarry Smith     cnt = 0;
172261ecd0c6SBarry Smith   } else {
17239566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
172461ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
1725349d3b71SJunchao Zhang       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
172661ecd0c6SBarry Smith         cnt++;
172761ecd0c6SBarry Smith         mdiag[i] = 1;
172861ecd0c6SBarry Smith       }
172961ecd0c6SBarry Smith     }
173061ecd0c6SBarry Smith   }
173161ecd0c6SBarry Smith   if (!cnt) {
17329566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
173361ecd0c6SBarry Smith   } else {
1734b6f2aa54SBarry Smith     PetscScalar       *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1735b6f2aa54SBarry Smith     PetscInt          *oldj = a->j, *oldi = a->i;
1736*9f0612e4SBarry Smith     PetscBool          free_a = a->free_a, free_ij = a->free_ij;
17376ea2a7edSJunchao Zhang     const PetscScalar *Aa;
17386ea2a7edSJunchao Zhang 
17396ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host
17406ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa));
174161ecd0c6SBarry Smith 
174261ecd0c6SBarry Smith     a->a = NULL;
174361ecd0c6SBarry Smith     a->j = NULL;
174461ecd0c6SBarry Smith     a->i = NULL;
174561ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
1746ad540459SPierre Jolivet     for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17479566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
174861ecd0c6SBarry Smith 
174961ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
175061ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
17519566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
175248a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1753447d62f5SStefano Zampini     }
17549566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17559566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
1756*9f0612e4SBarry Smith     if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda));
1757*9f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj));
1758*9f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi));
175961ecd0c6SBarry Smith   }
17609566063dSJacob Faibussowitsch   PetscCall(PetscFree(mdiag));
176161ecd0c6SBarry Smith   a->diagonaldense = PETSC_TRUE;
17623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
176361ecd0c6SBarry Smith }
176461ecd0c6SBarry Smith 
1765be5855fcSBarry Smith /*
1766be5855fcSBarry Smith      Checks for missing diagonals
1767be5855fcSBarry Smith */
1768d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d)
1769d71ae5a4SJacob Faibussowitsch {
1770be5855fcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
17717734d3b5SMatthew G. Knepley   PetscInt   *diag, *ii = a->i, i;
1772be5855fcSBarry Smith 
1773be5855fcSBarry Smith   PetscFunctionBegin;
177409f38230SBarry Smith   *missing = PETSC_FALSE;
17757734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
177609f38230SBarry Smith     *missing = PETSC_TRUE;
177709f38230SBarry Smith     if (d) *d = 0;
17789566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
177909f38230SBarry Smith   } else {
178001445905SHong Zhang     PetscInt n;
178101445905SHong Zhang     n    = PetscMin(A->rmap->n, A->cmap->n);
1782f1e2ffcdSBarry Smith     diag = a->diag;
178301445905SHong Zhang     for (i = 0; i < n; i++) {
17847734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
178509f38230SBarry Smith         *missing = PETSC_TRUE;
178609f38230SBarry Smith         if (d) *d = i;
17879566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i));
1788358d2f5dSShri Abhyankar         break;
178909f38230SBarry Smith       }
1790be5855fcSBarry Smith     }
1791be5855fcSBarry Smith   }
17923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1793be5855fcSBarry Smith }
1794be5855fcSBarry Smith 
17950da83c2eSBarry Smith #include <petscblaslapack.h>
17960da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
17970da83c2eSBarry Smith 
17980da83c2eSBarry Smith /*
17990da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
18000da83c2eSBarry Smith */
1801ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1802d71ae5a4SJacob Faibussowitsch {
18030da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
18040da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
18050da83c2eSBarry Smith   const PetscReal shift = 0.0;
18060da83c2eSBarry Smith   PetscInt        ipvt[5];
18074e208921SJed Brown   PetscCount      flops = 0;
18080da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
18090da83c2eSBarry Smith 
18100da83c2eSBarry Smith   PetscFunctionBegin;
18110da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
18120da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
181308401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1814ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
18159566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
181648a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
18170da83c2eSBarry Smith   ncnt = 0;
18180da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
18190da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
18209566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
18210da83c2eSBarry Smith     switch (bsizes[i]) {
1822d71ae5a4SJacob Faibussowitsch     case 1:
1823d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1824d71ae5a4SJacob Faibussowitsch       break;
18250da83c2eSBarry Smith     case 2:
18269566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
18270da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18289566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
18290da83c2eSBarry Smith       break;
18300da83c2eSBarry Smith     case 3:
18319566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
18320da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18339566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
18340da83c2eSBarry Smith       break;
18350da83c2eSBarry Smith     case 4:
18369566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
18370da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18389566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
18390da83c2eSBarry Smith       break;
18400da83c2eSBarry Smith     case 5:
18419566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
18420da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18439566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
18440da83c2eSBarry Smith       break;
18450da83c2eSBarry Smith     case 6:
18469566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
18470da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18489566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
18490da83c2eSBarry Smith       break;
18500da83c2eSBarry Smith     case 7:
18519566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
18520da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18539566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
18540da83c2eSBarry Smith       break;
18550da83c2eSBarry Smith     default:
18569566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
18570da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18589566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
18590da83c2eSBarry Smith     }
18600da83c2eSBarry Smith     ncnt += bsizes[i];
18610da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
1862baa50dc0SBrad Aagaard     flops += 2 * PetscPowInt64(bsizes[i], 3) / 3;
18630da83c2eSBarry Smith   }
18643ba16761SJacob Faibussowitsch   PetscCall(PetscLogFlops(flops));
186548a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18669566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18673ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18680da83c2eSBarry Smith }
18690da83c2eSBarry Smith 
1870422a814eSBarry Smith /*
1871422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1872422a814eSBarry Smith */
1873ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1874d71ae5a4SJacob Faibussowitsch {
187571f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1876d0f46423SBarry Smith   PetscInt         i, *diag, m = A->rmap->n;
18772e5835c6SStefano Zampini   const MatScalar *v;
187854f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
187971f1c65dSBarry Smith 
188071f1c65dSBarry Smith   PetscFunctionBegin;
18813ba16761SJacob Faibussowitsch   if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS);
18829566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
188371f1c65dSBarry Smith   diag = a->diag;
18844dfa11a4SJacob Faibussowitsch   if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); }
18852e5835c6SStefano Zampini 
188671f1c65dSBarry Smith   mdiag = a->mdiag;
188771f1c65dSBarry Smith   idiag = a->idiag;
18889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1889422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
189071f1c65dSBarry Smith     for (i = 0; i < m; i++) {
189171f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1892899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1893899639b0SHong Zhang         if (PetscRealPart(fshift)) {
18949566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
18957b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18967b6c816cSBarry Smith           A->factorerror_zeropivot_value = 0.0;
18977b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
189898921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
1899899639b0SHong Zhang       }
190071f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
190171f1c65dSBarry Smith     }
19029566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
190371f1c65dSBarry Smith   } else {
190471f1c65dSBarry Smith     for (i = 0; i < m; i++) {
190571f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
190671f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
190771f1c65dSBarry Smith     }
19089566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
190971f1c65dSBarry Smith   }
191071f1c65dSBarry Smith   a->idiagvalid = PETSC_TRUE;
19119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
19123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
191371f1c65dSBarry Smith }
191471f1c65dSBarry Smith 
1915d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1916d71ae5a4SJacob Faibussowitsch {
1917416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1918e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
19192e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
192054f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
19213d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
192297f1f81fSBarry Smith   const PetscInt    *idx, *diag;
192317ab2063SBarry Smith 
19243a40ed3dSBarry Smith   PetscFunctionBegin;
1925b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
19269566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
19273ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1928b215bc84SStefano Zampini   }
1929b965ef7fSBarry Smith   its = its * lits;
193091723122SBarry Smith 
193171f1c65dSBarry Smith   if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
19329566063dSJacob Faibussowitsch   if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift));
193371f1c65dSBarry Smith   a->fshift = fshift;
193471f1c65dSBarry Smith   a->omega  = omega;
1935ed480e8bSBarry Smith 
193671f1c65dSBarry Smith   diag  = a->diag;
193771f1c65dSBarry Smith   t     = a->ssor_work;
1938ed480e8bSBarry Smith   idiag = a->idiag;
193971f1c65dSBarry Smith   mdiag = a->mdiag;
1940ed480e8bSBarry Smith 
19419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
19429566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
19439566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1944ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
194517ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
194617ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1947ed480e8bSBarry Smith     bs = b;
194817ab2063SBarry Smith     for (i = 0; i < m; i++) {
194971f1c65dSBarry Smith       d   = fshift + mdiag[i];
1950416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1951ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19522e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
195317ab2063SBarry Smith       sum = b[i] * d / omega;
1954003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
195517ab2063SBarry Smith       x[i] = sum;
195617ab2063SBarry Smith     }
19579566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19589566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19599566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
19609566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
19613ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
196217ab2063SBarry Smith   }
1963c783ea89SBarry Smith 
196408401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1965f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19664c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1967887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
196817ab2063SBarry Smith 
196917ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
197017ab2063SBarry Smith 
1971887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
197217ab2063SBarry Smith     */
197317ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
197417ab2063SBarry Smith 
197517ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
197617ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1977416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1978ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19792e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
198017ab2063SBarry Smith       sum = b[i];
1981e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1982ed480e8bSBarry Smith       x[i] = sum * idiag[i];
198317ab2063SBarry Smith     }
198417ab2063SBarry Smith 
198517ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19862e5835c6SStefano Zampini     v = aa;
19872205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
198817ab2063SBarry Smith 
198917ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1990ed480e8bSBarry Smith     ts   = t;
1991416022c9SBarry Smith     diag = a->diag;
199217ab2063SBarry Smith     for (i = 0; i < m; i++) {
1993416022c9SBarry Smith       n   = diag[i] - a->i[i];
1994ed480e8bSBarry Smith       idx = a->j + a->i[i];
19952e5835c6SStefano Zampini       v   = aa + a->i[i];
199617ab2063SBarry Smith       sum = t[i];
1997003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
1998ed480e8bSBarry Smith       t[i] = sum * idiag[i];
1999733d66baSBarry Smith       /*  x = x + t */
2000733d66baSBarry Smith       x[i] += t[i];
200117ab2063SBarry Smith     }
200217ab2063SBarry Smith 
20039566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
20049566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
20059566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
20063ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
200717ab2063SBarry Smith   }
200817ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
200917ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
201017ab2063SBarry Smith       for (i = 0; i < m; i++) {
2011416022c9SBarry Smith         n   = diag[i] - a->i[i];
2012ed480e8bSBarry Smith         idx = a->j + a->i[i];
20132e5835c6SStefano Zampini         v   = aa + a->i[i];
201417ab2063SBarry Smith         sum = b[i];
2015e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20165c99c7daSBarry Smith         t[i] = sum;
2017ed480e8bSBarry Smith         x[i] = sum * idiag[i];
201817ab2063SBarry Smith       }
20195c99c7daSBarry Smith       xb = t;
20209566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
20213a40ed3dSBarry Smith     } else xb = b;
202217ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
202317ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2024416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
2025ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
20262e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
202717ab2063SBarry Smith         sum = xb[i];
2028e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20295c99c7daSBarry Smith         if (xb == b) {
2030ed480e8bSBarry Smith           x[i] = sum * idiag[i];
20315c99c7daSBarry Smith         } else {
2032b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
203317ab2063SBarry Smith         }
20345c99c7daSBarry Smith       }
20359566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
203617ab2063SBarry Smith     }
203717ab2063SBarry Smith     its--;
203817ab2063SBarry Smith   }
203917ab2063SBarry Smith   while (its--) {
204017ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
204117ab2063SBarry Smith       for (i = 0; i < m; i++) {
2042b19a5dc2SMark Adams         /* lower */
2043b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
2044ed480e8bSBarry Smith         idx = a->j + a->i[i];
20452e5835c6SStefano Zampini         v   = aa + a->i[i];
204617ab2063SBarry Smith         sum = b[i];
2047e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2048b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
2049b19a5dc2SMark Adams         /* upper */
2050b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
2051b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
20522e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
2053b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2054b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
205517ab2063SBarry Smith       }
2056b19a5dc2SMark Adams       xb = t;
20579566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
2058b19a5dc2SMark Adams     } else xb = b;
205917ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
206017ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2061b19a5dc2SMark Adams         sum = xb[i];
2062b19a5dc2SMark Adams         if (xb == b) {
2063b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
2064416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
2065ed480e8bSBarry Smith           idx = a->j + a->i[i];
20662e5835c6SStefano Zampini           v   = aa + a->i[i];
2067e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2068ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2069b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2070b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2071b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20722e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2073b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2074b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
207517ab2063SBarry Smith         }
2076b19a5dc2SMark Adams       }
2077b19a5dc2SMark Adams       if (xb == b) {
20789566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2079b19a5dc2SMark Adams       } else {
20809566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2081b19a5dc2SMark Adams       }
208217ab2063SBarry Smith     }
208317ab2063SBarry Smith   }
20849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20859566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20869566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
20873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
208817ab2063SBarry Smith }
208917ab2063SBarry Smith 
2090ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2091d71ae5a4SJacob Faibussowitsch {
2092416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
20934e220ebcSLois Curfman McInnes 
20943a40ed3dSBarry Smith   PetscFunctionBegin;
20954e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
20963966268fSBarry Smith   info->nz_allocated = a->maxnz;
20973966268fSBarry Smith   info->nz_used      = a->nz;
20983966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
20993966268fSBarry Smith   info->assemblies   = A->num_ass;
21003966268fSBarry Smith   info->mallocs      = A->info.mallocs;
21014dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2102d5f3da31SBarry Smith   if (A->factortype) {
21034e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
21044e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
21054e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
21064e220ebcSLois Curfman McInnes   } else {
21074e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
21084e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
21094e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
21104e220ebcSLois Curfman McInnes   }
21113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
211217ab2063SBarry Smith }
211317ab2063SBarry Smith 
2114ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2115d71ae5a4SJacob Faibussowitsch {
2116416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2117c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
211897b48c8fSBarry Smith   const PetscScalar *xx;
21192e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2120c7da8527SEric Chamberland   PetscInt           d = 0;
212117ab2063SBarry Smith 
21223a40ed3dSBarry Smith   PetscFunctionBegin;
212397b48c8fSBarry Smith   if (x && b) {
21249566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21259566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
212697b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2127aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2128447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
212997b48c8fSBarry Smith       bb[rows[i]] = diag * xx[rows[i]];
213097b48c8fSBarry Smith     }
21319566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21329566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
213397b48c8fSBarry Smith   }
213497b48c8fSBarry Smith 
21359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2136a9817697SBarry Smith   if (a->keepnonzeropattern) {
2137f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2138aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21399566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2140f1e2ffcdSBarry Smith     }
2141f4df32b1SMatthew Knepley     if (diag != 0.0) {
2142c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2143c7da8527SEric Chamberland         d = rows[i];
2144447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
214508401ef6SPierre Jolivet         PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
2146c7da8527SEric Chamberland       }
2147f1e2ffcdSBarry Smith       for (i = 0; i < N; i++) {
2148447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
21492e5835c6SStefano Zampini         aa[a->diag[rows[i]]] = diag;
2150f1e2ffcdSBarry Smith       }
2151f1e2ffcdSBarry Smith     }
2152f1e2ffcdSBarry Smith   } else {
2153f4df32b1SMatthew Knepley     if (diag != 0.0) {
215417ab2063SBarry Smith       for (i = 0; i < N; i++) {
2155aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21567ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2157447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2158447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2159447d62f5SStefano Zampini           } else {
2160416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
21612e5835c6SStefano Zampini             aa[a->i[rows[i]]]   = diag;
2162bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2163447d62f5SStefano Zampini           }
2164447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
21659566063dSJacob Faibussowitsch           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
216617ab2063SBarry Smith         }
216717ab2063SBarry Smith       }
21683a40ed3dSBarry Smith     } else {
216917ab2063SBarry Smith       for (i = 0; i < N; i++) {
2170aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2171416022c9SBarry Smith         a->ilen[rows[i]] = 0;
217217ab2063SBarry Smith       }
217317ab2063SBarry Smith     }
2174e56f5c9eSBarry Smith     A->nonzerostate++;
2175f1e2ffcdSBarry Smith   }
21769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2177dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21783ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
217917ab2063SBarry Smith }
218017ab2063SBarry Smith 
2181ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2182d71ae5a4SJacob Faibussowitsch {
21836e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21846e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
21852b40b63fSBarry Smith   PetscBool          missing, *zeroed, vecs = PETSC_FALSE;
21866e169961SBarry Smith   const PetscScalar *xx;
21872e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
21886e169961SBarry Smith 
21896e169961SBarry Smith   PetscFunctionBegin;
21903ba16761SJacob Faibussowitsch   if (!N) PetscFunctionReturn(PETSC_SUCCESS);
21919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
21926e169961SBarry Smith   if (x && b) {
21939566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21949566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
21952b40b63fSBarry Smith     vecs = PETSC_TRUE;
21966e169961SBarry Smith   }
21979566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
21986e169961SBarry Smith   for (i = 0; i < N; i++) {
2199aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
22008e3a54c0SPierre Jolivet     PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]]));
22012205254eSKarl Rupp 
22026e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
22036e169961SBarry Smith   }
22046e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
22056e169961SBarry Smith     if (!zeroed[i]) {
22066e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
22074cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
22082e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
22092e5835c6SStefano Zampini           aa[j] = 0.0;
22106e169961SBarry Smith         }
22116e169961SBarry Smith       }
22124cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i];
22136e169961SBarry Smith   }
22146e169961SBarry Smith   if (x && b) {
22159566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
22169566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
22176e169961SBarry Smith   }
22189566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
22196e169961SBarry Smith   if (diag != 0.0) {
22209566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d));
22211d5a398dSstefano_zampini     if (missing) {
22221d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
22234cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2224aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
22259566063dSJacob Faibussowitsch         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
22261d5a398dSstefano_zampini       }
22271d5a398dSstefano_zampini     } else {
2228ad540459SPierre Jolivet       for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag;
22296e169961SBarry Smith     }
22301d5a398dSstefano_zampini   }
22319566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2232dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
22333ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22346e169961SBarry Smith }
22356e169961SBarry Smith 
2236d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2237d71ae5a4SJacob Faibussowitsch {
2238fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2239fff043a9SJunchao Zhang   const PetscScalar *aa;
224017ab2063SBarry Smith 
22413a40ed3dSBarry Smith   PetscFunctionBegin;
22429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2243416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
22448e3a54c0SPierre Jolivet   if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]);
224517ab2063SBarry Smith   if (idx) {
22465c0db29aSPierre Jolivet     if (*nz && a->j) *idx = a->j + a->i[row];
2247f4259b30SLisandro Dalcin     else *idx = NULL;
224817ab2063SBarry Smith   }
22499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
22503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225117ab2063SBarry Smith }
225217ab2063SBarry Smith 
2253d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2254d71ae5a4SJacob Faibussowitsch {
22553a40ed3dSBarry Smith   PetscFunctionBegin;
22563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225717ab2063SBarry Smith }
225817ab2063SBarry Smith 
2259ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2260d71ae5a4SJacob Faibussowitsch {
2261416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
22622e5835c6SStefano Zampini   const MatScalar *v;
226336db0b34SBarry Smith   PetscReal        sum = 0.0;
226497f1f81fSBarry Smith   PetscInt         i, j;
226517ab2063SBarry Smith 
22663a40ed3dSBarry Smith   PetscFunctionBegin;
22679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
226817ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2269570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2270570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2271792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2272570b7f6dSBarry Smith #else
2273416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22749371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22759371c9d4SSatish Balay       v++;
227617ab2063SBarry Smith     }
22778f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2278570b7f6dSBarry Smith #endif
22799566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22803a40ed3dSBarry Smith   } else if (type == NORM_1) {
228136db0b34SBarry Smith     PetscReal *tmp;
228297f1f81fSBarry Smith     PetscInt  *jj = a->j;
22839566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp));
2284064f8208SBarry Smith     *nrm = 0.0;
2285416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22869371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22879371c9d4SSatish Balay       v++;
228817ab2063SBarry Smith     }
2289d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2290064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
229117ab2063SBarry Smith     }
22929566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
22939566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
22943a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2295064f8208SBarry Smith     *nrm = 0.0;
2296d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
22978e3a54c0SPierre Jolivet       const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]);
229817ab2063SBarry Smith       sum                   = 0.0;
2299416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
23009371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
23019371c9d4SSatish Balay         v2++;
230217ab2063SBarry Smith       }
2303064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
230417ab2063SBarry Smith     }
23059566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
2306f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
23079566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
23083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
230917ab2063SBarry Smith }
231017ab2063SBarry Smith 
2311ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2312d71ae5a4SJacob Faibussowitsch {
23133d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
231454f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
23152e5835c6SStefano Zampini   const MatScalar *va, *vb;
231697f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2317cd0d46ebSvictorle 
2318cd0d46ebSvictorle   PetscFunctionBegin;
23199566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23209566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23215485867bSBarry Smith   if (ma != nb || na != mb) {
23225485867bSBarry Smith     *f = PETSC_FALSE;
23233ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23245485867bSBarry Smith   }
23259566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
23269566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
23279371c9d4SSatish Balay   aii = aij->i;
23289371c9d4SSatish Balay   bii = bij->i;
23299371c9d4SSatish Balay   adx = aij->j;
23309371c9d4SSatish Balay   bdx = bij->j;
23319566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23329566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2333cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2334cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2335cd0d46ebSvictorle 
2336cd0d46ebSvictorle   *f = PETSC_TRUE;
2337cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2338cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
233997f1f81fSBarry Smith       PetscInt    idc, idr;
23405485867bSBarry Smith       PetscScalar vc, vr;
2341cd0d46ebSvictorle       /* column/row index/value */
23425485867bSBarry Smith       idc = adx[aptr[i]];
23435485867bSBarry Smith       idr = bdx[bptr[idc]];
23445485867bSBarry Smith       vc  = va[aptr[i]];
23455485867bSBarry Smith       vr  = vb[bptr[idc]];
23465485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
23475485867bSBarry Smith         *f = PETSC_FALSE;
23485485867bSBarry Smith         goto done;
2349cd0d46ebSvictorle       } else {
23505485867bSBarry Smith         aptr[i]++;
23515485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2352cd0d46ebSvictorle       }
2353cd0d46ebSvictorle     }
2354cd0d46ebSvictorle   }
2355cd0d46ebSvictorle done:
23569566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23579566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23589566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
23599566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
23603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2361cd0d46ebSvictorle }
2362cd0d46ebSvictorle 
2363ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2364d71ae5a4SJacob Faibussowitsch {
23653d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
236654f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
236754f21887SBarry Smith   MatScalar  *va, *vb;
23681cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23691cbb95d3SBarry Smith 
23701cbb95d3SBarry Smith   PetscFunctionBegin;
23719566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23729566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23731cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23741cbb95d3SBarry Smith     *f = PETSC_FALSE;
23753ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23761cbb95d3SBarry Smith   }
23779371c9d4SSatish Balay   aii = aij->i;
23789371c9d4SSatish Balay   bii = bij->i;
23799371c9d4SSatish Balay   adx = aij->j;
23809371c9d4SSatish Balay   bdx = bij->j;
23819371c9d4SSatish Balay   va  = aij->a;
23829371c9d4SSatish Balay   vb  = bij->a;
23839566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23849566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23851cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23861cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23871cbb95d3SBarry Smith 
23881cbb95d3SBarry Smith   *f = PETSC_TRUE;
23891cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
23901cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
23911cbb95d3SBarry Smith       PetscInt    idc, idr;
23921cbb95d3SBarry Smith       PetscScalar vc, vr;
23931cbb95d3SBarry Smith       /* column/row index/value */
23941cbb95d3SBarry Smith       idc = adx[aptr[i]];
23951cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
23961cbb95d3SBarry Smith       vc  = va[aptr[i]];
23971cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
23981cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
23991cbb95d3SBarry Smith         *f = PETSC_FALSE;
24001cbb95d3SBarry Smith         goto done;
24011cbb95d3SBarry Smith       } else {
24021cbb95d3SBarry Smith         aptr[i]++;
24031cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
24041cbb95d3SBarry Smith       }
24051cbb95d3SBarry Smith     }
24061cbb95d3SBarry Smith   }
24071cbb95d3SBarry Smith done:
24089566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
24099566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
24103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24111cbb95d3SBarry Smith }
24121cbb95d3SBarry Smith 
2413d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2414d71ae5a4SJacob Faibussowitsch {
2415416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2416fff8e43fSBarry Smith   const PetscScalar *l, *r;
2417fff8e43fSBarry Smith   PetscScalar        x;
241854f21887SBarry Smith   MatScalar         *v;
2419fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2420fff8e43fSBarry Smith   const PetscInt    *jj;
242117ab2063SBarry Smith 
24223a40ed3dSBarry Smith   PetscFunctionBegin;
242317ab2063SBarry Smith   if (ll) {
24243ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
24253ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
24269566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
242708401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
24289566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
24299566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
243017ab2063SBarry Smith     for (i = 0; i < m; i++) {
243117ab2063SBarry Smith       x = l[i];
2432416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
24332205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
243417ab2063SBarry Smith     }
24359566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
24369566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
24379566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
243817ab2063SBarry Smith   }
243917ab2063SBarry Smith   if (rr) {
24409566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
244108401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
24429566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
24439566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
24442e5835c6SStefano Zampini     jj = a->j;
24452205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
24469566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
24479566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
24489566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
244917ab2063SBarry Smith   }
24509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
24513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
245217ab2063SBarry Smith }
245317ab2063SBarry Smith 
2454d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2455d71ae5a4SJacob Faibussowitsch {
2456db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2457d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
245897f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
24595d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
24602e5835c6SStefano Zampini   const PetscScalar *aa;
24615d0c19d7SBarry Smith   PetscInt           nrows, ncols;
246297f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
2463fb3c7e2dSJunchao Zhang   MatScalar         *a_new, *mat_a, *c_a;
2464416022c9SBarry Smith   Mat                C;
2465cdc6f3adSToby Isaac   PetscBool          stride;
246617ab2063SBarry Smith 
24673a40ed3dSBarry Smith   PetscFunctionBegin;
24689566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24699566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24709566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
247117ab2063SBarry Smith 
24729566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2473ff718158SBarry Smith   if (stride) {
24749566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2475ff718158SBarry Smith   } else {
2476ff718158SBarry Smith     first = 0;
2477ff718158SBarry Smith     step  = 0;
2478ff718158SBarry Smith   }
2479fee21e36SBarry Smith   if (stride && step == 1) {
248002834360SBarry Smith     /* special case of contiguous rows */
24819566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
248202834360SBarry Smith     /* loop over new rows determining lens and starting points */
248302834360SBarry Smith     for (i = 0; i < nrows; i++) {
2484bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2485a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2486a91a9bebSLisandro Dalcin       starts[i] = kstart;
248702834360SBarry Smith       for (k = kstart; k < kend; k++) {
2488bfeeae90SHong Zhang         if (aj[k] >= first) {
248902834360SBarry Smith           starts[i] = k;
249002834360SBarry Smith           break;
249102834360SBarry Smith         }
249202834360SBarry Smith       }
2493a2744918SBarry Smith       sum = 0;
249402834360SBarry Smith       while (k < kend) {
2495bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2496a2744918SBarry Smith         sum++;
249702834360SBarry Smith       }
2498a2744918SBarry Smith       lens[i] = sum;
249902834360SBarry Smith     }
250002834360SBarry Smith     /* create submatrix */
2501cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
250297f1f81fSBarry Smith       PetscInt n_cols, n_rows;
25039566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2504aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
25059566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
250608480c60SBarry Smith       C = *B;
25073a40ed3dSBarry Smith     } else {
25083bef6203SJed Brown       PetscInt rbs, cbs;
25099566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25109566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25119566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25129566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25139566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25149566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25159566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
251608480c60SBarry Smith     }
2517db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2518db02288aSLois Curfman McInnes 
251902834360SBarry Smith     /* loop over rows inserting into submatrix */
2520fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C
2521db02288aSLois Curfman McInnes     j_new = c->j;
2522db02288aSLois Curfman McInnes     i_new = c->i;
25239566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
252402834360SBarry Smith     for (i = 0; i < nrows; i++) {
2525a2744918SBarry Smith       ii    = starts[i];
2526a2744918SBarry Smith       lensi = lens[i];
2527810441c8SPierre Jolivet       if (lensi) {
2528ad540459SPierre Jolivet         for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
25299566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2530a2744918SBarry Smith         a_new += lensi;
2531810441c8SPierre Jolivet       }
2532a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2533a2744918SBarry Smith       c->ilen[i]   = lensi;
253402834360SBarry Smith     }
2535fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly
25369566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
25379566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
25383a40ed3dSBarry Smith   } else {
25399566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
25409566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
25419566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
25424dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
25436bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
25444dcab191SBarry Smith       smap[icol[i]] = i + 1;
25454dcab191SBarry Smith     }
25464dcab191SBarry Smith 
254702834360SBarry Smith     /* determine lens of each row */
254802834360SBarry Smith     for (i = 0; i < nrows; i++) {
2549bfeeae90SHong Zhang       kstart  = ai[irow[i]];
255002834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
255102834360SBarry Smith       lens[i] = 0;
255202834360SBarry Smith       for (k = kstart; k < kend; k++) {
2553ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
255402834360SBarry Smith       }
255502834360SBarry Smith     }
255617ab2063SBarry Smith     /* Create and fill new matrix */
2557a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2558ace3abfcSBarry Smith       PetscBool equal;
25590f5bd95cSBarry Smith 
256099141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2561aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
25629566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
2563fdfbdca6SPierre Jolivet       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros");
25649566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
256508480c60SBarry Smith       C = *B;
25663a40ed3dSBarry Smith     } else {
25673bef6203SJed Brown       PetscInt rbs, cbs;
25689566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25699566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25709566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25719566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
257237a5e0faSPierre Jolivet       if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs));
25739566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25749566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
257508480c60SBarry Smith     }
25769566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2577fb3c7e2dSJunchao Zhang 
2578f4f49eeaSPierre Jolivet     c = (Mat_SeqAIJ *)C->data;
2579fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C
258017ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
258199141d43SSatish Balay       row      = irow[i];
2582bfeeae90SHong Zhang       kstart   = ai[row];
258399141d43SSatish Balay       kend     = kstart + a->ilen[row];
2584bfeeae90SHong Zhang       mat_i    = c->i[i];
25858e3a54c0SPierre Jolivet       mat_j    = PetscSafePointerPlusOffset(c->j, mat_i);
25868e3a54c0SPierre Jolivet       mat_a    = PetscSafePointerPlusOffset(c_a, mat_i);
258799141d43SSatish Balay       mat_ilen = c->ilen + i;
258817ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2589bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2590ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
25912e5835c6SStefano Zampini           *mat_a++ = aa[k];
259299141d43SSatish Balay           (*mat_ilen)++;
259317ab2063SBarry Smith         }
259417ab2063SBarry Smith       }
259517ab2063SBarry Smith     }
25969566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
259702834360SBarry Smith     /* Free work space */
25989566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
25999566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
26009566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2601cdc6f3adSToby Isaac     /* sort */
2602cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2603cdc6f3adSToby Isaac       PetscInt ilen;
2604cdc6f3adSToby Isaac 
2605cdc6f3adSToby Isaac       mat_i = c->i[i];
26068e3a54c0SPierre Jolivet       mat_j = PetscSafePointerPlusOffset(c->j, mat_i);
26078e3a54c0SPierre Jolivet       mat_a = PetscSafePointerPlusOffset(c_a, mat_i);
2608cdc6f3adSToby Isaac       ilen  = c->ilen[i];
26099566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2610cdc6f3adSToby Isaac     }
2611fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a));
261202834360SBarry Smith   }
26138c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
26149566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2615305c6ccfSStefano Zampini #endif
26169566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
26179566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
261817ab2063SBarry Smith 
26199566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2620416022c9SBarry Smith   *B = C;
26213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
262217ab2063SBarry Smith }
262317ab2063SBarry Smith 
2624ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2625d71ae5a4SJacob Faibussowitsch {
262682d44351SHong Zhang   Mat B;
262782d44351SHong Zhang 
262882d44351SHong Zhang   PetscFunctionBegin;
2629c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
26309566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
26319566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
26329566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
26339566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
26349566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
263582d44351SHong Zhang     *subMat = B;
2636c2d650bdSHong Zhang   } else {
26379566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2638c2d650bdSHong Zhang   }
26393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
264082d44351SHong Zhang }
264182d44351SHong Zhang 
2642ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2643d71ae5a4SJacob Faibussowitsch {
264463b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
264563b91edcSBarry Smith   Mat         outA;
2646ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
264763b91edcSBarry Smith 
26483a40ed3dSBarry Smith   PetscFunctionBegin;
264908401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
26501df811f5SHong Zhang 
26519566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
26529566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2653a871dcd8SBarry Smith 
265463b91edcSBarry Smith   outA             = inA;
2655d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26569566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
26579566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
26582205254eSKarl Rupp 
26599566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
26609566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
26612205254eSKarl Rupp 
2662c3122656SLisandro Dalcin   a->row = row;
26632205254eSKarl Rupp 
26649566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
26659566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
26662205254eSKarl Rupp 
2667c3122656SLisandro Dalcin   a->col = col;
266863b91edcSBarry Smith 
266936db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26709566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26719566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2672f0ec6fceSSatish Balay 
267394a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
26749566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work));
267594a9d846SBarry Smith   }
267663b91edcSBarry Smith 
26779566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(inA));
2678137fb511SHong Zhang   if (row_identity && col_identity) {
26799566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2680137fb511SHong Zhang   } else {
26819566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2682137fb511SHong Zhang   }
26833ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2684a871dcd8SBarry Smith }
2685a871dcd8SBarry Smith 
2686d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2687d71ae5a4SJacob Faibussowitsch {
2688f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2689dfa0f9e5SStefano Zampini   PetscScalar *v;
2690c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
26913a40ed3dSBarry Smith 
26923a40ed3dSBarry Smith   PetscFunctionBegin;
26939566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
26949566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2695792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
26969566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
26979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
26989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(inA));
26993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2700f0b747eeSBarry Smith }
2701f0b747eeSBarry Smith 
2702d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2703d71ae5a4SJacob Faibussowitsch {
270416b64355SHong Zhang   PetscInt i;
270516b64355SHong Zhang 
270616b64355SHong Zhang   PetscFunctionBegin;
270716b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
27089566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
270916b64355SHong Zhang 
271048a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
27119566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
271216b64355SHong Zhang 
271316b64355SHong Zhang     if (submatj->rbuf1) {
27149566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
27159566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
271616b64355SHong Zhang     }
271716b64355SHong Zhang 
271848a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
27199566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
27209566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
272116b64355SHong Zhang   }
272216b64355SHong Zhang 
272316b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2724eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&submatj->rmap));
27259566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
27269566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
272716b64355SHong Zhang #else
27289566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
272916b64355SHong Zhang #endif
273016b64355SHong Zhang 
273116b64355SHong Zhang   if (!submatj->allcolumns) {
273216b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2733eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap));
273416b64355SHong Zhang #else
27359566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
273616b64355SHong Zhang #endif
273716b64355SHong Zhang   }
27389566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
273916b64355SHong Zhang 
27409566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
27413ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
274216b64355SHong Zhang }
274316b64355SHong Zhang 
2744d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2745d71ae5a4SJacob Faibussowitsch {
274616b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
27475c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
274816b64355SHong Zhang 
274916b64355SHong Zhang   PetscFunctionBegin;
27509566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
27519566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
27523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
275316b64355SHong Zhang }
275416b64355SHong Zhang 
275589a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
2756ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2757d71ae5a4SJacob Faibussowitsch {
27582d033e1fSHong Zhang   PetscInt     i;
27590fb991dcSHong Zhang   Mat          C;
27600fb991dcSHong Zhang   Mat_SeqAIJ  *c;
27610fb991dcSHong Zhang   Mat_SubSppt *submatj;
27622d033e1fSHong Zhang 
27632d033e1fSHong Zhang   PetscFunctionBegin;
27642d033e1fSHong Zhang   for (i = 0; i < n; i++) {
27650fb991dcSHong Zhang     C       = (*mat)[i];
27660fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
27670fb991dcSHong Zhang     submatj = c->submatis1;
27682d033e1fSHong Zhang     if (submatj) {
2769682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
277026cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27719566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27729566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27739566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27743faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27759566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27769566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27779566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2778682e4c99SStefano Zampini       }
27792d033e1fSHong Zhang     } else {
27809566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
27812d033e1fSHong Zhang     }
27822d033e1fSHong Zhang   }
278386e85357SHong Zhang 
278463a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
27859566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
278663a75b2aSHong Zhang 
27879566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
27883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
27892d033e1fSHong Zhang }
27902d033e1fSHong Zhang 
2791ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2792d71ae5a4SJacob Faibussowitsch {
279397f1f81fSBarry Smith   PetscInt i;
2794cddf8d76SBarry Smith 
27953a40ed3dSBarry Smith   PetscFunctionBegin;
279648a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2797cddf8d76SBarry Smith 
279848a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
27993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2800cddf8d76SBarry Smith }
2801cddf8d76SBarry Smith 
2802ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2803d71ae5a4SJacob Faibussowitsch {
2804e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28059a88ca10SBarry Smith   PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
28065d0c19d7SBarry Smith   const PetscInt *idx;
28079a88ca10SBarry Smith   PetscInt        start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1;
2808f1af5d2fSBarry Smith   PetscBT         table;
2809bbd702dbSSatish Balay 
28103a40ed3dSBarry Smith   PetscFunctionBegin;
28119a88ca10SBarry Smith   m  = A->rmap->n / bs;
2812e4d965acSSatish Balay   ai = a->i;
2813bfeeae90SHong Zhang   aj = a->j;
28148a047759SSatish Balay 
281508401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
281606763907SSatish Balay 
28179566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
28189566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
281906763907SSatish Balay 
2820e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2821b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2822e4d965acSSatish Balay     isz = 0;
28239566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2824e4d965acSSatish Balay 
2825e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28269566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
28279566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2828e4d965acSSatish Balay 
28299a88ca10SBarry Smith     if (bs > 1) {
28309a88ca10SBarry Smith       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
28319a88ca10SBarry Smith       for (j = 0; j < n; ++j) {
28329a88ca10SBarry Smith         if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
28339a88ca10SBarry Smith       }
28349a88ca10SBarry Smith       PetscCall(ISRestoreIndices(is[i], &idx));
28359a88ca10SBarry Smith       PetscCall(ISDestroy(&is[i]));
28369a88ca10SBarry Smith 
28379a88ca10SBarry Smith       k = 0;
28389a88ca10SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
28399a88ca10SBarry Smith         n = isz;
28409a88ca10SBarry Smith         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
28419a88ca10SBarry Smith           for (ll = 0; ll < bs; ll++) {
28429a88ca10SBarry Smith             row   = bs * nidx[k] + ll;
28439a88ca10SBarry Smith             start = ai[row];
28449a88ca10SBarry Smith             end   = ai[row + 1];
28459a88ca10SBarry Smith             for (l = start; l < end; l++) {
28469a88ca10SBarry Smith               val = aj[l] / bs;
28479a88ca10SBarry Smith               if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
28489a88ca10SBarry Smith             }
28499a88ca10SBarry Smith           }
28509a88ca10SBarry Smith         }
28519a88ca10SBarry Smith       }
28529a88ca10SBarry Smith       PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i)));
28539a88ca10SBarry Smith     } else {
2854dd097bc3SLois Curfman McInnes       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2855e4d965acSSatish Balay       for (j = 0; j < n; ++j) {
28562205254eSKarl Rupp         if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
28574dcbc457SBarry Smith       }
28589566063dSJacob Faibussowitsch       PetscCall(ISRestoreIndices(is[i], &idx));
28599566063dSJacob Faibussowitsch       PetscCall(ISDestroy(&is[i]));
2860e4d965acSSatish Balay 
286104a348a9SBarry Smith       k = 0;
286204a348a9SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
286304a348a9SBarry Smith         n = isz;
286406763907SSatish Balay         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2865e4d965acSSatish Balay           row   = nidx[k];
2866e4d965acSSatish Balay           start = ai[row];
2867e4d965acSSatish Balay           end   = ai[row + 1];
286804a348a9SBarry Smith           for (l = start; l < end; l++) {
2869efb16452SHong Zhang             val = aj[l];
28702205254eSKarl Rupp             if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2871e4d965acSSatish Balay           }
2872e4d965acSSatish Balay         }
2873e4d965acSSatish Balay       }
28749566063dSJacob Faibussowitsch       PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i)));
2875e4d965acSSatish Balay     }
28769a88ca10SBarry Smith   }
28779566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
28789566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
28793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28804dcbc457SBarry Smith }
288117ab2063SBarry Smith 
2882ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2883d71ae5a4SJacob Faibussowitsch {
28840513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28853b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
28865d0c19d7SBarry Smith   const PetscInt *row, *col;
28875d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
288856cd22aeSBarry Smith   IS              icolp, irowp;
28890298fd71SBarry Smith   PetscInt       *cwork = NULL;
28900298fd71SBarry Smith   PetscScalar    *vwork = NULL;
28910513a670SBarry Smith 
28923a40ed3dSBarry Smith   PetscFunctionBegin;
28939566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
28949566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
28959566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
28969566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
28970513a670SBarry Smith 
28980513a670SBarry Smith   /* determine lengths of permuted rows */
28999566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
29002205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
29019566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
29029566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
29039566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
29049566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
29059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
29069566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
29070513a670SBarry Smith 
29089566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
29090513a670SBarry Smith   for (i = 0; i < m; i++) {
29109566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29112205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
29129566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
29139566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29140513a670SBarry Smith   }
29159566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
29162205254eSKarl Rupp 
29173c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
29182205254eSKarl Rupp 
29198c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
29209566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
29219fe5e383SStefano Zampini #endif
29229566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
29239566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
29249566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
29259566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
29269566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
29279566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
292848a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
29293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29300513a670SBarry Smith }
29310513a670SBarry Smith 
2932d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2933d71ae5a4SJacob Faibussowitsch {
2934cb5b572fSBarry Smith   PetscFunctionBegin;
293533f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
293633f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2937be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2938be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
29392e5835c6SStefano Zampini     const PetscScalar *aa;
2940be6bf707SBarry Smith 
29419566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
294208401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
29439566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n]));
29449566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
29459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
2946cb5b572fSBarry Smith   } else {
29479566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2948cb5b572fSBarry Smith   }
29493ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2950cb5b572fSBarry Smith }
2951cb5b572fSBarry Smith 
2952d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2953d71ae5a4SJacob Faibussowitsch {
29546c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
29556e111a19SKarl Rupp 
29566c0721eeSBarry Smith   PetscFunctionBegin;
29576c0721eeSBarry Smith   *array = a->a;
29583ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29596c0721eeSBarry Smith }
29606c0721eeSBarry Smith 
2961d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2962d71ae5a4SJacob Faibussowitsch {
29636c0721eeSBarry Smith   PetscFunctionBegin;
2964f38c1e66SStefano Zampini   *array = NULL;
29653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29666c0721eeSBarry Smith }
2967273d9f13SBarry Smith 
29688229c054SShri Abhyankar /*
29698229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29708229c054SShri Abhyankar    have different nonzero structure.
29718229c054SShri Abhyankar */
2972d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2973d71ae5a4SJacob Faibussowitsch {
2974b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2975ec7775f6SShri Abhyankar 
2976ec7775f6SShri Abhyankar   PetscFunctionBegin;
2977ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2978ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
29798e3a54c0SPierre Jolivet     const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]);
2980b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
2981b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
29828af7cee1SJed Brown     nnz[i] = 0;
29838af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
2984b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
2985b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
29868af7cee1SJed Brown       nnz[i]++;
29878af7cee1SJed Brown     }
29888af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
2989ec7775f6SShri Abhyankar   }
29903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2991ec7775f6SShri Abhyankar }
2992ec7775f6SShri Abhyankar 
2993d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
2994d71ae5a4SJacob Faibussowitsch {
2995b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
2996b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
2997b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
2998b264fe52SHong Zhang 
2999b264fe52SHong Zhang   PetscFunctionBegin;
3000b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
30019566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
30023ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3003b264fe52SHong Zhang }
3004b264fe52SHong Zhang 
3005d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
3006d71ae5a4SJacob Faibussowitsch {
3007ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
3008ac90fabeSBarry Smith 
3009ac90fabeSBarry Smith   PetscFunctionBegin;
3010134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
3011134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
3012134adf20SPierre Jolivet     if (e) {
30139566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
301481fa06acSBarry Smith       if (e) {
30159566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
3016134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
301781fa06acSBarry Smith       }
301881fa06acSBarry Smith     }
301954c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
302081fa06acSBarry Smith   }
3021ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
30222e5835c6SStefano Zampini     const PetscScalar *xa;
30232e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
302481fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
302581fa06acSBarry Smith 
30269566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
30279566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
30289566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
3029792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
30309566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
30319566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
30329566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
30339566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
30349566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
3035ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
30369566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
3037ac90fabeSBarry Smith   } else {
30388229c054SShri Abhyankar     Mat       B;
30398229c054SShri Abhyankar     PetscInt *nnz;
30409566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
30419566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
30429566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
30439566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
30449566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
30459566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
30469566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
30479566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
30489566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
30499bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
30509566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
3051ac90fabeSBarry Smith   }
30523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3053ac90fabeSBarry Smith }
3054ac90fabeSBarry Smith 
3055d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
3056d71ae5a4SJacob Faibussowitsch {
3057354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3058354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
3059354c94deSBarry Smith   PetscInt     i, nz;
3060354c94deSBarry Smith   PetscScalar *a;
3061354c94deSBarry Smith 
3062354c94deSBarry Smith   PetscFunctionBegin;
3063354c94deSBarry Smith   nz = aij->nz;
30649566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
30652205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
30669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
3067354c94deSBarry Smith #else
3068354c94deSBarry Smith   PetscFunctionBegin;
3069354c94deSBarry Smith #endif
30703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3071354c94deSBarry Smith }
3072354c94deSBarry Smith 
3073ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3074d71ae5a4SJacob Faibussowitsch {
3075e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3076d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3077e34fafa9SBarry Smith   PetscReal        atmp;
3078985db425SBarry Smith   PetscScalar     *x;
3079ce496241SStefano Zampini   const MatScalar *aa, *av;
3080e34fafa9SBarry Smith 
3081e34fafa9SBarry Smith   PetscFunctionBegin;
308228b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
30839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3084ce496241SStefano Zampini   aa = av;
3085e34fafa9SBarry Smith   ai = a->i;
3086e34fafa9SBarry Smith   aj = a->j;
3087e34fafa9SBarry Smith 
30889566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
30899566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
30909566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
309108401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3092e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
30939371c9d4SSatish Balay     ncols = ai[1] - ai[0];
30949371c9d4SSatish Balay     ai++;
3095e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3096985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
30979371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
30989371c9d4SSatish Balay         x[i] = atmp;
30999371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31009371c9d4SSatish Balay       }
31019371c9d4SSatish Balay       aa++;
31029371c9d4SSatish Balay       aj++;
3103985db425SBarry Smith     }
3104985db425SBarry Smith   }
31059566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31073ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3108985db425SBarry Smith }
3109985db425SBarry Smith 
3110eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v)
3111eede4a3fSMark Adams {
3112eede4a3fSMark Adams   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3113eede4a3fSMark Adams   PetscInt         i, j, m = A->rmap->n, *ai, ncols, n;
3114eede4a3fSMark Adams   PetscScalar     *x;
3115eede4a3fSMark Adams   const MatScalar *aa, *av;
3116eede4a3fSMark Adams 
3117eede4a3fSMark Adams   PetscFunctionBegin;
3118eede4a3fSMark Adams   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3119eede4a3fSMark Adams   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3120eede4a3fSMark Adams   aa = av;
3121eede4a3fSMark Adams   ai = a->i;
3122eede4a3fSMark Adams 
3123eede4a3fSMark Adams   PetscCall(VecSet(v, 0.0));
3124eede4a3fSMark Adams   PetscCall(VecGetArrayWrite(v, &x));
3125eede4a3fSMark Adams   PetscCall(VecGetLocalSize(v, &n));
3126eede4a3fSMark Adams   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3127eede4a3fSMark Adams   for (i = 0; i < m; i++) {
3128eede4a3fSMark Adams     ncols = ai[1] - ai[0];
3129eede4a3fSMark Adams     ai++;
3130eede4a3fSMark Adams     for (j = 0; j < ncols; j++) {
3131eede4a3fSMark Adams       x[i] += PetscAbsScalar(*aa);
3132eede4a3fSMark Adams       aa++;
3133eede4a3fSMark Adams     }
3134eede4a3fSMark Adams   }
3135eede4a3fSMark Adams   PetscCall(VecRestoreArrayWrite(v, &x));
3136eede4a3fSMark Adams   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3137eede4a3fSMark Adams   PetscFunctionReturn(PETSC_SUCCESS);
3138eede4a3fSMark Adams }
3139eede4a3fSMark Adams 
3140ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3141d71ae5a4SJacob Faibussowitsch {
3142985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3143d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3144985db425SBarry Smith   PetscScalar     *x;
3145ce496241SStefano Zampini   const MatScalar *aa, *av;
3146985db425SBarry Smith 
3147985db425SBarry Smith   PetscFunctionBegin;
314828b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3150ce496241SStefano Zampini   aa = av;
3151985db425SBarry Smith   ai = a->i;
3152985db425SBarry Smith   aj = a->j;
3153985db425SBarry Smith 
31549566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31559566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31569566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
315708401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3158985db425SBarry Smith   for (i = 0; i < m; i++) {
31599371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31609371c9d4SSatish Balay     ai++;
3161d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31629371c9d4SSatish Balay       x[i] = *aa;
31639371c9d4SSatish Balay       if (idx) idx[i] = 0;
3164985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3165985db425SBarry Smith       x[i] = 0.0;
3166985db425SBarry Smith       if (idx) {
3167985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3168985db425SBarry Smith           if (aj[j] > j) {
3169985db425SBarry Smith             idx[i] = j;
3170985db425SBarry Smith             break;
3171985db425SBarry Smith           }
3172985db425SBarry Smith         }
31731a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31741a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3175985db425SBarry Smith       }
3176985db425SBarry Smith     }
3177985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31789371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31799371c9d4SSatish Balay         x[i] = *aa;
31809371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31819371c9d4SSatish Balay       }
31829371c9d4SSatish Balay       aa++;
31839371c9d4SSatish Balay       aj++;
3184985db425SBarry Smith     }
3185985db425SBarry Smith   }
31869566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31879566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3189985db425SBarry Smith }
3190985db425SBarry Smith 
3191ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3192d71ae5a4SJacob Faibussowitsch {
3193c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3194c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3195ce496241SStefano Zampini   PetscScalar     *x;
3196ce496241SStefano Zampini   const MatScalar *aa, *av;
3197c87e5d42SMatthew Knepley 
3198c87e5d42SMatthew Knepley   PetscFunctionBegin;
31999566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3200ce496241SStefano Zampini   aa = av;
3201c87e5d42SMatthew Knepley   ai = a->i;
3202c87e5d42SMatthew Knepley   aj = a->j;
3203c87e5d42SMatthew Knepley 
32049566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
32059566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32069566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
320708401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3208c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
32099371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32109371c9d4SSatish Balay     ai++;
3211f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
32129371c9d4SSatish Balay       x[i] = *aa;
32139371c9d4SSatish Balay       if (idx) idx[i] = 0;
3214f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3215f07e67edSHong Zhang       x[i] = 0.0;
3216f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3217289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3218f07e67edSHong Zhang           if (aj[j] > j) {
3219f07e67edSHong Zhang             idx[i] = j;
32202205254eSKarl Rupp             break;
32212205254eSKarl Rupp           }
3222289a08f5SMatthew Knepley         }
3223f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3224f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3225f07e67edSHong Zhang       }
3226289a08f5SMatthew Knepley     }
3227c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
32289371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
32299371c9d4SSatish Balay         x[i] = *aa;
32309371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32319371c9d4SSatish Balay       }
32329371c9d4SSatish Balay       aa++;
32339371c9d4SSatish Balay       aj++;
3234c87e5d42SMatthew Knepley     }
3235c87e5d42SMatthew Knepley   }
32369566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3239c87e5d42SMatthew Knepley }
3240c87e5d42SMatthew Knepley 
3241ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3242d71ae5a4SJacob Faibussowitsch {
3243985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3244d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3245d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3246985db425SBarry Smith   PetscScalar     *x;
3247ce496241SStefano Zampini   const MatScalar *aa, *av;
3248985db425SBarry Smith 
3249985db425SBarry Smith   PetscFunctionBegin;
325028b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
32519566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3252ce496241SStefano Zampini   aa = av;
3253985db425SBarry Smith   ai = a->i;
3254985db425SBarry Smith   aj = a->j;
3255985db425SBarry Smith 
32569566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
32579566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32589566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
325908401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3260985db425SBarry Smith   for (i = 0; i < m; i++) {
32619371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32629371c9d4SSatish Balay     ai++;
3263d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
32649371c9d4SSatish Balay       x[i] = *aa;
32659371c9d4SSatish Balay       if (idx) idx[i] = 0;
3266985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3267985db425SBarry Smith       x[i] = 0.0;
3268985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3269985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3270985db425SBarry Smith           if (aj[j] > j) {
3271985db425SBarry Smith             idx[i] = j;
3272985db425SBarry Smith             break;
3273985db425SBarry Smith           }
3274985db425SBarry Smith         }
3275fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3276fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3277985db425SBarry Smith       }
3278985db425SBarry Smith     }
3279985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32809371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32819371c9d4SSatish Balay         x[i] = *aa;
32829371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32839371c9d4SSatish Balay       }
32849371c9d4SSatish Balay       aa++;
32859371c9d4SSatish Balay       aj++;
3286e34fafa9SBarry Smith     }
3287e34fafa9SBarry Smith   }
32889566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3291e34fafa9SBarry Smith }
3292bbead8a2SBarry Smith 
3293ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3294d71ae5a4SJacob Faibussowitsch {
3295bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
329633d57670SJed Brown   PetscInt        i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3297bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
32980da83c2eSBarry Smith   const PetscReal shift = 0.0;
32991a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3300bbead8a2SBarry Smith 
3301bbead8a2SBarry Smith   PetscFunctionBegin;
3302a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
33034a0d0026SBarry Smith   if (a->ibdiagvalid) {
33044a0d0026SBarry Smith     if (values) *values = a->ibdiag;
33053ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
33064a0d0026SBarry Smith   }
33079566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
33084dfa11a4SJacob Faibussowitsch   if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); }
3309bbead8a2SBarry Smith   diag = a->ibdiag;
3310bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3311bbead8a2SBarry Smith   /* factor and invert each block */
3312bbead8a2SBarry Smith   switch (bs) {
3313bbead8a2SBarry Smith   case 1:
3314bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33159566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3316ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3317ec1892c8SHong Zhang         if (allowzeropivot) {
33187b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33197b6c816cSBarry Smith           A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
33207b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
33219566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
332298921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
3323ec1892c8SHong Zhang       }
3324bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3325bbead8a2SBarry Smith     }
3326bbead8a2SBarry Smith     break;
3327bbead8a2SBarry Smith   case 2:
3328bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33299371c9d4SSatish Balay       ij[0] = 2 * i;
33309371c9d4SSatish Balay       ij[1] = 2 * i + 1;
33319566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
33329566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
33337b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33349566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3335bbead8a2SBarry Smith       diag += 4;
3336bbead8a2SBarry Smith     }
3337bbead8a2SBarry Smith     break;
3338bbead8a2SBarry Smith   case 3:
3339bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33409371c9d4SSatish Balay       ij[0] = 3 * i;
33419371c9d4SSatish Balay       ij[1] = 3 * i + 1;
33429371c9d4SSatish Balay       ij[2] = 3 * i + 2;
33439566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
33449566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
33457b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33469566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3347bbead8a2SBarry Smith       diag += 9;
3348bbead8a2SBarry Smith     }
3349bbead8a2SBarry Smith     break;
3350bbead8a2SBarry Smith   case 4:
3351bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33529371c9d4SSatish Balay       ij[0] = 4 * i;
33539371c9d4SSatish Balay       ij[1] = 4 * i + 1;
33549371c9d4SSatish Balay       ij[2] = 4 * i + 2;
33559371c9d4SSatish Balay       ij[3] = 4 * i + 3;
33569566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
33579566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
33587b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33599566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3360bbead8a2SBarry Smith       diag += 16;
3361bbead8a2SBarry Smith     }
3362bbead8a2SBarry Smith     break;
3363bbead8a2SBarry Smith   case 5:
3364bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33659371c9d4SSatish Balay       ij[0] = 5 * i;
33669371c9d4SSatish Balay       ij[1] = 5 * i + 1;
33679371c9d4SSatish Balay       ij[2] = 5 * i + 2;
33689371c9d4SSatish Balay       ij[3] = 5 * i + 3;
33699371c9d4SSatish Balay       ij[4] = 5 * i + 4;
33709566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
33719566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
33727b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33739566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3374bbead8a2SBarry Smith       diag += 25;
3375bbead8a2SBarry Smith     }
3376bbead8a2SBarry Smith     break;
3377bbead8a2SBarry Smith   case 6:
3378bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33799371c9d4SSatish Balay       ij[0] = 6 * i;
33809371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33819371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33829371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33839371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33849371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33859566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33869566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33877b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33889566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3389bbead8a2SBarry Smith       diag += 36;
3390bbead8a2SBarry Smith     }
3391bbead8a2SBarry Smith     break;
3392bbead8a2SBarry Smith   case 7:
3393bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33949371c9d4SSatish Balay       ij[0] = 7 * i;
33959371c9d4SSatish Balay       ij[1] = 7 * i + 1;
33969371c9d4SSatish Balay       ij[2] = 7 * i + 2;
33979371c9d4SSatish Balay       ij[3] = 7 * i + 3;
33989371c9d4SSatish Balay       ij[4] = 7 * i + 4;
33999371c9d4SSatish Balay       ij[5] = 7 * i + 5;
3400cdd8bf47SJunchao Zhang       ij[6] = 7 * i + 6;
34019566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
34029566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
34037b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34049566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3405bbead8a2SBarry Smith       diag += 49;
3406bbead8a2SBarry Smith     }
3407bbead8a2SBarry Smith     break;
3408bbead8a2SBarry Smith   default:
34099566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3410bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3411ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
34129566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
34139566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
34147b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34159566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3416bbead8a2SBarry Smith       diag += bs2;
3417bbead8a2SBarry Smith     }
34189566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3419bbead8a2SBarry Smith   }
3420bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
34213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3422bbead8a2SBarry Smith }
3423bbead8a2SBarry Smith 
3424d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3425d71ae5a4SJacob Faibussowitsch {
342673a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3427fff043a9SJunchao Zhang   PetscScalar a, *aa;
342873a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
342973a71a0fSBarry Smith 
343073a71a0fSBarry Smith   PetscFunctionBegin;
343173a71a0fSBarry Smith   if (!x->assembled) {
34329566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
343373a71a0fSBarry Smith     for (i = 0; i < m; i++) {
343473a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
34359566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
343673a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
34379566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
343873a71a0fSBarry Smith       }
343973a71a0fSBarry Smith     }
3440e2ce353bSJunchao Zhang   } else {
34419566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
34429566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
34439566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3444e2ce353bSJunchao Zhang   }
34459566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34469566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34473ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
344873a71a0fSBarry Smith }
344973a71a0fSBarry Smith 
3450679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3451d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3452d71ae5a4SJacob Faibussowitsch {
3453679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3454679944adSJunchao Zhang   PetscScalar a;
3455679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3456679944adSJunchao Zhang 
3457679944adSJunchao Zhang   PetscFunctionBegin;
3458679944adSJunchao Zhang   nskip = high - low;
34599566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3460679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3461679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3462679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
34639566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3464679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3465679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
34669566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3467679944adSJunchao Zhang     }
3468e2ce353bSJunchao Zhang   }
34699566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34709566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3472679944adSJunchao Zhang }
3473679944adSJunchao Zhang 
34740a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3475cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3476cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3477cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
347897304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34797c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34807c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3481f4259b30SLisandro Dalcin                                        NULL,
3482f4259b30SLisandro Dalcin                                        NULL,
3483f4259b30SLisandro Dalcin                                        NULL,
3484f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3485cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3486f4259b30SLisandro Dalcin                                        NULL,
348741f059aeSBarry Smith                                        MatSOR_SeqAIJ,
348891e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
348997304618SKris Buschelman                                        /*1 5*/ MatGetInfo_SeqAIJ,
3490cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3491cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3492cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3493cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3494f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3495cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3496cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3497cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3498d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3499f4259b30SLisandro Dalcin                                        NULL,
3500f4259b30SLisandro Dalcin                                        NULL,
3501f4259b30SLisandro Dalcin                                        NULL,
3502f4259b30SLisandro Dalcin                                        NULL,
350326cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
3504f4259b30SLisandro Dalcin                                        NULL,
3505f4259b30SLisandro Dalcin                                        NULL,
3506f4259b30SLisandro Dalcin                                        NULL,
3507f4259b30SLisandro Dalcin                                        NULL,
3508d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3509f4259b30SLisandro Dalcin                                        NULL,
3510f4259b30SLisandro Dalcin                                        NULL,
3511cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3512f4259b30SLisandro Dalcin                                        NULL,
3513d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
35147dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3515cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3516cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3517cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3518d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3519cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
35207d68702bSBarry Smith                                        MatShift_SeqAIJ,
352179299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
35226e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
352373a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
35243b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
35253b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
35263b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3527a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
352893dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3529f4259b30SLisandro Dalcin                                        NULL,
3530f4259b30SLisandro Dalcin                                        NULL,
3531cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3532f4259b30SLisandro Dalcin                                        NULL,
3533f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3534b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3535b9b97703SBarry Smith                                        MatView_SeqAIJ,
3536f4259b30SLisandro Dalcin                                        NULL,
3537f4259b30SLisandro Dalcin                                        NULL,
3538f4259b30SLisandro Dalcin                                        /* 64*/ NULL,
3539321b30b9SSatish Balay                                        MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3540f4259b30SLisandro Dalcin                                        NULL,
3541f4259b30SLisandro Dalcin                                        NULL,
3542f4259b30SLisandro Dalcin                                        NULL,
3543d519adbfSMatthew Knepley                                        /* 69*/ MatGetRowMaxAbs_SeqAIJ,
3544c87e5d42SMatthew Knepley                                        MatGetRowMinAbs_SeqAIJ,
3545f4259b30SLisandro Dalcin                                        NULL,
3546f4259b30SLisandro Dalcin                                        NULL,
3547f4259b30SLisandro Dalcin                                        NULL,
3548f4259b30SLisandro Dalcin                                        /* 74*/ NULL,
35493acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3550f4259b30SLisandro Dalcin                                        NULL,
3551f4259b30SLisandro Dalcin                                        NULL,
3552f4259b30SLisandro Dalcin                                        NULL,
35536ce1633cSBarry Smith                                        /* 79*/ MatFindZeroDiagonals_SeqAIJ,
3554f4259b30SLisandro Dalcin                                        NULL,
3555f4259b30SLisandro Dalcin                                        NULL,
3556f4259b30SLisandro Dalcin                                        NULL,
3557bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
35586cff0a6bSPierre Jolivet                                        /* 84*/ NULL,
35596cff0a6bSPierre Jolivet                                        NULL,
3560f4259b30SLisandro Dalcin                                        NULL,
3561f4259b30SLisandro Dalcin                                        NULL,
3562f4259b30SLisandro Dalcin                                        NULL,
3563f4259b30SLisandro Dalcin                                        /* 89*/ NULL,
3564f4259b30SLisandro Dalcin                                        NULL,
356526be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
3566f4259b30SLisandro Dalcin                                        NULL,
3567f4259b30SLisandro Dalcin                                        NULL,
35688fa4b5a6SHong Zhang                                        /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3569f4259b30SLisandro Dalcin                                        NULL,
3570f4259b30SLisandro Dalcin                                        NULL,
35716fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
3572f4259b30SLisandro Dalcin                                        NULL,
35734222ddf1SHong Zhang                                        /* 99*/ MatProductSetFromOptions_SeqAIJ,
3574f4259b30SLisandro Dalcin                                        NULL,
3575f4259b30SLisandro Dalcin                                        NULL,
357687d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
3577f4259b30SLisandro Dalcin                                        NULL,
3578d519adbfSMatthew Knepley                                        /*104*/ MatSetValuesRow_SeqAIJ,
357999cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3580f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3581f4259b30SLisandro Dalcin                                        NULL,
3582f4259b30SLisandro Dalcin                                        NULL,
3583cbd44569SHong Zhang                                        /*109*/ MatMatSolve_SeqAIJ,
3584f4259b30SLisandro Dalcin                                        NULL,
35852af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3586f4259b30SLisandro Dalcin                                        NULL,
3587599ef60dSHong Zhang                                        MatMissingDiagonal_SeqAIJ,
3588f4259b30SLisandro Dalcin                                        /*114*/ NULL,
3589f4259b30SLisandro Dalcin                                        NULL,
3590f4259b30SLisandro Dalcin                                        NULL,
3591f4259b30SLisandro Dalcin                                        NULL,
3592f4259b30SLisandro Dalcin                                        NULL,
3593f4259b30SLisandro Dalcin                                        /*119*/ NULL,
3594f4259b30SLisandro Dalcin                                        NULL,
3595f4259b30SLisandro Dalcin                                        NULL,
3596f4259b30SLisandro Dalcin                                        NULL,
3597b3a44c85SBarry Smith                                        MatGetMultiProcBlock_SeqAIJ,
35980716a85fSBarry Smith                                        /*124*/ MatFindNonzeroRows_SeqAIJ,
3599a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
360037868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
36010da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
3602f4259b30SLisandro Dalcin                                        NULL,
3603f4259b30SLisandro Dalcin                                        /*129*/ NULL,
3604f4259b30SLisandro Dalcin                                        NULL,
3605f4259b30SLisandro Dalcin                                        NULL,
360675648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3607b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
3608b9af6bddSHong Zhang                                        /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
36092b8ad9a3SHong Zhang                                        MatTransColoringApplyDenToSp_SeqAIJ,
3610f4259b30SLisandro Dalcin                                        NULL,
3611f4259b30SLisandro Dalcin                                        NULL,
36123964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
3613f4259b30SLisandro Dalcin                                        /*139*/ NULL,
3614f4259b30SLisandro Dalcin                                        NULL,
3615f4259b30SLisandro Dalcin                                        NULL,
36163a062f41SBarry Smith                                        MatFDColoringSetUp_SeqXAIJ,
36179c8f2541SHong Zhang                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
36184222ddf1SHong Zhang                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
36194222ddf1SHong Zhang                                        /*145*/ MatDestroySubMatrices_SeqAIJ,
3620f4259b30SLisandro Dalcin                                        NULL,
362172833a62Smarkadams4                                        NULL,
362272833a62Smarkadams4                                        MatCreateGraph_Simple_AIJ,
36232d776b49SBarry Smith                                        NULL,
3624dec0b466SHong Zhang                                        /*150*/ MatTransposeSymbolic_SeqAIJ,
3625eede4a3fSMark Adams                                        MatEliminateZeros_SeqAIJ,
36264cc2b5b5SPierre Jolivet                                        MatGetRowSumAbs_SeqAIJ,
36274cc2b5b5SPierre Jolivet                                        NULL};
362817ab2063SBarry Smith 
3629ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3630d71ae5a4SJacob Faibussowitsch {
3631bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
363297f1f81fSBarry Smith   PetscInt    i, nz, n;
3633bef8e0ddSBarry Smith 
3634bef8e0ddSBarry Smith   PetscFunctionBegin;
3635bef8e0ddSBarry Smith   nz = aij->maxnz;
3636d0f46423SBarry Smith   n  = mat->rmap->n;
3637ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3638bef8e0ddSBarry Smith   aij->nz = nz;
3639ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
36403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3641bef8e0ddSBarry Smith }
3642bef8e0ddSBarry Smith 
3643a3bb6f32SFande Kong /*
3644ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3645ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3646ddea5d60SJunchao Zhang  */
3647d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3648d71ae5a4SJacob Faibussowitsch {
3649a3bb6f32SFande Kong   Mat_SeqAIJ   *aij = (Mat_SeqAIJ *)mat->data;
3650eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1;
3651eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
365225b670f0SStefano Zampini   PetscInt      gid, lid, i, ec, nz = aij->nz;
365325b670f0SStefano Zampini   PetscInt     *garray, *jj = aij->j;
3654a3bb6f32SFande Kong 
3655a3bb6f32SFande Kong   PetscFunctionBegin;
3656a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
36574f572ea9SToby Isaac   PetscAssertPointer(mapping, 2);
3658a3bb6f32SFande Kong   /* use a table */
3659eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1));
3660a3bb6f32SFande Kong   ec = 0;
366125b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
366225b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
3663eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
3664a3bb6f32SFande Kong     if (!data) {
3665a3bb6f32SFande Kong       /* one based table */
3666c76ffc5fSJacob Faibussowitsch       PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec));
3667a3bb6f32SFande Kong     }
3668a3bb6f32SFande Kong   }
3669a3bb6f32SFande Kong   /* form array of columns we need */
36709566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
3671eec179cfSJacob Faibussowitsch   PetscHashIterBegin(gid1_lid1, tpos);
3672eec179cfSJacob Faibussowitsch   while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
3673eec179cfSJacob Faibussowitsch     PetscHashIterGetKey(gid1_lid1, tpos, gid);
3674eec179cfSJacob Faibussowitsch     PetscHashIterGetVal(gid1_lid1, tpos, lid);
3675eec179cfSJacob Faibussowitsch     PetscHashIterNext(gid1_lid1, tpos);
3676a3bb6f32SFande Kong     gid--;
3677a3bb6f32SFande Kong     lid--;
3678a3bb6f32SFande Kong     garray[lid] = gid;
3679a3bb6f32SFande Kong   }
36809566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
3681eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIClear(gid1_lid1));
3682c76ffc5fSJacob Faibussowitsch   for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1));
3683a3bb6f32SFande Kong   /* compact out the extra columns in B */
368425b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
368525b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
3686eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
3687a3bb6f32SFande Kong     lid--;
368825b670f0SStefano Zampini     jj[i] = lid;
3689a3bb6f32SFande Kong   }
36909566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
3691eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&gid1_lid1));
36929566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
36939566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
36949566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
36953ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3696a3bb6f32SFande Kong }
3697a3bb6f32SFande Kong 
3698bef8e0ddSBarry Smith /*@
3699bef8e0ddSBarry Smith   MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3700bef8e0ddSBarry Smith   in the matrix.
3701bef8e0ddSBarry Smith 
3702bef8e0ddSBarry Smith   Input Parameters:
370311a5261eSBarry Smith + mat     - the `MATSEQAIJ` matrix
3704bef8e0ddSBarry Smith - indices - the column indices
3705bef8e0ddSBarry Smith 
370615091d37SBarry Smith   Level: advanced
370715091d37SBarry Smith 
3708bef8e0ddSBarry Smith   Notes:
3709bef8e0ddSBarry Smith   This can be called if you have precomputed the nonzero structure of the
3710bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
371111a5261eSBarry Smith   of the `MatSetValues()` operation.
3712bef8e0ddSBarry Smith 
3713bef8e0ddSBarry Smith   You MUST have set the correct numbers of nonzeros per row in the call to
371411a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the columns indices MUST be sorted.
3715bef8e0ddSBarry Smith 
371611a5261eSBarry Smith   MUST be called before any calls to `MatSetValues()`
3717bef8e0ddSBarry Smith 
3718b9617806SBarry Smith   The indices should start with zero, not one.
3719b9617806SBarry Smith 
37201cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
3721bef8e0ddSBarry Smith @*/
3722d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3723d71ae5a4SJacob Faibussowitsch {
3724bef8e0ddSBarry Smith   PetscFunctionBegin;
37250700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
37264f572ea9SToby Isaac   PetscAssertPointer(indices, 2);
3727cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
37283ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3729bef8e0ddSBarry Smith }
3730bef8e0ddSBarry Smith 
3731ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3732d71ae5a4SJacob Faibussowitsch {
3733be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3734d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3735be6bf707SBarry Smith 
3736be6bf707SBarry Smith   PetscFunctionBegin;
373728b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3738be6bf707SBarry Smith 
3739be6bf707SBarry Smith   /* allocate space for values if not already there */
37404dfa11a4SJacob Faibussowitsch   if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }
3741be6bf707SBarry Smith 
3742be6bf707SBarry Smith   /* copy values over */
37439566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
37443ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3745be6bf707SBarry Smith }
3746be6bf707SBarry Smith 
3747be6bf707SBarry Smith /*@
374820f4b53cSBarry Smith   MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
3749be6bf707SBarry Smith   nonlinear portion.
3750be6bf707SBarry Smith 
3751c3339decSBarry Smith   Logically Collect
3752be6bf707SBarry Smith 
375327430b45SBarry Smith   Input Parameter:
375411a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3755be6bf707SBarry Smith 
375615091d37SBarry Smith   Level: advanced
375715091d37SBarry Smith 
37582920cce0SJacob Faibussowitsch   Example Usage:
375927430b45SBarry Smith .vb
37602ef1f0ffSBarry Smith     Using SNES
376127430b45SBarry Smith     Create Jacobian matrix
376227430b45SBarry Smith     Set linear terms into matrix
376327430b45SBarry Smith     Apply boundary conditions to matrix, at this time matrix must have
376427430b45SBarry Smith       final nonzero structure (i.e. setting the nonlinear terms and applying
376527430b45SBarry Smith       boundary conditions again will not change the nonzero structure
376627430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
376727430b45SBarry Smith     MatStoreValues(mat);
376827430b45SBarry Smith     Call SNESSetJacobian() with matrix
376927430b45SBarry Smith     In your Jacobian routine
377027430b45SBarry Smith       MatRetrieveValues(mat);
377127430b45SBarry Smith       Set nonlinear terms in matrix
3772be6bf707SBarry Smith 
377327430b45SBarry Smith     Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
377427430b45SBarry Smith     // build linear portion of Jacobian
377527430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
377627430b45SBarry Smith     MatStoreValues(mat);
377727430b45SBarry Smith     loop over nonlinear iterations
377827430b45SBarry Smith        MatRetrieveValues(mat);
377927430b45SBarry Smith        // call MatSetValues(mat,...) to set nonliner portion of Jacobian
378027430b45SBarry Smith        // call MatAssemblyBegin/End() on matrix
378127430b45SBarry Smith        Solve linear system with Jacobian
378227430b45SBarry Smith     endloop
378327430b45SBarry Smith .ve
3784be6bf707SBarry Smith 
3785be6bf707SBarry Smith   Notes:
3786da81f932SPierre Jolivet   Matrix must already be assembled before calling this routine
378711a5261eSBarry Smith   Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3788be6bf707SBarry Smith   calling this routine.
3789be6bf707SBarry Smith 
37900c468ba9SBarry Smith   When this is called multiple times it overwrites the previous set of stored values
37910c468ba9SBarry Smith   and does not allocated additional space.
37920c468ba9SBarry Smith 
3793fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
3794be6bf707SBarry Smith @*/
3795d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3796d71ae5a4SJacob Faibussowitsch {
3797be6bf707SBarry Smith   PetscFunctionBegin;
37980700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
379928b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
380028b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3801cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
38023ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3803be6bf707SBarry Smith }
3804be6bf707SBarry Smith 
3805ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3806d71ae5a4SJacob Faibussowitsch {
3807be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3808d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3809be6bf707SBarry Smith 
3810be6bf707SBarry Smith   PetscFunctionBegin;
381128b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
381228b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3813be6bf707SBarry Smith   /* copy values over */
38149566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
38153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3816be6bf707SBarry Smith }
3817be6bf707SBarry Smith 
3818be6bf707SBarry Smith /*@
381920f4b53cSBarry Smith   MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`
3820be6bf707SBarry Smith 
3821c3339decSBarry Smith   Logically Collect
3822be6bf707SBarry Smith 
38232fe279fdSBarry Smith   Input Parameter:
382411a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3825be6bf707SBarry Smith 
382615091d37SBarry Smith   Level: advanced
382715091d37SBarry Smith 
38281cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
3829be6bf707SBarry Smith @*/
3830d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3831d71ae5a4SJacob Faibussowitsch {
3832be6bf707SBarry Smith   PetscFunctionBegin;
38330700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
383428b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
383528b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3836cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
38373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3838be6bf707SBarry Smith }
3839be6bf707SBarry Smith 
38405d83a8b1SBarry Smith /*@
384111a5261eSBarry Smith   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
38420d15e28bSLois Curfman McInnes   (the default parallel PETSc format).  For good matrix assembly performance
384320f4b53cSBarry Smith   the user should preallocate the matrix storage by setting the parameter `nz`
384420f4b53cSBarry Smith   (or the array `nnz`).
384517ab2063SBarry Smith 
3846d083f849SBarry Smith   Collective
3847db81eaa0SLois Curfman McInnes 
384817ab2063SBarry Smith   Input Parameters:
384911a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF`
385017ab2063SBarry Smith . m    - number of rows
385117ab2063SBarry Smith . n    - number of columns
385217ab2063SBarry Smith . nz   - number of nonzeros per row (same for all rows)
385351c19458SBarry Smith - nnz  - array containing the number of nonzeros in the various rows
38540298fd71SBarry Smith          (possibly different for each row) or NULL
385517ab2063SBarry Smith 
385617ab2063SBarry Smith   Output Parameter:
3857416022c9SBarry Smith . A - the matrix
385817ab2063SBarry Smith 
38592ef1f0ffSBarry Smith   Options Database Keys:
38602ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
38612ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38622ef1f0ffSBarry Smith 
38632ef1f0ffSBarry Smith   Level: intermediate
3864175b88e8SBarry Smith 
3865b259b22eSLois Curfman McInnes   Notes:
386677433607SBarry Smith   It is recommend to use `MatCreateFromOptions()` instead of this routine
386777433607SBarry Smith 
38682ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
386949a6f317SBarry Smith 
38702ef1f0ffSBarry Smith   The `MATSEQAIJ` format, also called
38712ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
38720002213bSLois Curfman McInnes   storage.  That is, the stored row and column indices can begin at
38732ef1f0ffSBarry Smith   either one (as in Fortran) or zero.
387417ab2063SBarry Smith 
387520f4b53cSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
38762ef1f0ffSBarry Smith   Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
387720f4b53cSBarry Smith   allocation.
387817ab2063SBarry Smith 
3879682d7d0cSBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
38804fca80b9SLois Curfman McInnes   improve numerical efficiency of matrix-vector products and solves. We
3881682d7d0cSBarry Smith   search for consecutive rows with the same nonzero structure, thereby
38826c7ebb05SLois Curfman McInnes   reusing matrix information to achieve increased efficiency.
38836c7ebb05SLois Curfman McInnes 
38841cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
388517ab2063SBarry Smith @*/
3886d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3887d71ae5a4SJacob Faibussowitsch {
38883a40ed3dSBarry Smith   PetscFunctionBegin;
38899566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
38909566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
38919566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
38929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
38933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3894273d9f13SBarry Smith }
3895273d9f13SBarry Smith 
38965d83a8b1SBarry Smith /*@
3897273d9f13SBarry Smith   MatSeqAIJSetPreallocation - For good matrix assembly performance
3898273d9f13SBarry Smith   the user should preallocate the matrix storage by setting the parameter nz
3899273d9f13SBarry Smith   (or the array nnz).  By setting these parameters accurately, performance
3900273d9f13SBarry Smith   during matrix assembly can be increased by more than a factor of 50.
3901273d9f13SBarry Smith 
3902d083f849SBarry Smith   Collective
3903273d9f13SBarry Smith 
3904273d9f13SBarry Smith   Input Parameters:
39051c4f3114SJed Brown + B   - The matrix
3906273d9f13SBarry Smith . nz  - number of nonzeros per row (same for all rows)
3907273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows
39080298fd71SBarry Smith          (possibly different for each row) or NULL
3909273d9f13SBarry Smith 
39102ef1f0ffSBarry Smith   Options Database Keys:
39112ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
39122ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
39132ef1f0ffSBarry Smith 
39142ef1f0ffSBarry Smith   Level: intermediate
39152ef1f0ffSBarry Smith 
3916273d9f13SBarry Smith   Notes:
39172ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
391849a6f317SBarry Smith 
391911a5261eSBarry Smith   The `MATSEQAIJ` format also called
39202ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
3921273d9f13SBarry Smith   storage.  That is, the stored row and column indices can begin at
3922273d9f13SBarry Smith   either one (as in Fortran) or zero.  See the users' manual for details.
3923273d9f13SBarry Smith 
39242ef1f0ffSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
39252ef1f0ffSBarry Smith   Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
39262ef1f0ffSBarry Smith   allocation.
3927273d9f13SBarry Smith 
392811a5261eSBarry Smith   You can call `MatGetInfo()` to get information on how effective the preallocation was;
3929aa95bbe8SBarry Smith   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3930aa95bbe8SBarry Smith   You can also run with the option -info and look for messages with the string
3931aa95bbe8SBarry Smith   malloc in them to see if additional memory allocation was needed.
3932aa95bbe8SBarry Smith 
393311a5261eSBarry Smith   Developer Notes:
393411a5261eSBarry Smith   Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3935a96a251dSBarry Smith   entries or columns indices
3936a96a251dSBarry Smith 
3937273d9f13SBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
3938273d9f13SBarry Smith   improve numerical efficiency of matrix-vector products and solves. We
3939273d9f13SBarry Smith   search for consecutive rows with the same nonzero structure, thereby
3940273d9f13SBarry Smith   reusing matrix information to achieve increased efficiency.
3941273d9f13SBarry Smith 
39421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3943db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3944273d9f13SBarry Smith @*/
3945d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3946d71ae5a4SJacob Faibussowitsch {
3947a23d5eceSKris Buschelman   PetscFunctionBegin;
39486ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
39496ba663aaSJed Brown   PetscValidType(B, 1);
3950cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
39513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3952a23d5eceSKris Buschelman }
3953a23d5eceSKris Buschelman 
3954d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3955d71ae5a4SJacob Faibussowitsch {
3956ad79cf63SBarry Smith   Mat_SeqAIJ *b              = (Mat_SeqAIJ *)B->data;
39572576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
395897f1f81fSBarry Smith   PetscInt    i;
3959273d9f13SBarry Smith 
3960273d9f13SBarry Smith   PetscFunctionBegin;
3961ad79cf63SBarry Smith   if (B->hash_active) {
3962aea10558SJacob Faibussowitsch     B->ops[0] = b->cops;
3963ad79cf63SBarry Smith     PetscCall(PetscHMapIJVDestroy(&b->ht));
3964ad79cf63SBarry Smith     PetscCall(PetscFree(b->dnz));
3965ad79cf63SBarry Smith     B->hash_active = PETSC_FALSE;
3966ad79cf63SBarry Smith   }
39672576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3968a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3969c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3970c461c341SBarry Smith     nz             = 0;
3971c461c341SBarry Smith   }
39729566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
39739566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3974899cda47SBarry Smith 
3975435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
397608401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
3977*9f0612e4SBarry Smith   if (nnz) {
3978d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
397908401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
398008401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3981b73539f3SBarry Smith     }
3982b73539f3SBarry Smith   }
3983b73539f3SBarry Smith 
3984273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
3985ab93d7beSBarry Smith   if (!skipallocation) {
39864dfa11a4SJacob Faibussowitsch     if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); }
3987071fcb05SBarry Smith     if (!b->ilen) {
3988071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
39899566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
3990071fcb05SBarry Smith     } else {
39919566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
39922ee49352SLisandro Dalcin     }
3993aa624791SPierre Jolivet     if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre));
3994273d9f13SBarry Smith     if (!nnz) {
3995435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
3996c62bd62aSJed Brown       else if (nz < 0) nz = 1;
39975d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
3998d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
3999c43c4a61SBarry Smith       PetscCall(PetscIntMultError(nz, B->rmap->n, &nz));
4000273d9f13SBarry Smith     } else {
4001c73702f5SBarry Smith       PetscInt64 nz64 = 0;
40029371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
40039371c9d4SSatish Balay         b->imax[i] = nnz[i];
40049371c9d4SSatish Balay         nz64 += nnz[i];
40059371c9d4SSatish Balay       }
40069566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
4007273d9f13SBarry Smith     }
4008ab93d7beSBarry Smith 
4009273d9f13SBarry Smith     /* allocate the matrix space */
40109566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
4011*9f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j));
4012*9f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i));
4013*9f0612e4SBarry Smith     b->free_ij = PETSC_TRUE;
4014396832f4SHong Zhang     if (B->structure_only) {
4015*9f0612e4SBarry Smith       b->free_a = PETSC_FALSE;
4016396832f4SHong Zhang     } else {
4017*9f0612e4SBarry Smith       PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a));
4018*9f0612e4SBarry Smith       b->free_a = PETSC_TRUE;
4019396832f4SHong Zhang     }
4020bfeeae90SHong Zhang     b->i[0] = 0;
4021ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
4022c461c341SBarry Smith   } else {
4023e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
4024e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
4025c461c341SBarry Smith   }
4026273d9f13SBarry Smith 
4027846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
4028846b4da1SFande Kong     /* reserve user-requested sparsity */
40299566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
4030846b4da1SFande Kong   }
4031846b4da1SFande Kong 
4032273d9f13SBarry Smith   b->nz               = 0;
4033273d9f13SBarry Smith   b->maxnz            = nz;
4034273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
40351baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
4036cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
4037cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
40385519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
40395519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
40405519a089SJose E. Roman   */
40415519a089SJose E. Roman   B->nonzerostate++;
40423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4043273d9f13SBarry Smith }
4044273d9f13SBarry Smith 
4045ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
4046d71ae5a4SJacob Faibussowitsch {
4047846b4da1SFande Kong   Mat_SeqAIJ *a;
4048a5bbaf83SFande Kong   PetscInt    i;
40491f14be2bSBarry Smith   PetscBool   skipreset;
4050846b4da1SFande Kong 
4051846b4da1SFande Kong   PetscFunctionBegin;
4052846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
405314d0e64fSAlex Lindsay 
405414d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
40553ba16761SJacob Faibussowitsch   if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS);
405614d0e64fSAlex Lindsay 
4057846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
40582c814fdeSFande Kong   /* if no saved info, we error out */
405928b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
40602c814fdeSFande Kong 
40611f14be2bSBarry Smith   PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation ");
40622c814fdeSFande Kong 
40631f14be2bSBarry Smith   PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset));
40641f14be2bSBarry Smith   if (!skipreset) {
40659566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
40669566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
4067846b4da1SFande Kong     a->i[0] = 0;
4068ad540459SPierre Jolivet     for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
4069846b4da1SFande Kong     A->preallocated     = PETSC_TRUE;
4070846b4da1SFande Kong     a->nz               = 0;
4071846b4da1SFande Kong     a->maxnz            = a->i[A->rmap->n];
4072846b4da1SFande Kong     A->info.nz_unneeded = (double)a->maxnz;
4073846b4da1SFande Kong     A->was_assembled    = PETSC_FALSE;
4074846b4da1SFande Kong     A->assembled        = PETSC_FALSE;
40751f14be2bSBarry Smith   }
40763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4077846b4da1SFande Kong }
4078846b4da1SFande Kong 
407958d36128SBarry Smith /*@
408011a5261eSBarry Smith   MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4081a1661176SMatthew Knepley 
4082a1661176SMatthew Knepley   Input Parameters:
4083a1661176SMatthew Knepley + B - the matrix
4084d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero)
4085d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row
4086d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided
4087a1661176SMatthew Knepley 
4088a1661176SMatthew Knepley   Level: developer
4089a1661176SMatthew Knepley 
40906a9b8d82SBarry Smith   Notes:
40912ef1f0ffSBarry Smith   The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
409258d36128SBarry Smith 
40936a9b8d82SBarry Smith   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
40946a9b8d82SBarry Smith   structure will be the union of all the previous nonzero structures.
40956a9b8d82SBarry Smith 
40966a9b8d82SBarry Smith   Developer Notes:
40972ef1f0ffSBarry Smith   An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and
40982ef1f0ffSBarry Smith   then just copies the `v` values directly with `PetscMemcpy()`.
40996a9b8d82SBarry Smith 
410011a5261eSBarry Smith   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
41016a9b8d82SBarry Smith 
4102fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()`
4103a1661176SMatthew Knepley @*/
4104d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4105d71ae5a4SJacob Faibussowitsch {
4106a1661176SMatthew Knepley   PetscFunctionBegin;
41070700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
41086ba663aaSJed Brown   PetscValidType(B, 1);
4109cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
41103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4111a1661176SMatthew Knepley }
4112a1661176SMatthew Knepley 
4113ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4114d71ae5a4SJacob Faibussowitsch {
4115a1661176SMatthew Knepley   PetscInt  i;
4116a1661176SMatthew Knepley   PetscInt  m, n;
4117a1661176SMatthew Knepley   PetscInt  nz;
41186a9b8d82SBarry Smith   PetscInt *nnz;
4119a1661176SMatthew Knepley 
4120a1661176SMatthew Knepley   PetscFunctionBegin;
4121aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4122779a8d59SSatish Balay 
41239566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
41249566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4125779a8d59SSatish Balay 
41269566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
41279566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4128a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4129b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
413008401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4131a1661176SMatthew Knepley     nnz[i] = nz;
4132a1661176SMatthew Knepley   }
41339566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
41349566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4135a1661176SMatthew Knepley 
41368e3a54c0SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES));
4137a1661176SMatthew Knepley 
41389566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
41399566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4140a1661176SMatthew Knepley 
41419566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
41423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4143a1661176SMatthew Knepley }
4144a1661176SMatthew Knepley 
4145ad7e164aSPierre Jolivet /*@
41462ef1f0ffSBarry Smith   MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`.
4147ad7e164aSPierre Jolivet 
4148ad7e164aSPierre Jolivet   Input Parameters:
4149ad7e164aSPierre Jolivet + A     - left-hand side matrix
4150ad7e164aSPierre Jolivet . B     - right-hand side matrix
415111a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4152ad7e164aSPierre Jolivet 
4153ad7e164aSPierre Jolivet   Output Parameter:
41542ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B`
4155ad7e164aSPierre Jolivet 
4156ad7e164aSPierre Jolivet   Level: intermediate
4157ad7e164aSPierre Jolivet 
415811a5261eSBarry Smith   Note:
415911a5261eSBarry Smith   `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`.
4160ad7e164aSPierre Jolivet 
41611cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4162ad7e164aSPierre Jolivet @*/
4163d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4164d71ae5a4SJacob Faibussowitsch {
4165ad7e164aSPierre Jolivet   PetscFunctionBegin;
4166ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4167ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4168ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4169ad7e164aSPierre Jolivet   PetscValidType(B, 2);
41704f572ea9SToby Isaac   PetscAssertPointer(C, 4);
4171ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4172ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4173ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4174ad7e164aSPierre Jolivet   }
4175cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
41763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4177ad7e164aSPierre Jolivet }
4178ad7e164aSPierre Jolivet 
4179ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4180d71ae5a4SJacob Faibussowitsch {
4181ad7e164aSPierre Jolivet   Mat                newmat;
4182ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4183ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4184ad7e164aSPierre Jolivet   PetscScalar       *v;
4185fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4186ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4187ad7e164aSPierre Jolivet   PetscBool          flg;
4188ad7e164aSPierre Jolivet 
4189ad7e164aSPierre Jolivet   PetscFunctionBegin;
419028b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
419128b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
419228b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
419328b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
41949566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
419528b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4196aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4197ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
41989566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
41999566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
42009566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
42019566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4202ad7e164aSPierre Jolivet     i[0] = 0;
4203ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4204ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4205ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4206ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4207ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4208ad7e164aSPierre Jolivet         }
4209ad7e164aSPierre Jolivet       }
4210ad7e164aSPierre Jolivet     }
42119566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4212ad7e164aSPierre Jolivet     *C = newmat;
42139566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4214ad7e164aSPierre Jolivet     nnz = 0;
4215ad7e164aSPierre Jolivet   }
42169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
42179566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
42189566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4219ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4220ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4221ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4222ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4223ad7e164aSPierre Jolivet       }
4224ad7e164aSPierre Jolivet     }
4225ad7e164aSPierre Jolivet   }
42269566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
42279566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
42289566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
42293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4230ad7e164aSPierre Jolivet }
4231ad7e164aSPierre Jolivet 
4232c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4233af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4234170fe5c8SBarry Smith 
4235170fe5c8SBarry Smith /*
4236170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4237170fe5c8SBarry Smith 
4238170fe5c8SBarry Smith                n                       p                          p
42392da392ccSBarry Smith         [             ]       [             ]         [                 ]
42402da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
42412da392ccSBarry Smith         [             ]       [             ]         [                 ]
4242170fe5c8SBarry Smith 
4243170fe5c8SBarry Smith */
4244d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4245d71ae5a4SJacob Faibussowitsch {
4246170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4247170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4248170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
424986214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4250170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4251170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4252170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
425386214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
425486214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4255170fe5c8SBarry Smith 
4256170fe5c8SBarry Smith   PetscFunctionBegin;
4257d0f46423SBarry Smith   m = A->rmap->n;
4258d0f46423SBarry Smith   n = A->cmap->n;
4259d0f46423SBarry Smith   p = B->cmap->n;
4260170fe5c8SBarry Smith   a = sub_a->v;
4261170fe5c8SBarry Smith   b = sub_b->a;
4262170fe5c8SBarry Smith   c = sub_c->v;
426386214ceeSStefano Zampini   if (clda == m) {
42649566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
426586214ceeSStefano Zampini   } else {
426686214ceeSStefano Zampini     for (j = 0; j < p; j++)
42679371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
426886214ceeSStefano Zampini   }
4269170fe5c8SBarry Smith   ii  = sub_b->i;
4270170fe5c8SBarry Smith   idx = sub_b->j;
4271170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4272170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4273170fe5c8SBarry Smith     while (q-- > 0) {
427486214ceeSStefano Zampini       c_q = c + clda * (*idx);
427586214ceeSStefano Zampini       a_q = a + alda * i;
4276854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4277170fe5c8SBarry Smith       idx++;
4278170fe5c8SBarry Smith       b++;
4279170fe5c8SBarry Smith     }
4280170fe5c8SBarry Smith   }
42813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4282170fe5c8SBarry Smith }
4283170fe5c8SBarry Smith 
4284d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4285d71ae5a4SJacob Faibussowitsch {
4286d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
428786214ceeSStefano Zampini   PetscBool cisdense;
4288170fe5c8SBarry Smith 
4289170fe5c8SBarry Smith   PetscFunctionBegin;
429008401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
42919566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
42929566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
4293d5e393b6SSuyash Tandon   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, ""));
429448a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
42959566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4296d73949e8SHong Zhang 
42974222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
42983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4299170fe5c8SBarry Smith }
4300170fe5c8SBarry Smith 
43010bad9183SKris Buschelman /*MC
4302fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
43030bad9183SKris Buschelman    based on compressed sparse row format.
43040bad9183SKris Buschelman 
43052ef1f0ffSBarry Smith    Options Database Key:
43060bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
43070bad9183SKris Buschelman 
43080bad9183SKris Buschelman    Level: beginner
43090bad9183SKris Buschelman 
43100cd7f59aSBarry Smith    Notes:
43112ef1f0ffSBarry Smith     `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values,
43120cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
43130cd7f59aSBarry Smith     in the matrix
43140cd7f59aSBarry Smith 
    `MatSetOption`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored
43170cd7f59aSBarry Smith 
431811a5261eSBarry Smith   Developer Note:
43192ef1f0ffSBarry Smith     It would be nice if all matrix formats supported passing `NULL` in for the numerical values
43200cd7f59aSBarry Smith 
43211cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
43220bad9183SKris Buschelman M*/
43230bad9183SKris Buschelman 
4324ccd284c7SBarry Smith /*MC
4325ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4326ccd284c7SBarry Smith 
432711a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
432811a5261eSBarry Smith    and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
432911a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4330ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4331ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4332ccd284c7SBarry Smith 
43332ef1f0ffSBarry Smith    Options Database Key:
433411a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`
4335ccd284c7SBarry Smith 
43362ef1f0ffSBarry Smith   Level: beginner
43372ef1f0ffSBarry Smith 
433811a5261eSBarry Smith    Note:
433911a5261eSBarry Smith    Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when
4340ccd284c7SBarry Smith    enough exist.
4341ccd284c7SBarry Smith 
43421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
4343ccd284c7SBarry Smith M*/
4344ccd284c7SBarry Smith 
4345ccd284c7SBarry Smith /*MC
4346ccd284c7SBarry Smith    MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.
4347ccd284c7SBarry Smith 
43482ef1f0ffSBarry Smith    Options Database Key:
43492ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`
43502ef1f0ffSBarry Smith 
43512ef1f0ffSBarry Smith   Level: beginner
43522ef1f0ffSBarry Smith 
43532ef1f0ffSBarry Smith    Note:
435411a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
435511a5261eSBarry Smith    and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
435611a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4357ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4358ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4359ccd284c7SBarry Smith 
.seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
4361ccd284c7SBarry Smith M*/
4362ccd284c7SBarry Smith 
43637906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
43647906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
43657906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
43667906f579SHong Zhang #endif
4367d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
4368d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4369d24d4204SJose E. Roman #endif
43707906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
43717906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
43727906f579SHong Zhang #endif
43737906f579SHong Zhang 
4374d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4375c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
43764222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
43777906f579SHong Zhang 
43788c778c55SBarry Smith /*@C
437911a5261eSBarry Smith   MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
43808c778c55SBarry Smith 
43818c778c55SBarry Smith   Not Collective
43828c778c55SBarry Smith 
43838c778c55SBarry Smith   Input Parameter:
4384fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
43858c778c55SBarry Smith 
43868c778c55SBarry Smith   Output Parameter:
43878c778c55SBarry Smith . array - pointer to the data
43888c778c55SBarry Smith 
43898c778c55SBarry Smith   Level: intermediate
43908c778c55SBarry Smith 
4391fe59aa6dSJacob Faibussowitsch   Fortran Notes:
43920ab4885dSBarry Smith   `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()`
43930ab4885dSBarry Smith 
43941cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
43958c778c55SBarry Smith @*/
43965d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[])
4397d71ae5a4SJacob Faibussowitsch {
4398d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
43998c778c55SBarry Smith 
44008c778c55SBarry Smith   PetscFunctionBegin;
4401d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
44029566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4403d67d9f35SJunchao Zhang   } else {
4404d67d9f35SJunchao Zhang     *array = aij->a;
4405d67d9f35SJunchao Zhang   }
44063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4407d67d9f35SJunchao Zhang }
4408d67d9f35SJunchao Zhang 
4409d67d9f35SJunchao Zhang /*@C
441011a5261eSBarry Smith   MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4411d67d9f35SJunchao Zhang 
4412d67d9f35SJunchao Zhang   Not Collective
4413d67d9f35SJunchao Zhang 
4414d67d9f35SJunchao Zhang   Input Parameters:
4415fe59aa6dSJacob Faibussowitsch + A     - a `MATSEQAIJ` matrix
4416d67d9f35SJunchao Zhang - array - pointer to the data
4417d67d9f35SJunchao Zhang 
4418d67d9f35SJunchao Zhang   Level: intermediate
4419d67d9f35SJunchao Zhang 
4420fe59aa6dSJacob Faibussowitsch   Fortran Notes:
44210ab4885dSBarry Smith   `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()`
44220ab4885dSBarry Smith 
44231cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()`
4424d67d9f35SJunchao Zhang @*/
44255d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[])
4426d71ae5a4SJacob Faibussowitsch {
4427d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4428d67d9f35SJunchao Zhang 
4429d67d9f35SJunchao Zhang   PetscFunctionBegin;
4430d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
44319566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4432d67d9f35SJunchao Zhang   } else {
4433d67d9f35SJunchao Zhang     *array = NULL;
4434d67d9f35SJunchao Zhang   }
44359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
44369566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
44373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44388c778c55SBarry Smith }
44398c778c55SBarry Smith 
444021e72a00SBarry Smith /*@C
444111a5261eSBarry Smith   MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
44428f1ea47aSStefano Zampini 
44430ab4885dSBarry Smith   Not Collective; No Fortran Support
44448f1ea47aSStefano Zampini 
44458f1ea47aSStefano Zampini   Input Parameter:
4446fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44478f1ea47aSStefano Zampini 
44488f1ea47aSStefano Zampini   Output Parameter:
44498f1ea47aSStefano Zampini . array - pointer to the data
44508f1ea47aSStefano Zampini 
44518f1ea47aSStefano Zampini   Level: intermediate
44528f1ea47aSStefano Zampini 
44531cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
44548f1ea47aSStefano Zampini @*/
44555d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[])
4456d71ae5a4SJacob Faibussowitsch {
4457d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44588f1ea47aSStefano Zampini 
44598f1ea47aSStefano Zampini   PetscFunctionBegin;
4460d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
44619566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4462d67d9f35SJunchao Zhang   } else {
4463d67d9f35SJunchao Zhang     *array = aij->a;
4464d67d9f35SJunchao Zhang   }
44653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44668f1ea47aSStefano Zampini }
44678f1ea47aSStefano Zampini 
44688f1ea47aSStefano Zampini /*@C
446911a5261eSBarry Smith   MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
44708f1ea47aSStefano Zampini 
44710ab4885dSBarry Smith   Not Collective; No Fortran Support
44728f1ea47aSStefano Zampini 
44738f1ea47aSStefano Zampini   Input Parameter:
4474fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44758f1ea47aSStefano Zampini 
44768f1ea47aSStefano Zampini   Output Parameter:
44778f1ea47aSStefano Zampini . array - pointer to the data
44788f1ea47aSStefano Zampini 
44798f1ea47aSStefano Zampini   Level: intermediate
44808f1ea47aSStefano Zampini 
44811cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
44828f1ea47aSStefano Zampini @*/
44835d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[])
4484d71ae5a4SJacob Faibussowitsch {
4485d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44868f1ea47aSStefano Zampini 
44878f1ea47aSStefano Zampini   PetscFunctionBegin;
4488d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
44899566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4490d67d9f35SJunchao Zhang   } else {
4491d67d9f35SJunchao Zhang     *array = NULL;
4492d67d9f35SJunchao Zhang   }
44933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4494d67d9f35SJunchao Zhang }
4495d67d9f35SJunchao Zhang 
4496d67d9f35SJunchao Zhang /*@C
449711a5261eSBarry Smith   MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4498d67d9f35SJunchao Zhang 
44990ab4885dSBarry Smith   Not Collective; No Fortran Support
4500d67d9f35SJunchao Zhang 
4501d67d9f35SJunchao Zhang   Input Parameter:
4502fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
4503d67d9f35SJunchao Zhang 
4504d67d9f35SJunchao Zhang   Output Parameter:
4505d67d9f35SJunchao Zhang . array - pointer to the data
4506d67d9f35SJunchao Zhang 
4507d67d9f35SJunchao Zhang   Level: intermediate
4508d67d9f35SJunchao Zhang 
45091cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
4510d67d9f35SJunchao Zhang @*/
45115d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[])
4512d71ae5a4SJacob Faibussowitsch {
4513d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4514d67d9f35SJunchao Zhang 
4515d67d9f35SJunchao Zhang   PetscFunctionBegin;
4516d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
45179566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4518d67d9f35SJunchao Zhang   } else {
4519d67d9f35SJunchao Zhang     *array = aij->a;
4520d67d9f35SJunchao Zhang   }
45219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
45229566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
45233ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4524d67d9f35SJunchao Zhang }
4525d67d9f35SJunchao Zhang 
4526d67d9f35SJunchao Zhang /*@C
4527d67d9f35SJunchao Zhang   MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead
4528d67d9f35SJunchao Zhang 
45290ab4885dSBarry Smith   Not Collective; No Fortran Support
4530d67d9f35SJunchao Zhang 
4531d67d9f35SJunchao Zhang   Input Parameter:
4532fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix
4533d67d9f35SJunchao Zhang 
4534d67d9f35SJunchao Zhang   Output Parameter:
4535d67d9f35SJunchao Zhang . array - pointer to the data
4536d67d9f35SJunchao Zhang 
4537d67d9f35SJunchao Zhang   Level: intermediate
4538d67d9f35SJunchao Zhang 
45391cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
4540d67d9f35SJunchao Zhang @*/
45415d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[])
4542d71ae5a4SJacob Faibussowitsch {
4543d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4544d67d9f35SJunchao Zhang 
4545d67d9f35SJunchao Zhang   PetscFunctionBegin;
4546d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
45479566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4548d67d9f35SJunchao Zhang   } else {
4549d67d9f35SJunchao Zhang     *array = NULL;
4550d67d9f35SJunchao Zhang   }
45513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45528f1ea47aSStefano Zampini }
45538f1ea47aSStefano Zampini 
45548f1ea47aSStefano Zampini /*@C
455511a5261eSBarry Smith   MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
45567ee59b9bSJunchao Zhang 
45570ab4885dSBarry Smith   Not Collective; No Fortran Support
45587ee59b9bSJunchao Zhang 
45597ee59b9bSJunchao Zhang   Input Parameter:
456011a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses
45617ee59b9bSJunchao Zhang 
45627ee59b9bSJunchao Zhang   Output Parameters:
45637ee59b9bSJunchao Zhang + i     - row map array of the matrix
45647ee59b9bSJunchao Zhang . j     - column index array of the matrix
45657ee59b9bSJunchao Zhang . a     - data array of the matrix
4566fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays
45677ee59b9bSJunchao Zhang 
4568fe59aa6dSJacob Faibussowitsch   Level: developer
45692ef1f0ffSBarry Smith 
45707ee59b9bSJunchao Zhang   Notes:
45712ef1f0ffSBarry Smith   Any of the output parameters can be `NULL`, in which case the corresponding value is not returned.
45727ee59b9bSJunchao Zhang   If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
45737ee59b9bSJunchao Zhang 
45747ee59b9bSJunchao Zhang   One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
45752ef1f0ffSBarry Smith   If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix.
45767ee59b9bSJunchao Zhang 
45771cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45787ee59b9bSJunchao Zhang @*/
45795d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype)
4580d71ae5a4SJacob Faibussowitsch {
45817ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
45827ee59b9bSJunchao Zhang 
45837ee59b9bSJunchao Zhang   PetscFunctionBegin;
45847ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
45857ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
45867ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
45877ee59b9bSJunchao Zhang   } else {
45887ee59b9bSJunchao Zhang     if (i) *i = aij->i;
45897ee59b9bSJunchao Zhang     if (j) *j = aij->j;
45907ee59b9bSJunchao Zhang     if (a) *a = aij->a;
45917ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
45927ee59b9bSJunchao Zhang   }
45933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45947ee59b9bSJunchao Zhang }
45957ee59b9bSJunchao Zhang 
4596cc4c1da9SBarry Smith /*@
459721e72a00SBarry Smith   MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
459821e72a00SBarry Smith 
459921e72a00SBarry Smith   Not Collective
460021e72a00SBarry Smith 
460121e72a00SBarry Smith   Input Parameter:
4602fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
460321e72a00SBarry Smith 
460421e72a00SBarry Smith   Output Parameter:
460521e72a00SBarry Smith . nz - the maximum number of nonzeros in any row
460621e72a00SBarry Smith 
460721e72a00SBarry Smith   Level: intermediate
460821e72a00SBarry Smith 
46091cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
461021e72a00SBarry Smith @*/
4611d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4612d71ae5a4SJacob Faibussowitsch {
461321e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
461421e72a00SBarry Smith 
461521e72a00SBarry Smith   PetscFunctionBegin;
461621e72a00SBarry Smith   *nz = aij->rmax;
46173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
461821e72a00SBarry Smith }
461921e72a00SBarry Smith 
46202c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data)
46212c4ab24aSJunchao Zhang {
46222c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data;
46234d86920dSPierre Jolivet 
46242c4ab24aSJunchao Zhang   PetscFunctionBegin;
46252c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->perm));
46262c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->jmap));
46272c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo));
46282c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
46292c4ab24aSJunchao Zhang }
46302c4ab24aSJunchao Zhang 
4631d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4632d71ae5a4SJacob Faibussowitsch {
4633394ed5ebSJunchao Zhang   MPI_Comm             comm;
4634394ed5ebSJunchao Zhang   PetscInt            *i, *j;
46350d88f7f4SJunchao Zhang   PetscInt             M, N, row, iprev;
4636394ed5ebSJunchao Zhang   PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4637394ed5ebSJunchao Zhang   PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
4638394ed5ebSJunchao Zhang   PetscInt            *Aj;
4639394ed5ebSJunchao Zhang   PetscScalar         *Aa;
4640f4f49eeaSPierre Jolivet   Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)mat->data;
4641cbc6b225SStefano Zampini   MatType              rtype;
4642394ed5ebSJunchao Zhang   PetscCount          *perm, *jmap;
46432c4ab24aSJunchao Zhang   PetscContainer       container;
46442c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
46450d88f7f4SJunchao Zhang   PetscBool            isorted;
4646*9f0612e4SBarry Smith   PetscBool            hypre;
4647*9f0612e4SBarry Smith   const char          *name;
4648394ed5ebSJunchao Zhang 
4649394ed5ebSJunchao Zhang   PetscFunctionBegin;
46509566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
46519566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4652e8729f6fSJunchao Zhang   i = coo_i;
4653e8729f6fSJunchao Zhang   j = coo_j;
46549566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
46550d88f7f4SJunchao Zhang 
46560d88f7f4SJunchao Zhang   /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */
46570d88f7f4SJunchao Zhang   isorted = PETSC_TRUE;
46580d88f7f4SJunchao Zhang   iprev   = PETSC_INT_MIN;
46590d88f7f4SJunchao Zhang   for (k = 0; k < coo_n; k++) {
4660394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
46610d88f7f4SJunchao Zhang     if (isorted) {
46620d88f7f4SJunchao Zhang       if (i[k] < iprev) isorted = PETSC_FALSE;
46630d88f7f4SJunchao Zhang       else iprev = i[k];
46640d88f7f4SJunchao Zhang     }
4665394ed5ebSJunchao Zhang     perm[k] = k;
4666394ed5ebSJunchao Zhang   }
4667394ed5ebSJunchao Zhang 
46680d88f7f4SJunchao Zhang   /* Sort by row if not already */
46690d88f7f4SJunchao Zhang   if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
4670651b1cf9SStefano Zampini 
4671651b1cf9SStefano Zampini   /* Advance k to the first row with a non-negative index */
4672651b1cf9SStefano Zampini   for (k = 0; k < coo_n; k++)
46739371c9d4SSatish Balay     if (i[k] >= 0) break;
4674394ed5ebSJunchao Zhang   nneg = k;
46759566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4676394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
467735cb6cd3SPierre Jolivet   jmap++;                                           /* Inc jmap by 1 for convenience */
4678394ed5ebSJunchao Zhang 
4679*9f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */
4680*9f0612e4SBarry Smith   PetscCall(PetscArrayzero(Ai, M + 1));
4681*9f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */
4682394ed5ebSJunchao Zhang 
4683651b1cf9SStefano Zampini   PetscCall(PetscObjectGetName((PetscObject)mat, &name));
4684651b1cf9SStefano Zampini   PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre));
4685651b1cf9SStefano Zampini 
4686394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
468735cb6cd3SPierre Jolivet   Ai++;  /* Inc by 1 for convenience */
4688394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4689394ed5ebSJunchao Zhang   while (k < coo_n) {
46900d88f7f4SJunchao Zhang     PetscBool strictly_sorted; // this row is strictly sorted?
46910d88f7f4SJunchao Zhang     PetscInt  jprev;
46920d88f7f4SJunchao Zhang 
46930d88f7f4SJunchao Zhang     /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */
4694394ed5ebSJunchao Zhang     row             = i[k];
46950d88f7f4SJunchao Zhang     start           = k;
46960d88f7f4SJunchao Zhang     jprev           = PETSC_INT_MIN;
46970d88f7f4SJunchao Zhang     strictly_sorted = PETSC_TRUE;
46980d88f7f4SJunchao Zhang     while (k < coo_n && i[k] == row) {
46990d88f7f4SJunchao Zhang       if (strictly_sorted) {
47000d88f7f4SJunchao Zhang         if (j[k] <= jprev) strictly_sorted = PETSC_FALSE;
47010d88f7f4SJunchao Zhang         else jprev = j[k];
47020d88f7f4SJunchao Zhang       }
47030d88f7f4SJunchao Zhang       k++;
47040d88f7f4SJunchao Zhang     }
4705394ed5ebSJunchao Zhang     end = k;
47060d88f7f4SJunchao Zhang 
4707651b1cf9SStefano Zampini     /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
4708651b1cf9SStefano Zampini     if (hypre) {
4709651b1cf9SStefano Zampini       PetscInt  minj    = PETSC_MAX_INT;
4710651b1cf9SStefano Zampini       PetscBool hasdiag = PETSC_FALSE;
47110d88f7f4SJunchao Zhang 
47120d88f7f4SJunchao Zhang       if (strictly_sorted) { // fast path to swap the first and the diag
47130d88f7f4SJunchao Zhang         PetscCount tmp;
47140d88f7f4SJunchao Zhang         for (p = start; p < end; p++) {
47150d88f7f4SJunchao Zhang           if (j[p] == row && p != start) {
47160d88f7f4SJunchao Zhang             j[p]        = j[start];
47170d88f7f4SJunchao Zhang             j[start]    = row;
47180d88f7f4SJunchao Zhang             tmp         = perm[start];
47190d88f7f4SJunchao Zhang             perm[start] = perm[p];
47200d88f7f4SJunchao Zhang             perm[p]     = tmp;
47210d88f7f4SJunchao Zhang             break;
47220d88f7f4SJunchao Zhang           }
47230d88f7f4SJunchao Zhang         }
47240d88f7f4SJunchao Zhang       } else {
4725651b1cf9SStefano Zampini         for (p = start; p < end; p++) {
4726651b1cf9SStefano Zampini           hasdiag = (PetscBool)(hasdiag || (j[p] == row));
4727651b1cf9SStefano Zampini           minj    = PetscMin(minj, j[p]);
4728651b1cf9SStefano Zampini         }
47290d88f7f4SJunchao Zhang 
4730651b1cf9SStefano Zampini         if (hasdiag) {
4731651b1cf9SStefano Zampini           for (p = start; p < end; p++) {
4732651b1cf9SStefano Zampini             if (j[p] == minj) j[p] = row;
4733651b1cf9SStefano Zampini             else if (j[p] == row) j[p] = minj;
4734651b1cf9SStefano Zampini           }
4735651b1cf9SStefano Zampini         }
4736651b1cf9SStefano Zampini       }
47370d88f7f4SJunchao Zhang     }
47380d88f7f4SJunchao Zhang     // sort by columns in a row
47390d88f7f4SJunchao Zhang     if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
4740651b1cf9SStefano Zampini 
47410d88f7f4SJunchao Zhang     if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q
47420d88f7f4SJunchao Zhang       for (p = start; p < end; p++, q++) {
47430d88f7f4SJunchao Zhang         Aj[q]   = j[p];
47440d88f7f4SJunchao Zhang         jmap[q] = 1;
47450d88f7f4SJunchao Zhang       }
47460d88f7f4SJunchao Zhang       Ai[row] = end - start;
47470d88f7f4SJunchao Zhang       nnz += Ai[row]; // q is already advanced
47480d88f7f4SJunchao Zhang     } else {
4749394ed5ebSJunchao Zhang       /* Find number of unique col entries in this row */
4750394ed5ebSJunchao Zhang       Aj[q]   = j[start]; /* Log the first nonzero in this row */
4751651b1cf9SStefano Zampini       jmap[q] = 1;        /* Number of repeats of this nonzero entry */
4752394ed5ebSJunchao Zhang       Ai[row] = 1;
4753394ed5ebSJunchao Zhang       nnz++;
4754394ed5ebSJunchao Zhang 
4755394ed5ebSJunchao Zhang       for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4756394ed5ebSJunchao Zhang         if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4757394ed5ebSJunchao Zhang           q++;
4758394ed5ebSJunchao Zhang           jmap[q] = 1;
4759394ed5ebSJunchao Zhang           Aj[q]   = j[p];
4760394ed5ebSJunchao Zhang           Ai[row]++;
4761394ed5ebSJunchao Zhang           nnz++;
4762394ed5ebSJunchao Zhang         } else {
4763394ed5ebSJunchao Zhang           jmap[q]++;
4764394ed5ebSJunchao Zhang         }
4765394ed5ebSJunchao Zhang       }
4766394ed5ebSJunchao Zhang       q++; /* Move to next row and thus next unique nonzero */
4767394ed5ebSJunchao Zhang     }
47680d88f7f4SJunchao Zhang   }
47690d88f7f4SJunchao Zhang 
4770394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4771394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
47720d88f7f4SJunchao Zhang   jmap--; // Back to the beginning of jmap[]
4773394ed5ebSJunchao Zhang   jmap[0] = 0;
4774394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
47750d88f7f4SJunchao Zhang 
4776*9f0612e4SBarry Smith   if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */
4777394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4778394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4779394ed5ebSJunchao Zhang 
47809566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
47819566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
47829566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4783394ed5ebSJunchao Zhang     jmap = jmap_new;
4784394ed5ebSJunchao Zhang 
4785*9f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new));
47869566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
4787*9f0612e4SBarry Smith     PetscCall(PetscShmgetDeallocateArray((void **)&Aj));
4788394ed5ebSJunchao Zhang     Aj = Aj_new;
4789394ed5ebSJunchao Zhang   }
4790394ed5ebSJunchao Zhang 
4791394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4792394ed5ebSJunchao Zhang     PetscCount *perm_new;
4793cbc6b225SStefano Zampini 
47949566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
47959566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
47969566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4797394ed5ebSJunchao Zhang     perm = perm_new;
4798394ed5ebSJunchao Zhang   }
4799394ed5ebSJunchao Zhang 
48009566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
4801*9f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa));
4802*9f0612e4SBarry Smith   PetscCall(PetscArrayzero(Aa, nnz));
48039566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4804394ed5ebSJunchao Zhang 
4805394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
48062c4ab24aSJunchao Zhang 
48072c4ab24aSJunchao Zhang   // Put the COO struct in a container and then attach that to the matrix
48082c4ab24aSJunchao Zhang   PetscCall(PetscMalloc1(1, &coo));
48092c4ab24aSJunchao Zhang   coo->nz   = nnz;
48102c4ab24aSJunchao Zhang   coo->n    = coo_n;
48112c4ab24aSJunchao Zhang   coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
48122c4ab24aSJunchao Zhang   coo->jmap = jmap;         // of length nnz+1
48132c4ab24aSJunchao Zhang   coo->perm = perm;
48142c4ab24aSJunchao Zhang   PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container));
48152c4ab24aSJunchao Zhang   PetscCall(PetscContainerSetPointer(container, coo));
48162c4ab24aSJunchao Zhang   PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ));
48172c4ab24aSJunchao Zhang   PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container));
48182c4ab24aSJunchao Zhang   PetscCall(PetscContainerDestroy(&container));
48193ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4820394ed5ebSJunchao Zhang }
4821394ed5ebSJunchao Zhang 
4822d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4823d71ae5a4SJacob Faibussowitsch {
4824394ed5ebSJunchao Zhang   Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
4825394ed5ebSJunchao Zhang   PetscCount           i, j, Annz = aseq->nz;
48262c4ab24aSJunchao Zhang   PetscCount          *perm, *jmap;
4827394ed5ebSJunchao Zhang   PetscScalar         *Aa;
48282c4ab24aSJunchao Zhang   PetscContainer       container;
48292c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4830394ed5ebSJunchao Zhang 
4831394ed5ebSJunchao Zhang   PetscFunctionBegin;
48322c4ab24aSJunchao Zhang   PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
48332c4ab24aSJunchao Zhang   PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
48342c4ab24aSJunchao Zhang   PetscCall(PetscContainerGetPointer(container, (void **)&coo));
48352c4ab24aSJunchao Zhang   perm = coo->perm;
48362c4ab24aSJunchao Zhang   jmap = coo->jmap;
48379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4838394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4839b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4840b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4841b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4842394ed5ebSJunchao Zhang   }
48439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
48443ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4845394ed5ebSJunchao Zhang }
4846394ed5ebSJunchao Zhang 
/* Prototypes of the optional device conversion routines composed on the matrix in MatCreate_SeqAIJ() */
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat A, MatType newtype, MatReuse reuse, Mat *newmat);
#endif /* PETSC_HAVE_CUDA */
#if defined(PETSC_HAVE_HIP)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat A, MatType newtype, MatReuse reuse, Mat *newmat);
#endif /* PETSC_HAVE_HIP */
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat A, MatType newtype, MatReuse reuse, Mat *newmat);
#endif /* PETSC_HAVE_KOKKOS_KERNELS */
485602fe1965SBarry Smith 
4857d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4858d71ae5a4SJacob Faibussowitsch {
4859273d9f13SBarry Smith   Mat_SeqAIJ *b;
486038baddfdSBarry Smith   PetscMPIInt size;
4861273d9f13SBarry Smith 
4862273d9f13SBarry Smith   PetscFunctionBegin;
48639566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
486408401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4865273d9f13SBarry Smith 
48664dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
48672205254eSKarl Rupp 
4868b0a32e0cSBarry Smith   B->data   = (void *)b;
4869aea10558SJacob Faibussowitsch   B->ops[0] = MatOps_Values;
4870071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
48712205254eSKarl Rupp 
4872f4259b30SLisandro Dalcin   b->row                = NULL;
4873f4259b30SLisandro Dalcin   b->col                = NULL;
4874f4259b30SLisandro Dalcin   b->icol               = NULL;
4875b810aeb4SBarry Smith   b->reallocs           = 0;
487636db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4877f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4878416022c9SBarry Smith   b->nonew              = 0;
4879f4259b30SLisandro Dalcin   b->diag               = NULL;
4880f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4881f4259b30SLisandro Dalcin   B->spptr              = NULL;
4882f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4883f4259b30SLisandro Dalcin   b->idiag              = NULL;
4884f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4885f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
488671f1c65dSBarry Smith   b->omega              = 1.0;
488771f1c65dSBarry Smith   b->fshift             = 0.0;
488871f1c65dSBarry Smith   b->idiagvalid         = PETSC_FALSE;
4889bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4890a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
489117ab2063SBarry Smith 
48929566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4893d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
48949566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
48959566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4896b3866ffcSBarry Smith #endif
48979566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
48989566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
48999566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
49009566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
49019566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
49029566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
49039566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
49049779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
49059566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4906191b95cbSRichard Tran Mills #endif
490734b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
49089566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
49099566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49109566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
491102fe1965SBarry Smith #endif
4912d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4913d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
4914d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
4915d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
4916d5e393b6SSuyash Tandon #endif
49173d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
49189566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
49193d0639e7SStefano Zampini #endif
49209566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4921af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
49229566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4923af8000cdSHong Zhang #endif
4924d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
49259566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4926d24d4204SJose E. Roman #endif
492763c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
49289566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
49299566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
493063c07aadSStefano Zampini #endif
49319566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
49329566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
49339566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
49349566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
493514e4dea2SJose E. Roman   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ));
49369566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
49379566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
49389566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
49399566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
49409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
49419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
49429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
49449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
49459566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
49469566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
49479566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
49489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
49493ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
495017ab2063SBarry Smith }
495117ab2063SBarry Smith 
4952b24902e0SBarry Smith /*
49533893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4954b24902e0SBarry Smith */
4955d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4956d71ae5a4SJacob Faibussowitsch {
49572a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4958071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
495917ab2063SBarry Smith 
49603a40ed3dSBarry Smith   PetscFunctionBegin;
4961aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4962273d9f13SBarry Smith 
4963d5f3da31SBarry Smith   C->factortype    = A->factortype;
4964f4259b30SLisandro Dalcin   c->row           = NULL;
4965f4259b30SLisandro Dalcin   c->col           = NULL;
4966f4259b30SLisandro Dalcin   c->icol          = NULL;
49676ad4291fSHong Zhang   c->reallocs      = 0;
4968bc43efbbSJunchao Zhang   c->diagonaldense = a->diagonaldense;
496917ab2063SBarry Smith 
497069272f91SPierre Jolivet   C->assembled = A->assembled;
497117ab2063SBarry Smith 
497269272f91SPierre Jolivet   if (A->preallocated) {
49739566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
49749566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4975eec197d1SBarry Smith 
497631fe6a7dSBarry Smith     if (!A->hash_active) {
49779566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->imax));
49789566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
49799566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->ilen));
49809566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));
498117ab2063SBarry Smith 
498217ab2063SBarry Smith       /* allocate the matrix space */
4983f77e22a1SHong Zhang       if (mallocmatspace) {
4984*9f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a));
4985*9f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j));
4986*9f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i));
49879566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->i, a->i, m + 1));
4988*9f0612e4SBarry Smith         c->free_a  = PETSC_TRUE;
4989*9f0612e4SBarry Smith         c->free_ij = PETSC_TRUE;
499017ab2063SBarry Smith         if (m > 0) {
49919566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
4992be6bf707SBarry Smith           if (cpvalues == MAT_COPY_VALUES) {
49932e5835c6SStefano Zampini             const PetscScalar *aa;
49942e5835c6SStefano Zampini 
49959566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
49969566063dSJacob Faibussowitsch             PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
49979566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
4998be6bf707SBarry Smith           } else {
49999566063dSJacob Faibussowitsch             PetscCall(PetscArrayzero(c->a, a->i[m]));
500017ab2063SBarry Smith           }
500108480c60SBarry Smith         }
5002f77e22a1SHong Zhang       }
500331fe6a7dSBarry Smith       C->preallocated = PETSC_TRUE;
500431fe6a7dSBarry Smith     } else {
500531fe6a7dSBarry Smith       PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix");
500631fe6a7dSBarry Smith       PetscCall(MatSetUp(C));
500731fe6a7dSBarry Smith     }
500817ab2063SBarry Smith 
50096ad4291fSHong Zhang     c->ignorezeroentries = a->ignorezeroentries;
5010416022c9SBarry Smith     c->roworiented       = a->roworiented;
5011416022c9SBarry Smith     c->nonew             = a->nonew;
5012416022c9SBarry Smith     if (a->diag) {
50139566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &c->diag));
50149566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt)));
5015071fcb05SBarry Smith     } else c->diag = NULL;
50162205254eSKarl Rupp 
5017f4259b30SLisandro Dalcin     c->solve_work         = NULL;
5018f4259b30SLisandro Dalcin     c->saved_values       = NULL;
5019f4259b30SLisandro Dalcin     c->idiag              = NULL;
5020f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
5021a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
50226ad4291fSHong Zhang 
5023893ad86cSHong Zhang     c->rmax  = a->rmax;
5024416022c9SBarry Smith     c->nz    = a->nz;
50258ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
5026754ec7b1SSatish Balay 
50276ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
50286ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
5029cd6b891eSBarry Smith     if (a->compressedrow.use) {
50306ad4291fSHong Zhang       i = a->compressedrow.nrows;
50319566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
50329566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
50339566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
503427ea64f8SHong Zhang     } else {
503527ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
50360298fd71SBarry Smith       c->compressedrow.i      = NULL;
50370298fd71SBarry Smith       c->compressedrow.rindex = NULL;
50386ad4291fSHong Zhang     }
5039ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
5040e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
50414846f1f5SKris Buschelman 
50429566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
504369272f91SPierre Jolivet   }
50449566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
50453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
504617ab2063SBarry Smith }
504717ab2063SBarry Smith 
5048d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
5049d71ae5a4SJacob Faibussowitsch {
5050b24902e0SBarry Smith   PetscFunctionBegin;
50519566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
50529566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
505348a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
50549566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
50559566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
50563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5057b24902e0SBarry Smith }
5058b24902e0SBarry Smith 
5059d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
5060d71ae5a4SJacob Faibussowitsch {
506152f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
506252f91c60SVaclav Hapla 
506352f91c60SVaclav Hapla   PetscFunctionBegin;
506452f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
506552f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
5066c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
50679566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
50689566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
50699566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
507052f91c60SVaclav Hapla   if (isbinary) {
50719566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
507252f91c60SVaclav Hapla   } else if (ishdf5) {
507352f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
50749566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
507552f91c60SVaclav Hapla #else
507652f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
507752f91c60SVaclav Hapla #endif
507852f91c60SVaclav Hapla   } else {
507998921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
508052f91c60SVaclav Hapla   }
50813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
508252f91c60SVaclav Hapla }
508352f91c60SVaclav Hapla 
5084d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
5085d71ae5a4SJacob Faibussowitsch {
50863ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
50873ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
5088fbdbba38SShri Abhyankar 
5089fbdbba38SShri Abhyankar   PetscFunctionBegin;
50909566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
5091bbead8a2SBarry Smith 
50923ea6fe3dSLisandro Dalcin   /* read in matrix header */
50939566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
509408401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
50959371c9d4SSatish Balay   M  = header[1];
50969371c9d4SSatish Balay   N  = header[2];
50979371c9d4SSatish Balay   nz = header[3];
509808401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
509908401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
510008401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
5101fbdbba38SShri Abhyankar 
51023ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
51039566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
51043ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
51053ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
51063ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
51073ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
51083ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
51099566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
51109566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
51113ea6fe3dSLisandro Dalcin 
51123ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
51139566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5114aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51153ea6fe3dSLisandro Dalcin 
5116fbdbba38SShri Abhyankar   /* read in row lengths */
51179566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
51189566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
51193ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
51209371c9d4SSatish Balay   sum = 0;
51219371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
512208401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
51233ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
51249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
51259566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5126aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51273ea6fe3dSLisandro Dalcin   /* store row lengths */
51289566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
51299566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
5130fbdbba38SShri Abhyankar 
51313ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
51329371c9d4SSatish Balay   a->i[0] = 0;
51339371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
51343ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
51359566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
51363ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
51379566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
5138fbdbba38SShri Abhyankar 
51399566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
51409566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
51413ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5142fbdbba38SShri Abhyankar }
5143fbdbba38SShri Abhyankar 
5144d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
5145d71ae5a4SJacob Faibussowitsch {
51467264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
5147fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
5148eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5149eeffb40dSHong Zhang   PetscInt k;
5150eeffb40dSHong Zhang #endif
51517264ac53SSatish Balay 
51523a40ed3dSBarry Smith   PetscFunctionBegin;
5153bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
5154d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
5155ca44d042SBarry Smith     *flg = PETSC_FALSE;
51563ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
5157bcd2baecSBarry Smith   }
51587264ac53SSatish Balay 
51597264ac53SSatish Balay   /* if the a->i are the same */
51609566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
51613ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
51627264ac53SSatish Balay 
51637264ac53SSatish Balay   /* if a->j are the same */
51649566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
51653ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
5166bcd2baecSBarry Smith 
51679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
51689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5169bcd2baecSBarry Smith   /* if a->a are the same */
5170eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5171eeffb40dSHong Zhang   for (k = 0; k < a->nz; k++) {
5172fff043a9SJunchao Zhang     if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) {
5173eeffb40dSHong Zhang       *flg = PETSC_FALSE;
51743ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
5175eeffb40dSHong Zhang     }
5176eeffb40dSHong Zhang   }
5177eeffb40dSHong Zhang #else
51789566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
5179eeffb40dSHong Zhang #endif
51809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
51819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
51823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51837264ac53SSatish Balay }
518436db0b34SBarry Smith 
518505869f15SSatish Balay /*@
518611a5261eSBarry Smith   MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
518736db0b34SBarry Smith   provided by the user.
518836db0b34SBarry Smith 
5189d083f849SBarry Smith   Collective
519036db0b34SBarry Smith 
519136db0b34SBarry Smith   Input Parameters:
519236db0b34SBarry Smith + comm - must be an MPI communicator of size 1
519336db0b34SBarry Smith . m    - number of rows
519436db0b34SBarry Smith . n    - number of columns
5195483a2f95SBarry Smith . i    - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
519636db0b34SBarry Smith . j    - column indices
519736db0b34SBarry Smith - a    - matrix values
519836db0b34SBarry Smith 
519936db0b34SBarry Smith   Output Parameter:
520036db0b34SBarry Smith . mat - the matrix
520136db0b34SBarry Smith 
520236db0b34SBarry Smith   Level: intermediate
520336db0b34SBarry Smith 
520436db0b34SBarry Smith   Notes:
52052ef1f0ffSBarry Smith   The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
5206292fb18eSBarry Smith   once the matrix is destroyed and not before
520736db0b34SBarry Smith 
520836db0b34SBarry Smith   You cannot set new nonzero locations into this matrix, that will generate an error.
520936db0b34SBarry Smith 
52102ef1f0ffSBarry Smith   The `i` and `j` indices are 0 based
521136db0b34SBarry Smith 
5212a4552177SSatish Balay   The format which is used for the sparse matrix input, is equivalent to a
5213a4552177SSatish Balay   row-major ordering.. i.e for the following matrix, the input data expected is
52148eef79e4SBarry Smith   as shown
52152ef1f0ffSBarry Smith .vb
52162ef1f0ffSBarry Smith         1 0 0
52172ef1f0ffSBarry Smith         2 0 3
52182ef1f0ffSBarry Smith         4 5 6
5219a4552177SSatish Balay 
52202ef1f0ffSBarry Smith         i =  {0,1,3,6}  [size = nrow+1  = 3+1]
52212ef1f0ffSBarry Smith         j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
52222ef1f0ffSBarry Smith         v =  {1,2,3,4,5,6}  [size = 6]
52232ef1f0ffSBarry Smith .ve
5224a4552177SSatish Balay 
52251cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
522636db0b34SBarry Smith @*/
5227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5228d71ae5a4SJacob Faibussowitsch {
5229cbcfb4deSHong Zhang   PetscInt    ii;
523036db0b34SBarry Smith   Mat_SeqAIJ *aij;
5231cbcfb4deSHong Zhang   PetscInt    jj;
523236db0b34SBarry Smith 
523336db0b34SBarry Smith   PetscFunctionBegin;
5234aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
52359566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52369566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52379566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
52389566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52399566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5240ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
52419566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
52429566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5243ab93d7beSBarry Smith 
524436db0b34SBarry Smith   aij->i       = i;
524536db0b34SBarry Smith   aij->j       = j;
524636db0b34SBarry Smith   aij->a       = a;
524736db0b34SBarry Smith   aij->nonew   = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5248e6b907acSBarry Smith   aij->free_a  = PETSC_FALSE;
5249e6b907acSBarry Smith   aij->free_ij = PETSC_FALSE;
525036db0b34SBarry Smith 
5251cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
525236db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
525376bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5254aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
52559985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
525608401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
525708401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
52589985e31cSBarry Smith       }
525936db0b34SBarry Smith     }
526076bd3646SJed Brown   }
526176bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
526236db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
526308401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5264da0802e2SStefano Zampini       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1);
526536db0b34SBarry Smith     }
526676bd3646SJed Brown   }
526736db0b34SBarry Smith 
52689566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52699566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
527136db0b34SBarry Smith }
5272cbc6b225SStefano Zampini 
5273f62e3866SBarry Smith /*@
527411a5261eSBarry Smith   MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
52758a0b0e6bSVictor Minden   provided by the user.
52768a0b0e6bSVictor Minden 
5277d083f849SBarry Smith   Collective
52788a0b0e6bSVictor Minden 
52798a0b0e6bSVictor Minden   Input Parameters:
52808a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1
52818a0b0e6bSVictor Minden . m    - number of rows
52828a0b0e6bSVictor Minden . n    - number of columns
52838a0b0e6bSVictor Minden . i    - row indices
52848a0b0e6bSVictor Minden . j    - column indices
52851230e6d1SVictor Minden . a    - matrix values
52861230e6d1SVictor Minden . nz   - number of nonzeros
52872ef1f0ffSBarry Smith - idx  - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
52888a0b0e6bSVictor Minden 
52898a0b0e6bSVictor Minden   Output Parameter:
52908a0b0e6bSVictor Minden . mat - the matrix
52918a0b0e6bSVictor Minden 
52928a0b0e6bSVictor Minden   Level: intermediate
52938a0b0e6bSVictor Minden 
5294f62e3866SBarry Smith   Example:
5295f62e3866SBarry Smith   For the following matrix, the input data expected is as shown (using 0 based indexing)
52969e99939fSJunchao Zhang .vb
52978a0b0e6bSVictor Minden         1 0 0
52988a0b0e6bSVictor Minden         2 0 3
52998a0b0e6bSVictor Minden         4 5 6
53008a0b0e6bSVictor Minden 
53018a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
53028a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
53038a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
53049e99939fSJunchao Zhang .ve
5305fe59aa6dSJacob Faibussowitsch 
53062ef1f0ffSBarry Smith   Note:
5307d7547e51SJunchao Zhang   Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5308d7547e51SJunchao Zhang   and are particularly useful in iterative applications.
53098a0b0e6bSVictor Minden 
53101cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
53118a0b0e6bSVictor Minden @*/
5312d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx)
5313d71ae5a4SJacob Faibussowitsch {
5314d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
53158a0b0e6bSVictor Minden 
53168a0b0e6bSVictor Minden   PetscFunctionBegin;
53179566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5318ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
53199566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
53209566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
53219566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
53229566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
53231230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
53241230e6d1SVictor Minden     if (idx) {
53251230e6d1SVictor Minden       row = i[ii] - 1;
53261230e6d1SVictor Minden       col = j[ii] - 1;
53271230e6d1SVictor Minden     } else {
53281230e6d1SVictor Minden       row = i[ii];
53291230e6d1SVictor Minden       col = j[ii];
53308a0b0e6bSVictor Minden     }
53319566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
53328a0b0e6bSVictor Minden   }
53339566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
53349566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
53359566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
53363ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53378a0b0e6bSVictor Minden }
533836db0b34SBarry Smith 
5339d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A)
5340d71ae5a4SJacob Faibussowitsch {
5341acf2f550SJed Brown   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
5342acf2f550SJed Brown 
5343acf2f550SJed Brown   PetscFunctionBegin;
5344acf2f550SJed Brown   a->idiagvalid  = PETSC_FALSE;
5345acf2f550SJed Brown   a->ibdiagvalid = PETSC_FALSE;
53462205254eSKarl Rupp 
53479566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A));
53483ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5349acf2f550SJed Brown }
5350acf2f550SJed Brown 
5351d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
5352d71ae5a4SJacob Faibussowitsch {
53539c8f2541SHong Zhang   PetscFunctionBegin;
53549566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
53553ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53569c8f2541SHong Zhang }
53579c8f2541SHong Zhang 
535881824310SBarry Smith /*
535953dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
536053dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
536153dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
536253dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
536353dd7562SDmitry Karpeev  */
5364d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5365d71ae5a4SJacob Faibussowitsch {
536653dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
536753dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
536853dd7562SDmitry Karpeev   PetscBool       seqaij;
536953dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
537053dd7562SDmitry Karpeev   PetscScalar     v;
537153dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
537253dd7562SDmitry Karpeev 
537353dd7562SDmitry Karpeev   PetscFunctionBegin;
53743ba16761SJacob Faibussowitsch   if (!B) PetscFunctionReturn(PETSC_SUCCESS);
537553dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
53769566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
537728b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
537853dd7562SDmitry Karpeev   if (rowemb) {
53799566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
538008401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
538153dd7562SDmitry Karpeev   } else {
538208401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
538353dd7562SDmitry Karpeev   }
538453dd7562SDmitry Karpeev   if (colemb) {
53859566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
538608401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
538753dd7562SDmitry Karpeev   } else {
538808401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
538953dd7562SDmitry Karpeev   }
539053dd7562SDmitry Karpeev 
5391f4f49eeaSPierre Jolivet   Baij = (Mat_SeqAIJ *)B->data;
539253dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
53939566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5394ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
53959566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
53969566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
539753dd7562SDmitry Karpeev   }
539848a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
539953dd7562SDmitry Karpeev   count      = 0;
540053dd7562SDmitry Karpeev   rowindices = NULL;
540153dd7562SDmitry Karpeev   colindices = NULL;
540248a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
540348a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
540453dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
540553dd7562SDmitry Karpeev     PetscInt row;
540653dd7562SDmitry Karpeev     row = i;
540753dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
540853dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
540953dd7562SDmitry Karpeev       PetscInt col;
541053dd7562SDmitry Karpeev       col = Baij->j[count];
541153dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
541253dd7562SDmitry Karpeev       v = Baij->a[count];
54139566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
541453dd7562SDmitry Karpeev       ++count;
541553dd7562SDmitry Karpeev     }
541653dd7562SDmitry Karpeev   }
541753dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
541853dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
541953dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
542053dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
542153dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
54223ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
542353dd7562SDmitry Karpeev }
542453dd7562SDmitry Karpeev 
542558c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep)
5426dec0b466SHong Zhang {
5427dec0b466SHong Zhang   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
5428dec0b466SHong Zhang   MatScalar  *aa = a->a;
5429dec0b466SHong Zhang   PetscInt    m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k;
5430dec0b466SHong Zhang   PetscInt   *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0;
5431dec0b466SHong Zhang 
5432dec0b466SHong Zhang   PetscFunctionBegin;
5433dec0b466SHong Zhang   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix");
5434dec0b466SHong Zhang   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
5435dec0b466SHong Zhang   for (i = 1; i <= m; i++) {
5436dec0b466SHong Zhang     /* move each nonzero entry back by the amount of zero slots (fshift) before it*/
5437dec0b466SHong Zhang     for (k = ai[i - 1]; k < ai[i]; k++) {
543858c11ad4SPierre Jolivet       if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++;
5439dec0b466SHong Zhang       else {
5440dec0b466SHong Zhang         if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1));
5441dec0b466SHong Zhang         aa[k - fshift] = aa[k];
5442dec0b466SHong Zhang         aj[k - fshift] = aj[k];
5443dec0b466SHong Zhang       }
5444dec0b466SHong Zhang     }
5445dec0b466SHong Zhang     ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration
5446dec0b466SHong Zhang     fshift_prev = fshift;
5447dec0b466SHong Zhang     /* reset ilen and imax for each row */
5448dec0b466SHong Zhang     ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1];
5449dec0b466SHong Zhang     a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0);
5450dec0b466SHong Zhang     rmax = PetscMax(rmax, ailen[i - 1]);
5451dec0b466SHong Zhang   }
5452312eded4SPierre Jolivet   if (fshift) {
5453dec0b466SHong Zhang     if (m) {
5454dec0b466SHong Zhang       ai[m] -= fshift;
5455dec0b466SHong Zhang       a->nz = ai[m];
5456dec0b466SHong Zhang     }
5457dec0b466SHong Zhang     PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz));
5458312eded4SPierre Jolivet     A->nonzerostate++;
5459dec0b466SHong Zhang     A->info.nz_unneeded += (PetscReal)fshift;
5460dec0b466SHong Zhang     a->rmax = rmax;
5461dec0b466SHong Zhang     if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A));
5462dec0b466SHong Zhang     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
5463dec0b466SHong Zhang     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
5464312eded4SPierre Jolivet   }
54653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5466dec0b466SHong Zhang }
5467dec0b466SHong Zhang 
54684099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
54694099cc6bSBarry Smith 
5470cc4c1da9SBarry Smith /*@
547111a5261eSBarry Smith   MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
54724099cc6bSBarry Smith 
5473c3339decSBarry Smith   Collective
54744099cc6bSBarry Smith 
54754099cc6bSBarry Smith   Input Parameters:
54764099cc6bSBarry Smith + mat    - the matrix object
54774099cc6bSBarry Smith - matype - matrix type
54784099cc6bSBarry Smith 
54794099cc6bSBarry Smith   Options Database Key:
54804e187271SRichard Tran Mills . -mat_seqaij_type  <method> - for example seqaijcrl
54814099cc6bSBarry Smith 
54824099cc6bSBarry Smith   Level: intermediate
54834099cc6bSBarry Smith 
5484fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`
54854099cc6bSBarry Smith @*/
5486d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5487d71ae5a4SJacob Faibussowitsch {
54884099cc6bSBarry Smith   PetscBool sametype;
54895f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
54904099cc6bSBarry Smith 
54914099cc6bSBarry Smith   PetscFunctionBegin;
54924099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
54939566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
54943ba16761SJacob Faibussowitsch   if (sametype) PetscFunctionReturn(PETSC_SUCCESS);
54954099cc6bSBarry Smith 
54969566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
54976adde796SStefano Zampini   PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
54989566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
54993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55004099cc6bSBarry Smith }
55014099cc6bSBarry Smith 
55024099cc6bSBarry Smith /*@C
550311a5261eSBarry Smith   MatSeqAIJRegister -  - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices
55044099cc6bSBarry Smith 
5505cc4c1da9SBarry Smith   Not Collective, No Fortran Support
55064099cc6bSBarry Smith 
55074099cc6bSBarry Smith   Input Parameters:
5508fe59aa6dSJacob Faibussowitsch + sname    - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
55094099cc6bSBarry Smith - function - routine to convert to subtype
55104099cc6bSBarry Smith 
55112ef1f0ffSBarry Smith   Level: advanced
55122ef1f0ffSBarry Smith 
55134099cc6bSBarry Smith   Notes:
551411a5261eSBarry Smith   `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers.
55154099cc6bSBarry Smith 
55164099cc6bSBarry Smith   Then, your matrix can be chosen with the procedural interface at runtime via the option
55174099cc6bSBarry Smith $     -mat_seqaij_type my_mat
55184099cc6bSBarry Smith 
55191cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()`
55204099cc6bSBarry Smith @*/
5521d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
5522d71ae5a4SJacob Faibussowitsch {
55234099cc6bSBarry Smith   PetscFunctionBegin;
55249566063dSJacob Faibussowitsch   PetscCall(MatInitializePackage());
55259566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
55263ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55274099cc6bSBarry Smith }
55284099cc6bSBarry Smith 
55294099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
55304099cc6bSBarry Smith 
55314099cc6bSBarry Smith /*@C
553211a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
55334099cc6bSBarry Smith 
55344099cc6bSBarry Smith   Not Collective
55354099cc6bSBarry Smith 
55364099cc6bSBarry Smith   Level: advanced
55374099cc6bSBarry Smith 
55382ef1f0ffSBarry Smith   Note:
55392ef1f0ffSBarry Smith   This registers the versions of `MATSEQAIJ` for GPUs
55402ef1f0ffSBarry Smith 
55411cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()`
55424099cc6bSBarry Smith @*/
5543d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5544d71ae5a4SJacob Faibussowitsch {
55454099cc6bSBarry Smith   PetscFunctionBegin;
55463ba16761SJacob Faibussowitsch   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS);
55474099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
55484099cc6bSBarry Smith 
55499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
55509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
55519566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
55529779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
55539566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5554485f9817SRichard Tran Mills #endif
55555063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
55569566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
55575063d097SStefano Zampini #endif
5558d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
5559d5e393b6SSuyash Tandon   PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
5560d5e393b6SSuyash Tandon #endif
55615063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
55629566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
55635063d097SStefano Zampini #endif
55644099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
55659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
55664099cc6bSBarry Smith #endif
55673ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55684099cc6bSBarry Smith }
556953dd7562SDmitry Karpeev 
/*
    Special version for direct calls from Fortran
*/
/* Select the external symbol name according to the Fortran name-mangling macros that are defined */
#if defined(PETSC_HAVE_FORTRAN_CAPS)
  #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
#elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
  #define matsetvaluesseqaij_ matsetvaluesseqaij
#endif

/*
   Change these macros so they can be used in a void function: on error they store the error code in
   *_ierr (a variable that must be in scope where they are expanded) and return without a value.
*/

/* Identical to PetscCallVoid, except it assigns to *_ierr */
#undef PetscCall
#define PetscCall(...) \
  do { \
    PetscErrorCode ierr_msv_seqaij = __VA_ARGS__; \
    if (PetscUnlikely(ierr_msv_seqaij)) { \
      *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_seqaij, PETSC_ERROR_REPEAT, " "); \
      return; \
    } \
  } while (0)

/* Raises a new error (PETSC_ERROR_INITIAL) and reports it through *_ierr */
#undef SETERRQ
#define SETERRQ(comm, ierr, ...) \
  do { \
    *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
    return; \
  } while (0)
559981824310SBarry Smith 
5600d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5601d71ae5a4SJacob Faibussowitsch {
560281824310SBarry Smith   Mat         A = *AA;
560381824310SBarry Smith   PetscInt    m = *mm, n = *nn;
560481824310SBarry Smith   InsertMode  is = *isis;
560581824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
560681824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
560781824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
560881824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
560954f21887SBarry Smith   MatScalar  *ap, value, *aa;
5610ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5611ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
561281824310SBarry Smith 
561381824310SBarry Smith   PetscFunctionBegin;
56144994cf47SJed Brown   MatCheckPreallocated(A, 1);
561581824310SBarry Smith   imax  = a->imax;
561681824310SBarry Smith   ai    = a->i;
561781824310SBarry Smith   ailen = a->ilen;
561881824310SBarry Smith   aj    = a->j;
561981824310SBarry Smith   aa    = a->a;
562081824310SBarry Smith 
562181824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
562281824310SBarry Smith     row = im[k];
562381824310SBarry Smith     if (row < 0) continue;
56245f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
56259371c9d4SSatish Balay     rp   = aj + ai[row];
56269371c9d4SSatish Balay     ap   = aa + ai[row];
56279371c9d4SSatish Balay     rmax = imax[row];
56289371c9d4SSatish Balay     nrow = ailen[row];
562981824310SBarry Smith     low  = 0;
563081824310SBarry Smith     high = nrow;
563181824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
563281824310SBarry Smith       if (in[l] < 0) continue;
56335f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
563481824310SBarry Smith       col = in[l];
56352205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
56362205254eSKarl Rupp       else value = v[k + l * m];
56372205254eSKarl Rupp 
563881824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
563981824310SBarry Smith 
56402205254eSKarl Rupp       if (col <= lastcol) low = 0;
56412205254eSKarl Rupp       else high = nrow;
564281824310SBarry Smith       lastcol = col;
564381824310SBarry Smith       while (high - low > 5) {
564481824310SBarry Smith         t = (low + high) / 2;
564581824310SBarry Smith         if (rp[t] > col) high = t;
564681824310SBarry Smith         else low = t;
564781824310SBarry Smith       }
564881824310SBarry Smith       for (i = low; i < high; i++) {
564981824310SBarry Smith         if (rp[i] > col) break;
565081824310SBarry Smith         if (rp[i] == col) {
565181824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
565281824310SBarry Smith           else ap[i] = value;
565381824310SBarry Smith           goto noinsert;
565481824310SBarry Smith         }
565581824310SBarry Smith       }
565681824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
565781824310SBarry Smith       if (nonew == 1) goto noinsert;
56585f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5659fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
56609371c9d4SSatish Balay       N = nrow++ - 1;
56619371c9d4SSatish Balay       a->nz++;
56629371c9d4SSatish Balay       high++;
566381824310SBarry Smith       /* shift up all the later entries in this row */
566481824310SBarry Smith       for (ii = N; ii >= i; ii--) {
566581824310SBarry Smith         rp[ii + 1] = rp[ii];
566681824310SBarry Smith         ap[ii + 1] = ap[ii];
566781824310SBarry Smith       }
566881824310SBarry Smith       rp[i] = col;
566981824310SBarry Smith       ap[i] = value;
567081824310SBarry Smith     noinsert:;
567181824310SBarry Smith       low = i + 1;
567281824310SBarry Smith     }
567381824310SBarry Smith     ailen[row] = nrow;
567481824310SBarry Smith   }
567581824310SBarry Smith   PetscFunctionReturnVoid();
567681824310SBarry Smith }
567798921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No
567898921bdaSJacob Faibussowitsch  * other PETSc functions should be defined past this point, as it is impossible to recover the
567998921bdaSJacob Faibussowitsch  * original definitions */
56809566063dSJacob Faibussowitsch #undef PetscCall
568198921bdaSJacob Faibussowitsch #undef SETERRQ
5682