xref: /petsc/src/mat/impls/aij/seq/aij.c (revision 5914357ec6ae0b2d581c0a9548ac0a3ec2123079)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
1226cec326SBarry Smith #define TYPE AIJ
1326cec326SBarry Smith #define TYPE_BS
1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
1626cec326SBarry Smith #undef TYPE
1726cec326SBarry Smith #undef TYPE_BS
1826cec326SBarry Smith 
19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
20d71ae5a4SJacob Faibussowitsch {
214099cc6bSBarry Smith   PetscBool flg;
224099cc6bSBarry Smith   char      type[256];
234099cc6bSBarry Smith 
244099cc6bSBarry Smith   PetscFunctionBegin;
25d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
269566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
279566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
28d0609cedSBarry Smith   PetscOptionsEnd();
293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
304099cc6bSBarry Smith }
314099cc6bSBarry Smith 
32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
33d71ae5a4SJacob Faibussowitsch {
340716a85fSBarry Smith   PetscInt    i, m, n;
350716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
360716a85fSBarry Smith 
370716a85fSBarry Smith   PetscFunctionBegin;
389566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
399566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
400716a85fSBarry Smith   if (type == NORM_2) {
41ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
420716a85fSBarry Smith   } else if (type == NORM_1) {
43ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
440716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
45ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
46857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
47ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
48857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
49ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
506adde796SStefano Zampini   } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type");
510716a85fSBarry Smith 
520716a85fSBarry Smith   if (type == NORM_2) {
53a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
54857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
55a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
560716a85fSBarry Smith   }
573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
580716a85fSBarry Smith }
590716a85fSBarry Smith 
60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
61d71ae5a4SJacob Faibussowitsch {
623a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
633a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
643a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
653a062f41SBarry Smith   PetscInt       *rows;
663a062f41SBarry Smith 
673a062f41SBarry Smith   PetscFunctionBegin;
683a062f41SBarry Smith   for (i = 0; i < m; i++) {
69ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
703a062f41SBarry Smith   }
719566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
723a062f41SBarry Smith   cnt = 0;
733a062f41SBarry Smith   for (i = 0; i < m; i++) {
743a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
753a062f41SBarry Smith       rows[cnt] = i;
763a062f41SBarry Smith       cnt++;
773a062f41SBarry Smith     }
783a062f41SBarry Smith   }
799566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
813a062f41SBarry Smith }
823a062f41SBarry Smith 
83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
84d71ae5a4SJacob Faibussowitsch {
856ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
86fff043a9SJunchao Zhang   const MatScalar *aa;
876ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
88b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
896ce1633cSBarry Smith   PetscInt        *rows;
906ce1633cSBarry Smith 
916ce1633cSBarry Smith   PetscFunctionBegin;
929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
939566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
946ce1633cSBarry Smith   diag = a->diag;
956ce1633cSBarry Smith   for (i = 0; i < m; i++) {
96ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
976ce1633cSBarry Smith   }
989566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
996ce1633cSBarry Smith   cnt = 0;
1006ce1633cSBarry Smith   for (i = 0; i < m; i++) {
101ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
1026ce1633cSBarry Smith   }
103f1f41ecbSJed Brown   *nrows = cnt;
104f1f41ecbSJed Brown   *zrows = rows;
1059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
107f1f41ecbSJed Brown }
108f1f41ecbSJed Brown 
109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
110d71ae5a4SJacob Faibussowitsch {
111f1f41ecbSJed Brown   PetscInt nrows, *rows;
112f1f41ecbSJed Brown 
113f1f41ecbSJed Brown   PetscFunctionBegin;
1140298fd71SBarry Smith   *zrows = NULL;
1159566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1169566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1186ce1633cSBarry Smith }
1196ce1633cSBarry Smith 
120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
121d71ae5a4SJacob Faibussowitsch {
122b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
123b3a44c85SBarry Smith   const MatScalar *aa;
124b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
125b3a44c85SBarry Smith   const PetscInt  *ii;
126b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
127b3a44c85SBarry Smith 
128b3a44c85SBarry Smith   PetscFunctionBegin;
1299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
130f4259b30SLisandro Dalcin   *keptrows = NULL;
131b3a44c85SBarry Smith   ii        = a->i;
132b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
133b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
134b3a44c85SBarry Smith     if (!n) {
135b3a44c85SBarry Smith       cnt++;
136b3a44c85SBarry Smith       goto ok1;
137b3a44c85SBarry Smith     }
1382e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
139b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
140b3a44c85SBarry Smith     }
141b3a44c85SBarry Smith     cnt++;
142b3a44c85SBarry Smith   ok1:;
143b3a44c85SBarry Smith   }
1442e5835c6SStefano Zampini   if (!cnt) {
1459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1463ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1472e5835c6SStefano Zampini   }
1489566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
149b3a44c85SBarry Smith   cnt = 0;
150b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
151b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
152b3a44c85SBarry Smith     if (!n) continue;
1532e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
154b3a44c85SBarry Smith       if (aa[j] != 0.0) {
155b3a44c85SBarry Smith         rows[cnt++] = i;
156b3a44c85SBarry Smith         break;
157b3a44c85SBarry Smith       }
158b3a44c85SBarry Smith     }
159b3a44c85SBarry Smith   }
1609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1619566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
1623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
163b3a44c85SBarry Smith }
164b3a44c85SBarry Smith 
165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
166d71ae5a4SJacob Faibussowitsch {
16779299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)Y->data;
16899e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16999e65526SBarry Smith   const PetscInt    *diag;
1702e5835c6SStefano Zampini   MatScalar         *aa;
17199e65526SBarry Smith   const PetscScalar *v;
172ace3abfcSBarry Smith   PetscBool          missing;
17379299369SBarry Smith 
17479299369SBarry Smith   PetscFunctionBegin;
17509f38230SBarry Smith   if (Y->assembled) {
1769566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL));
17709f38230SBarry Smith     if (!missing) {
17879299369SBarry Smith       diag = aij->diag;
1799566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1809566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
18179299369SBarry Smith       if (is == INSERT_VALUES) {
182ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
18379299369SBarry Smith       } else {
184ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
18579299369SBarry Smith       }
1869566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1879566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
1883ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
18979299369SBarry Smith     }
1909566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
19109f38230SBarry Smith   }
1929566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
1933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
19409f38230SBarry Smith }
19579299369SBarry Smith 
196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
197d71ae5a4SJacob Faibussowitsch {
198416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19997f1f81fSBarry Smith   PetscInt    i, ishift;
20017ab2063SBarry Smith 
2013a40ed3dSBarry Smith   PetscFunctionBegin;
202f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
2033ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
204bfeeae90SHong Zhang   ishift = 0;
205b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
2069566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
207bfeeae90SHong Zhang   } else if (oshift == 1) {
2081a83f524SJed Brown     PetscInt *tia;
209d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2103b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2119566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2121a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2131a83f524SJed Brown     *ia = tia;
214ecc77c7aSBarry Smith     if (ja) {
2151a83f524SJed Brown       PetscInt *tja;
2169566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2171a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2181a83f524SJed Brown       *ja = tja;
219ecc77c7aSBarry Smith     }
2206945ee14SBarry Smith   } else {
221ecc77c7aSBarry Smith     *ia = a->i;
222ecc77c7aSBarry Smith     if (ja) *ja = a->j;
223a2ce50c7SBarry Smith   }
2243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225a2744918SBarry Smith }
226a2744918SBarry Smith 
227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
228d71ae5a4SJacob Faibussowitsch {
2293a40ed3dSBarry Smith   PetscFunctionBegin;
2303ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
231b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2329566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2339566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
234bcd2baecSBarry Smith   }
2353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23617ab2063SBarry Smith }
23717ab2063SBarry Smith 
238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
239d71ae5a4SJacob Faibussowitsch {
2403b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
241d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
24297f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2433b2fbd54SBarry Smith 
2443a40ed3dSBarry Smith   PetscFunctionBegin;
245899cda47SBarry Smith   *nn = n;
2463ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2473b2fbd54SBarry Smith   if (symmetric) {
2489566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2493b2fbd54SBarry Smith   } else {
2509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2533b2fbd54SBarry Smith     jj = a->j;
254ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2553b2fbd54SBarry Smith     cia[0] = oshift;
256ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2579566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2583b2fbd54SBarry Smith     jj = a->j;
259a93ec695SBarry Smith     for (row = 0; row < m; row++) {
260a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
261a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
262bfeeae90SHong Zhang         col = *jj++;
2632205254eSKarl Rupp 
2643b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2653b2fbd54SBarry Smith       }
2663b2fbd54SBarry Smith     }
2679566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2689371c9d4SSatish Balay     *ia = cia;
2699371c9d4SSatish Balay     *ja = cja;
2703b2fbd54SBarry Smith   }
2713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2723b2fbd54SBarry Smith }
2733b2fbd54SBarry Smith 
274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
275d71ae5a4SJacob Faibussowitsch {
2763a40ed3dSBarry Smith   PetscFunctionBegin;
2773ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2783b2fbd54SBarry Smith 
2799566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2809566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2823b2fbd54SBarry Smith }
2833b2fbd54SBarry Smith 
2847cee066cSHong Zhang /*
2857cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2867cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
287040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2887cee066cSHong Zhang */
289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
290d71ae5a4SJacob Faibussowitsch {
2917cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2927cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
293071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2947cee066cSHong Zhang   PetscInt       *cspidx;
295071fcb05SBarry Smith   const PetscInt *jj;
2967cee066cSHong Zhang 
2977cee066cSHong Zhang   PetscFunctionBegin;
2987cee066cSHong Zhang   *nn = n;
2993ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
300625f6d37SHong Zhang 
3019566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
3029566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
3039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
3049566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
3057cee066cSHong Zhang   jj = a->j;
306ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
3077cee066cSHong Zhang   cia[0] = oshift;
308ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3099566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3107cee066cSHong Zhang   jj = a->j;
3117cee066cSHong Zhang   for (row = 0; row < m; row++) {
3127cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3137cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3147cee066cSHong Zhang       col         = *jj++;
315071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
316071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
317071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3187cee066cSHong Zhang     }
3197cee066cSHong Zhang   }
3209566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
321071fcb05SBarry Smith   *ia    = cia;
322071fcb05SBarry Smith   *ja    = cja;
3237cee066cSHong Zhang   *spidx = cspidx;
3243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3257cee066cSHong Zhang }
3267cee066cSHong Zhang 
327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
328d71ae5a4SJacob Faibussowitsch {
3297cee066cSHong Zhang   PetscFunctionBegin;
3309566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3319566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3337cee066cSHong Zhang }
3347cee066cSHong Zhang 
335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
336d71ae5a4SJacob Faibussowitsch {
33787d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33887d4246cSBarry Smith   PetscInt    *ai = a->i;
339fff043a9SJunchao Zhang   PetscScalar *aa;
34087d4246cSBarry Smith 
34187d4246cSBarry Smith   PetscFunctionBegin;
3429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3439566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34687d4246cSBarry Smith }
34787d4246cSBarry Smith 
348bd04181cSBarry Smith /*
349bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
350bd04181cSBarry Smith 
351bd04181cSBarry Smith       -   a single row of values is set with each call
352bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
353bd04181cSBarry Smith       -   the values are always added to the matrix, not set
354bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
355bd04181cSBarry Smith 
3561f763a69SBarry Smith      This does NOT assume the global column indices are sorted
357bd04181cSBarry Smith 
3581f763a69SBarry Smith */
359bd04181cSBarry Smith 
360af0996ceSBarry Smith #include <petsc/private/isimpl.h>
361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
362d71ae5a4SJacob Faibussowitsch {
363189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3641f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3651f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3661f763a69SBarry Smith   PetscInt        lastcol = -1;
367fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
368189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
369189e4007SBarry Smith 
370fff043a9SJunchao Zhang   PetscFunctionBegin;
3719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
372f38dd0b8SBarry Smith   row  = ridx[im[0]];
3731f763a69SBarry Smith   rp   = aj + ai[row];
3741f763a69SBarry Smith   ap   = aa + ai[row];
3751f763a69SBarry Smith   nrow = ailen[row];
376189e4007SBarry Smith   low  = 0;
377189e4007SBarry Smith   high = nrow;
378189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
379189e4007SBarry Smith     col   = cidx[in[l]];
380f38dd0b8SBarry Smith     value = v[l];
381189e4007SBarry Smith 
382189e4007SBarry Smith     if (col <= lastcol) low = 0;
383189e4007SBarry Smith     else high = nrow;
384189e4007SBarry Smith     lastcol = col;
385189e4007SBarry Smith     while (high - low > 5) {
386189e4007SBarry Smith       t = (low + high) / 2;
387189e4007SBarry Smith       if (rp[t] > col) high = t;
388189e4007SBarry Smith       else low = t;
389189e4007SBarry Smith     }
390189e4007SBarry Smith     for (i = low; i < high; i++) {
391189e4007SBarry Smith       if (rp[i] == col) {
3921f763a69SBarry Smith         ap[i] += value;
393189e4007SBarry Smith         low = i + 1;
3941f763a69SBarry Smith         break;
395189e4007SBarry Smith       }
396189e4007SBarry Smith     }
397189e4007SBarry Smith   }
3989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3993ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
400189e4007SBarry Smith }
401189e4007SBarry Smith 
402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
403d71ae5a4SJacob Faibussowitsch {
404416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
405e2ee6c50SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
40697f1f81fSBarry Smith   PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
407e2ee6c50SBarry Smith   PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1;
408ce496241SStefano Zampini   MatScalar  *ap = NULL, value = 0.0, *aa;
409ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
410ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
41117ab2063SBarry Smith 
4123a40ed3dSBarry Smith   PetscFunctionBegin;
4139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
41417ab2063SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
415416022c9SBarry Smith     row = im[k];
4165ef9f2a5SBarry Smith     if (row < 0) continue;
4176bdcaf15SBarry Smith     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
4188e3a54c0SPierre Jolivet     rp = PetscSafePointerPlusOffset(aj, ai[row]);
4198e3a54c0SPierre Jolivet     if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]);
4209371c9d4SSatish Balay     rmax = imax[row];
4219371c9d4SSatish Balay     nrow = ailen[row];
422416022c9SBarry Smith     low  = 0;
423c71e6ed7SBarry Smith     high = nrow;
42417ab2063SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
4255ef9f2a5SBarry Smith       if (in[l] < 0) continue;
4266bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
427bfeeae90SHong Zhang       col = in[l];
428071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
429071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
43036db0b34SBarry Smith 
4312205254eSKarl Rupp       if (col <= lastcol) low = 0;
4322205254eSKarl Rupp       else high = nrow;
433e2ee6c50SBarry Smith       lastcol = col;
434416022c9SBarry Smith       while (high - low > 5) {
435416022c9SBarry Smith         t = (low + high) / 2;
436416022c9SBarry Smith         if (rp[t] > col) high = t;
437416022c9SBarry Smith         else low = t;
43817ab2063SBarry Smith       }
439416022c9SBarry Smith       for (i = low; i < high; i++) {
44017ab2063SBarry Smith         if (rp[i] > col) break;
44117ab2063SBarry Smith         if (rp[i] == col) {
442876c6284SHong Zhang           if (!A->structure_only) {
4430c0d7e18SFande Kong             if (is == ADD_VALUES) {
4440c0d7e18SFande Kong               ap[i] += value;
4450c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4469371c9d4SSatish Balay             } else ap[i] = value;
447720833daSHong Zhang           }
448e44c0bd4SBarry Smith           low = i + 1;
44917ab2063SBarry Smith           goto noinsert;
45017ab2063SBarry Smith         }
45117ab2063SBarry Smith       }
452dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
453c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
45408401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
455720833daSHong Zhang       if (A->structure_only) {
456876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
457720833daSHong Zhang       } else {
458fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
459720833daSHong Zhang       }
4609371c9d4SSatish Balay       N = nrow++ - 1;
4619371c9d4SSatish Balay       a->nz++;
4629371c9d4SSatish Balay       high++;
463416022c9SBarry Smith       /* shift up all the later entries in this row */
4649566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
46517ab2063SBarry Smith       rp[i] = col;
466580bdb30SBarry Smith       if (!A->structure_only) {
4679566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
468580bdb30SBarry Smith         ap[i] = value;
469580bdb30SBarry Smith       }
470416022c9SBarry Smith       low = i + 1;
471e44c0bd4SBarry Smith     noinsert:;
47217ab2063SBarry Smith     }
47317ab2063SBarry Smith     ailen[row] = nrow;
47417ab2063SBarry Smith   }
4759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
4763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
47717ab2063SBarry Smith }
47817ab2063SBarry Smith 
479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
480d71ae5a4SJacob Faibussowitsch {
48119b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
48219b08ed1SBarry Smith   PetscInt   *rp, k, row;
48319b08ed1SBarry Smith   PetscInt   *ai = a->i;
48419b08ed1SBarry Smith   PetscInt   *aj = a->j;
485fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
48619b08ed1SBarry Smith 
48719b08ed1SBarry Smith   PetscFunctionBegin;
48828b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
48908401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
490fff043a9SJunchao Zhang 
4919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
49219b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
49319b08ed1SBarry Smith     row = im[k];
49419b08ed1SBarry Smith     rp  = aj + ai[row];
4958e3a54c0SPierre Jolivet     ap  = PetscSafePointerPlusOffset(aa, ai[row]);
49619b08ed1SBarry Smith 
4979566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
49819b08ed1SBarry Smith     if (!A->structure_only) {
49919b08ed1SBarry Smith       if (v) {
5009566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
50119b08ed1SBarry Smith         v += n;
50219b08ed1SBarry Smith       } else {
5039566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
50419b08ed1SBarry Smith       }
50519b08ed1SBarry Smith     }
50619b08ed1SBarry Smith     a->ilen[row]  = n;
50719b08ed1SBarry Smith     a->imax[row]  = n;
50819b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
50919b08ed1SBarry Smith     a->nz += n;
51019b08ed1SBarry Smith   }
5119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51319b08ed1SBarry Smith }
51419b08ed1SBarry Smith 
51519b08ed1SBarry Smith /*@
51619b08ed1SBarry Smith   MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51719b08ed1SBarry Smith 
51819b08ed1SBarry Smith   Input Parameters:
51911a5261eSBarry Smith + A       - the `MATSEQAIJ` matrix
52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros
52119b08ed1SBarry Smith 
52219b08ed1SBarry Smith   Level: advanced
52319b08ed1SBarry Smith 
52419b08ed1SBarry Smith   Notes:
52519b08ed1SBarry Smith   This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
52611a5261eSBarry Smith   Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52719b08ed1SBarry Smith   as always with multiple matrix assemblies.
52819b08ed1SBarry Smith 
5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
53019b08ed1SBarry Smith @*/
531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
532d71ae5a4SJacob Faibussowitsch {
53319b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
53419b08ed1SBarry Smith 
53519b08ed1SBarry Smith   PetscFunctionBegin;
5369566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5379566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
53819b08ed1SBarry Smith   a->maxnz = nztotal;
5394dfa11a4SJacob Faibussowitsch   if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); }
54019b08ed1SBarry Smith   if (!a->ilen) {
5419566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
54219b08ed1SBarry Smith   } else {
5439566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
54419b08ed1SBarry Smith   }
54519b08ed1SBarry Smith 
54619b08ed1SBarry Smith   /* allocate the matrix space */
54719b08ed1SBarry Smith   if (A->structure_only) {
5489566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nztotal, &a->j));
5499566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i));
55019b08ed1SBarry Smith   } else {
5519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i));
55219b08ed1SBarry Smith   }
55319b08ed1SBarry Smith   a->i[0] = 0;
55419b08ed1SBarry Smith   if (A->structure_only) {
55519b08ed1SBarry Smith     a->singlemalloc = PETSC_FALSE;
55619b08ed1SBarry Smith     a->free_a       = PETSC_FALSE;
55719b08ed1SBarry Smith   } else {
55819b08ed1SBarry Smith     a->singlemalloc = PETSC_TRUE;
55919b08ed1SBarry Smith     a->free_a       = PETSC_TRUE;
56019b08ed1SBarry Smith   }
56119b08ed1SBarry Smith   a->free_ij        = PETSC_TRUE;
56219b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
56319b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
5643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
56519b08ed1SBarry Smith }
56619b08ed1SBarry Smith 
567ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
568d71ae5a4SJacob Faibussowitsch {
569071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
570071fcb05SBarry Smith   PetscInt   *rp, k, row;
571071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
572071fcb05SBarry Smith   PetscInt   *aj = a->j;
573fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
574071fcb05SBarry Smith 
575071fcb05SBarry Smith   PetscFunctionBegin;
5769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
577071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
578071fcb05SBarry Smith     row = im[k];
5796bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
580071fcb05SBarry Smith     rp = aj + ai[row];
581071fcb05SBarry Smith     ap = aa + ai[row];
58248a46eb9SPierre Jolivet     if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
583071fcb05SBarry Smith     if (!A->structure_only) {
584071fcb05SBarry Smith       if (v) {
5859566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
586071fcb05SBarry Smith         v += n;
587071fcb05SBarry Smith       } else {
5889566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
589071fcb05SBarry Smith       }
590071fcb05SBarry Smith     }
591071fcb05SBarry Smith     ailen[row] = n;
592071fcb05SBarry Smith     a->nz += n;
593071fcb05SBarry Smith   }
5949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5953ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
596071fcb05SBarry Smith }
597071fcb05SBarry Smith 
598ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
599d71ae5a4SJacob Faibussowitsch {
6007eb43aa7SLois Curfman McInnes   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
60197f1f81fSBarry Smith   PetscInt        *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
60297f1f81fSBarry Smith   PetscInt        *ai = a->i, *ailen = a->ilen;
6034e208921SJed Brown   const MatScalar *ap, *aa;
6047eb43aa7SLois Curfman McInnes 
6053a40ed3dSBarry Smith   PetscFunctionBegin;
6064e208921SJed Brown   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
6077eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6087eb43aa7SLois Curfman McInnes     row = im[k];
6099371c9d4SSatish Balay     if (row < 0) {
6109371c9d4SSatish Balay       v += n;
6119371c9d4SSatish Balay       continue;
6129371c9d4SSatish Balay     } /* negative row */
61354c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6148e3a54c0SPierre Jolivet     rp   = PetscSafePointerPlusOffset(aj, ai[row]);
6158e3a54c0SPierre Jolivet     ap   = PetscSafePointerPlusOffset(aa, ai[row]);
6167eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6177eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6189371c9d4SSatish Balay       if (in[l] < 0) {
6199371c9d4SSatish Balay         v++;
6209371c9d4SSatish Balay         continue;
6219371c9d4SSatish Balay       } /* negative column */
62254c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
623bfeeae90SHong Zhang       col  = in[l];
6249371c9d4SSatish Balay       high = nrow;
6259371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6267eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6277eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6287eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6297eb43aa7SLois Curfman McInnes         else low = t;
6307eb43aa7SLois Curfman McInnes       }
6317eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6327eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6337eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
634b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6357eb43aa7SLois Curfman McInnes           goto finished;
6367eb43aa7SLois Curfman McInnes         }
6377eb43aa7SLois Curfman McInnes       }
63897e567efSBarry Smith       *v++ = 0.0;
6397eb43aa7SLois Curfman McInnes     finished:;
6407eb43aa7SLois Curfman McInnes     }
6417eb43aa7SLois Curfman McInnes   }
6424e208921SJed Brown   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
6433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6447eb43aa7SLois Curfman McInnes }
6457eb43aa7SLois Curfman McInnes 
646ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
647d71ae5a4SJacob Faibussowitsch {
6483ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
649c898d852SStefano Zampini   const PetscScalar *av;
6503ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6513ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
65217ab2063SBarry Smith 
6533a40ed3dSBarry Smith   PetscFunctionBegin;
6549566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6552205254eSKarl Rupp 
6563ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6573ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6583ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6593ea6fe3dSLisandro Dalcin   nz = A->nz;
660416022c9SBarry Smith 
6613ea6fe3dSLisandro Dalcin   /* write matrix header */
6623ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6639371c9d4SSatish Balay   header[1] = M;
6649371c9d4SSatish Balay   header[2] = N;
6659371c9d4SSatish Balay   header[3] = nz;
6669566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
667416022c9SBarry Smith 
6683ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6699566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6703ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
6719566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6729566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6733ea6fe3dSLisandro Dalcin   /* store column indices */
6749566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
675416022c9SBarry Smith   /* store nonzero values */
6769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6779566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
679b37d52dbSMark F. Adams 
6803ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6819566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
68317ab2063SBarry Smith }
684416022c9SBarry Smith 
685d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
686d71ae5a4SJacob Faibussowitsch {
6877dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6887dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6897dc0baabSHong Zhang 
6907dc0baabSHong Zhang   PetscFunctionBegin;
6919566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6927dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6939566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
69448a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6959566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6967dc0baabSHong Zhang   }
6979566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
6983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6997dc0baabSHong Zhang }
7007dc0baabSHong Zhang 
70109573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer);
702cd155464SBarry Smith 
/*
  MatView_SeqAIJ_ASCII - Prints a SeqAIJ matrix to an ASCII viewer in the layout selected by the viewer's format.

  Input Parameters:
+ A      - the matrix; A->data is interpreted as Mat_SeqAIJ
- viewer - the viewer to print to

  Notes:
  Structure-only matrices are handed to MatView_SeqAIJ_ASCII_structonly(). Nothing is printed for the formats
  PETSC_VIEWER_ASCII_FACTOR_INFO, PETSC_VIEWER_ASCII_INFO and PETSC_VIEWER_ASCII_INFO_DETAIL.

  The formats handled explicitly are PETSC_VIEWER_ASCII_MATLAB, PETSC_VIEWER_ASCII_COMMON, PETSC_VIEWER_ASCII_SYMMODU,
  PETSC_VIEWER_ASCII_DENSE and PETSC_VIEWER_ASCII_MATRIXMARKET; every other format prints each row as a list of
  (column, value) pairs. Every branch disables viewer tabs while printing and re-enables them afterwards, and the
  viewer is flushed before returning.
*/
703ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
704d71ae5a4SJacob Faibussowitsch {
705416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
706c898d852SStefano Zampini   const PetscScalar *av;
70760e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
708e060cb09SBarry Smith   const char        *name;
709f3ef73ceSBarry Smith   PetscViewerFormat  format;
71017ab2063SBarry Smith 
7113a40ed3dSBarry Smith   PetscFunctionBegin;
  /* no values to show: print the nonzero pattern only */
7127dc0baabSHong Zhang   if (A->structure_only) {
7139566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7143ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
7157dc0baabSHong Zhang   }
71643e49210SHong Zhang 
7179566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
  /* the info-style formats produce no output from this routine */
7183ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
7192e5835c6SStefano Zampini 
  /* av itself is not used afterwards; the code below reads the values through a->a */
720c898d852SStefano Zampini   /* trigger copy to CPU if needed */
7219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7229566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
  /* MATLAB: emit a triplet array "zzz" with 1-based indices, then "<name> = spconvert(zzz)" */
72371c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
72497f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
    /* true when the last row is empty or the last stored entry is not in the last column */
72560e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
726c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
727d00d2cf4SBarry Smith       nofinalvalue = 1;
728d00d2cf4SBarry Smith     }
7299566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7309566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7319566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
    /* complex builds need four columns (row, column, real part, imaginary part), real builds three */
732fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7339566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
734fbfe6fa7SJed Brown #else
7359566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
736fbfe6fa7SJed Brown #endif
7379566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
73817ab2063SBarry Smith 
73917ab2063SBarry Smith     for (i = 0; i < m; i++) {
74060e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
741aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7429566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
74317ab2063SBarry Smith #else
7449566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
74517ab2063SBarry Smith #endif
74617ab2063SBarry Smith       }
74717ab2063SBarry Smith     }
    /* explicit zero at position (m, number of columns) */
748d00d2cf4SBarry Smith     if (nofinalvalue) {
749c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7509566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
751c337ccceSJed Brown #else
7529566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
753c337ccceSJed Brown #endif
754d00d2cf4SBarry Smith     }
7559566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7569566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7579566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  /* COMMON: one line per row; in real builds zero values are omitted, in complex builds entries whose real part is zero are omitted */
758fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
7599566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
76044cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7619566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
76260e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
763aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
76436db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7659566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76636db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7679566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
76836db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7699566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7706831982aSBarry Smith         }
77144cd7ae7SLois Curfman McInnes #else
7729566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
77344cd7ae7SLois Curfman McInnes #endif
77444cd7ae7SLois Curfman McInnes       }
7759566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77644cd7ae7SLois Curfman McInnes     }
7779566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  /* SYMMODU: only entries with column >= row are considered; output is a size line, 1-based row pointers, 1-based column indices, then values */
778fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
77997f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7809566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7819566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
    /* sptr[i] is the 1-based running count of nonzero entries with column >= row found before row i */
782496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
783496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
78460e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
785496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
786aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78736db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
788496be53dSLois Curfman McInnes #else
789496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
790496be53dSLois Curfman McInnes #endif
791496be53dSLois Curfman McInnes         }
792496be53dSLois Curfman McInnes       }
793496be53dSLois Curfman McInnes     }
7942e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7959566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
    /* print the m + 1 entries of sptr, at most six per line; the branch taken depends on how many entries remain */
7962e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7972205254eSKarl Rupp       if (i + 4 < m) {
7989566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
7992205254eSKarl Rupp       } else if (i + 3 < m) {
8009566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
8012205254eSKarl Rupp       } else if (i + 2 < m) {
8029566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
8032205254eSKarl Rupp       } else if (i + 1 < m) {
8049566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
8052205254eSKarl Rupp       } else if (i < m) {
8069566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8072205254eSKarl Rupp       } else {
8089566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8092205254eSKarl Rupp       }
810496be53dSLois Curfman McInnes     }
8119566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8129566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
    /* column indices (shifted by fshift) of every stored entry with column >= row; NOTE(review): unlike the count above and the values below, zero-valued entries are not filtered out here */
813496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81460e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8159566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
816496be53dSLois Curfman McInnes       }
8179566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
818496be53dSLois Curfman McInnes     }
8199566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
    /* values of the nonzero entries with column >= row */
820496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
82160e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
822496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
823aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
82448a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
825496be53dSLois Curfman McInnes #else
8269566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
827496be53dSLois Curfman McInnes #endif
828496be53dSLois Curfman McInnes         }
829496be53dSLois Curfman McInnes       }
8309566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
831496be53dSLois Curfman McInnes     }
8329566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  /* DENSE: print every position of every row, using 0.0 where no entry is stored */
833fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
    /* cnt walks the stored entries of the whole matrix; jcnt counts the entries consumed in the current row */
83497f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
83587828ca2SBarry Smith     PetscScalar value;
83668f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83768f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
83868f1ed48SBarry Smith 
    /* imaginary parts are printed only if at least one stored value has a nonzero imaginary part */
83968f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
84068f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
84168f1ed48SBarry Smith         realonly = PETSC_FALSE;
84268f1ed48SBarry Smith         break;
84368f1ed48SBarry Smith       }
84468f1ed48SBarry Smith     }
84568f1ed48SBarry Smith #endif
84602594712SBarry Smith 
8479566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
84802594712SBarry Smith     for (i = 0; i < m; i++) {
84902594712SBarry Smith       jcnt = 0;
850d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
        /* NOTE(review): the match against a->j[cnt] presumably relies on ascending column indices within each row - confirm */
851e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
85202594712SBarry Smith           value = a->a[cnt++];
853e24b481bSBarry Smith           jcnt++;
85402594712SBarry Smith         } else {
85502594712SBarry Smith           value = 0.0;
85602594712SBarry Smith         }
857aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
85868f1ed48SBarry Smith         if (realonly) {
8599566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
86068f1ed48SBarry Smith         } else {
8619566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
86268f1ed48SBarry Smith         }
86302594712SBarry Smith #else
8649566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
86502594712SBarry Smith #endif
86602594712SBarry Smith       }
8679566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
86802594712SBarry Smith     }
8699566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  /* MATRIXMARKET: banner line, a "rows columns nonzeros" line, then one 1-based coordinate entry per stored value */
8703c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
871150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8729566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8733c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8749566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8753c215bfdSMatthew Knepley #else
8769566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8773c215bfdSMatthew Knepley #endif
8789566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8793c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
88060e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8813c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8829566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8833c215bfdSMatthew Knepley #else
8849566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8853c215bfdSMatthew Knepley #endif
8863c215bfdSMatthew Knepley       }
8873c215bfdSMatthew Knepley     }
8889566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
  /* any other format: one line per row listing (column, value) pairs with 0-based column indices */
8893a40ed3dSBarry Smith   } else {
8909566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
    /* factored matrices: each row is printed in three pieces located through a->i and a->diag */
891d5f3da31SBarry Smith     if (A->factortype) {
89216cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8939566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
89416cd7e1dSShri Abhyankar         /* L part */
89560e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
89716cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
8989566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
89916cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9009566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
90116cd7e1dSShri Abhyankar           } else {
9029566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
90316cd7e1dSShri Abhyankar           }
90416cd7e1dSShri Abhyankar #else
9059566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90616cd7e1dSShri Abhyankar #endif
90716cd7e1dSShri Abhyankar         }
        /* the reciprocal of the stored value is printed; NOTE(review): presumably the factor stores the inverted diagonal - confirm */
90816cd7e1dSShri Abhyankar         /* diagonal */
90916cd7e1dSShri Abhyankar         j = a->diag[i];
91016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
91116cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
9129566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j])));
91316cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9149566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j]))));
91516cd7e1dSShri Abhyankar         } else {
9169566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j])));
91716cd7e1dSShri Abhyankar         }
91816cd7e1dSShri Abhyankar #else
9199566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j])));
92016cd7e1dSShri Abhyankar #endif
92116cd7e1dSShri Abhyankar 
        /* entries strictly between a->diag[i + 1] and a->diag[i] */
92216cd7e1dSShri Abhyankar         /* U part */
92360e0710aSBarry Smith         for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
92416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
92516cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9269566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
92716cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9289566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
92916cd7e1dSShri Abhyankar           } else {
9309566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
93116cd7e1dSShri Abhyankar           }
93216cd7e1dSShri Abhyankar #else
9339566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
93416cd7e1dSShri Abhyankar #endif
93516cd7e1dSShri Abhyankar         }
9369566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
93716cd7e1dSShri Abhyankar       }
    /* unfactored matrices: print every stored entry of every row, zeros included */
93816cd7e1dSShri Abhyankar     } else {
93917ab2063SBarry Smith       for (i = 0; i < m; i++) {
9409566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
94160e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
942aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
94336db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9449566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
94536db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9469566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9473a40ed3dSBarry Smith           } else {
9489566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
94917ab2063SBarry Smith           }
95017ab2063SBarry Smith #else
9519566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
95217ab2063SBarry Smith #endif
95317ab2063SBarry Smith         }
9549566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
95517ab2063SBarry Smith       }
95616cd7e1dSShri Abhyankar     }
9579566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
95817ab2063SBarry Smith   }
9599566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
961416022c9SBarry Smith }
962416022c9SBarry Smith 
9639804daf3SBarry Smith #include <petscdraw.h>
964ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
965d71ae5a4SJacob Faibussowitsch {
966480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
967416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
968383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
969383922c3SLisandro Dalcin   int                color;
970b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
971b0a32e0cSBarry Smith   PetscViewer        viewer;
972f3ef73ceSBarry Smith   PetscViewerFormat  format;
973fff043a9SJunchao Zhang   const PetscScalar *aa;
974cddf8d76SBarry Smith 
9753a40ed3dSBarry Smith   PetscFunctionBegin;
9769566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9779566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9789566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
979383922c3SLisandro Dalcin 
980416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
982fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
983d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9840513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
985b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
986416022c9SBarry Smith     for (i = 0; i < m; i++) {
9879371c9d4SSatish Balay       y_l = m - i - 1.0;
9889371c9d4SSatish Balay       y_r = y_l + 1.0;
989bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9909371c9d4SSatish Balay         x_l = a->j[j];
9919371c9d4SSatish Balay         x_r = x_l + 1.0;
992fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9939566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
994cddf8d76SBarry Smith       }
995cddf8d76SBarry Smith     }
996b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
997cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
9989371c9d4SSatish Balay       y_l = m - i - 1.0;
9999371c9d4SSatish Balay       y_r = y_l + 1.0;
1000bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10019371c9d4SSatish Balay         x_l = a->j[j];
10029371c9d4SSatish Balay         x_r = x_l + 1.0;
1003fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
10049566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1005cddf8d76SBarry Smith       }
1006cddf8d76SBarry Smith     }
1007b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1008cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10099371c9d4SSatish Balay       y_l = m - i - 1.0;
10109371c9d4SSatish Balay       y_r = y_l + 1.0;
1011bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10129371c9d4SSatish Balay         x_l = a->j[j];
10139371c9d4SSatish Balay         x_r = x_l + 1.0;
1014fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10159566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1016416022c9SBarry Smith       }
1017416022c9SBarry Smith     }
1018d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10190513a670SBarry Smith   } else {
10200513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10210513a670SBarry Smith     /* first determine max of all nonzero values */
1022b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1023383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1024b0a32e0cSBarry Smith     PetscDraw popup;
10250513a670SBarry Smith 
10260513a670SBarry Smith     for (i = 0; i < nz; i++) {
1027fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10280513a670SBarry Smith     }
1029383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10309566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10319566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1032383922c3SLisandro Dalcin 
1033d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10340513a670SBarry Smith     for (i = 0; i < m; i++) {
1035383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1036383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1037bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1038383922c3SLisandro Dalcin         x_l   = a->j[j];
1039383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1040fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10419566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10420513a670SBarry Smith         count++;
10430513a670SBarry Smith       }
10440513a670SBarry Smith     }
1045d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10460513a670SBarry Smith   }
10479566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
10483ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1049480ef9eaSBarry Smith }
1050cddf8d76SBarry Smith 
10519804daf3SBarry Smith #include <petscdraw.h>
1052ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1053d71ae5a4SJacob Faibussowitsch {
1054b0a32e0cSBarry Smith   PetscDraw draw;
105536db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1056ace3abfcSBarry Smith   PetscBool isnull;
1057480ef9eaSBarry Smith 
1058480ef9eaSBarry Smith   PetscFunctionBegin;
10599566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10609566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
10613ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
1062480ef9eaSBarry Smith 
10639371c9d4SSatish Balay   xr = A->cmap->n;
10649371c9d4SSatish Balay   yr = A->rmap->n;
10659371c9d4SSatish Balay   h  = yr / 10.0;
10669371c9d4SSatish Balay   w  = xr / 10.0;
10679371c9d4SSatish Balay   xr += w;
10689371c9d4SSatish Balay   yr += h;
10699371c9d4SSatish Balay   xl = -w;
10709371c9d4SSatish Balay   yl = -h;
10719566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10729566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10739566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10749566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10759566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1077416022c9SBarry Smith }
1078416022c9SBarry Smith 
1079d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1080d71ae5a4SJacob Faibussowitsch {
1081ace3abfcSBarry Smith   PetscBool iascii, isbinary, isdraw;
1082416022c9SBarry Smith 
10833a40ed3dSBarry Smith   PetscFunctionBegin;
10849566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii));
10859566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10869566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10871baa6e33SBarry Smith   if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10881baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10891baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10909566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
109217ab2063SBarry Smith }
109319bcc07fSBarry Smith 
1094d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1095d71ae5a4SJacob Faibussowitsch {
1096416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1097580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
1098bc43efbbSJunchao Zhang   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n;
109954f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
11003447b6efSHong Zhang   PetscReal   ratio = 0.6;
110117ab2063SBarry Smith 
11023a40ed3dSBarry Smith   PetscFunctionBegin;
11033ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
11049566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
1105b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
1106b215bc84SStefano Zampini     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */
11079566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11083ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1109b215bc84SStefano Zampini   }
111017ab2063SBarry Smith 
111143ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
111217ab2063SBarry Smith   for (i = 1; i < m; i++) {
1113416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
111417ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
111594a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111617ab2063SBarry Smith     if (fshift) {
1117bfeeae90SHong Zhang       ip = aj + ai[i];
1118bfeeae90SHong Zhang       ap = aa + ai[i];
111917ab2063SBarry Smith       N  = ailen[i];
11209566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
112148a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
112217ab2063SBarry Smith     }
112317ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
112417ab2063SBarry Smith   }
112517ab2063SBarry Smith   if (m) {
112617ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112717ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
112817ab2063SBarry Smith   }
112917ab2063SBarry Smith   /* reset ilen and imax for each row */
11307b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1131396832f4SHong Zhang   if (A->structure_only) {
11329566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11339566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1134396832f4SHong Zhang   } else { /* !A->structure_only */
113517ab2063SBarry Smith     for (i = 0; i < m; i++) {
113617ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11377b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
113817ab2063SBarry Smith     }
1139396832f4SHong Zhang   }
1140bfeeae90SHong Zhang   a->nz = ai[m];
1141aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
1142bc43efbbSJunchao Zhang   PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly
1143bc43efbbSJunchao Zhang   a->diagonaldense = PETSC_TRUE;
1144bc43efbbSJunchao Zhang   n                = PetscMin(A->rmap->n, A->cmap->n);
1145bc43efbbSJunchao Zhang   for (i = 0; i < n; i++) {
1146bc43efbbSJunchao Zhang     if (a->diag[i] >= ai[i + 1]) {
1147bc43efbbSJunchao Zhang       a->diagonaldense = PETSC_FALSE;
1148bc43efbbSJunchao Zhang       break;
1149bc43efbbSJunchao Zhang     }
1150bc43efbbSJunchao Zhang   }
11519566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11529566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11539566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11542205254eSKarl Rupp 
11558e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1156dd5f02e7SSatish Balay   a->reallocs         = 0;
11576712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
115836db0b34SBarry Smith   a->rmax             = rmax;
11594e220ebcSLois Curfman McInnes 
116048a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11619566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
116317ab2063SBarry Smith }
116417ab2063SBarry Smith 
1165ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1166d71ae5a4SJacob Faibussowitsch {
116799cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
116899cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11692e5835c6SStefano Zampini   MatScalar  *aa;
117099cafbc1SBarry Smith 
117199cafbc1SBarry Smith   PetscFunctionBegin;
11729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
117399cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
117799cafbc1SBarry Smith }
117899cafbc1SBarry Smith 
1179ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1180d71ae5a4SJacob Faibussowitsch {
118199cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
118299cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11832e5835c6SStefano Zampini   MatScalar  *aa;
118499cafbc1SBarry Smith 
118599cafbc1SBarry Smith   PetscFunctionBegin;
11869566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
118799cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
119199cafbc1SBarry Smith }
119299cafbc1SBarry Smith 
1193d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1194d71ae5a4SJacob Faibussowitsch {
1195fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1196fff043a9SJunchao Zhang   MatScalar  *aa;
11973a40ed3dSBarry Smith 
11983a40ed3dSBarry Smith   PetscFunctionBegin;
11999566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
12009566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
12019566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
12029566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
12033ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
120417ab2063SBarry Smith }
1205416022c9SBarry Smith 
1206d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1207d71ae5a4SJacob Faibussowitsch {
1208416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1209d5d45c9bSBarry Smith 
12103a40ed3dSBarry Smith   PetscFunctionBegin;
1211b4e2f619SBarry Smith   if (A->hash_active) {
1212e3c72094SPierre Jolivet     A->ops[0] = a->cops;
1213b4e2f619SBarry Smith     PetscCall(PetscHMapIJVDestroy(&a->ht));
1214b4e2f619SBarry Smith     PetscCall(PetscFree(a->dnz));
1215b4e2f619SBarry Smith     A->hash_active = PETSC_FALSE;
1216b4e2f619SBarry Smith   }
1217b4e2f619SBarry Smith 
12183ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz));
12199566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12209566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12219566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12229566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12239566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12249566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12259566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12269566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12279566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12289566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12299566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12309566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
12319566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12329566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
12339566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1234901853e0SKris Buschelman 
12356718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12366718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12376718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12386718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12396718818eSStefano Zampini      due to different matrix sizes */
12409566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12416718818eSStefano Zampini 
12429566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12432e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12442e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12459566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12469566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12479566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12489566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12499566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12509566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12512e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12522e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12532e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12542e956fe4SStefano Zampini #endif
12554222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12569566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12579566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12589566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12594222ddf1SHong Zhang #endif
1260d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
1261d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL));
1262d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL));
1263d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL));
1264d5e393b6SSuyash Tandon #endif
12653d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12669566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12673d0639e7SStefano Zampini #endif
12689566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1269af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12709566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1271af8000cdSHong Zhang #endif
1272d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
12739566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1274d24d4204SJose E. Roman #endif
127563c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
127863c07aadSStefano Zampini #endif
12799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12809566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
12819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
12829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
12832e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
12849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
12859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
12869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
12879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
12889566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
12899566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
12909566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
12919566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
12929566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
12939566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
12942e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
12952e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
12962e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
12972e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
12982e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
12992e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
13002e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
13013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
130217ab2063SBarry Smith }
130317ab2063SBarry Smith 
1304d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1305d71ae5a4SJacob Faibussowitsch {
1306416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
13073a40ed3dSBarry Smith 
13083a40ed3dSBarry Smith   PetscFunctionBegin;
1309a65d3064SKris Buschelman   switch (op) {
1310d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1311d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1312d71ae5a4SJacob Faibussowitsch     break;
1313d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1314d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1315d71ae5a4SJacob Faibussowitsch     break;
1316d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1317d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1318d71ae5a4SJacob Faibussowitsch     break;
1319d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1320d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1321d71ae5a4SJacob Faibussowitsch     break;
1322d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1323d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1324d71ae5a4SJacob Faibussowitsch     break;
1325d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1326d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1327d71ae5a4SJacob Faibussowitsch     break;
1328d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1329d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1330d71ae5a4SJacob Faibussowitsch     break;
13313d472b54SHong Zhang   case MAT_SPD:
1332b1646e73SJed Brown   case MAT_SYMMETRIC:
1333b1646e73SJed Brown   case MAT_STRUCTURALLY_SYMMETRIC:
1334b1646e73SJed Brown   case MAT_HERMITIAN:
1335b1646e73SJed Brown   case MAT_SYMMETRY_ETERNAL:
1336957cac9fSHong Zhang   case MAT_STRUCTURE_ONLY:
1337b94d7dedSBarry Smith   case MAT_STRUCTURAL_SYMMETRY_ETERNAL:
1338b94d7dedSBarry Smith   case MAT_SPD_ETERNAL:
1339b94d7dedSBarry Smith     /* if the diagonal matrix is square it inherits some of the properties above */
13405021d80fSJed Brown     break;
13418c78258cSHong Zhang   case MAT_FORCE_DIAGONAL_ENTRIES:
1342a65d3064SKris Buschelman   case MAT_IGNORE_OFF_PROC_ENTRIES:
1343d71ae5a4SJacob Faibussowitsch   case MAT_USE_HASH_TABLE:
1344d71ae5a4SJacob Faibussowitsch     PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op]));
1345d71ae5a4SJacob Faibussowitsch     break;
1346d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1347d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1348d71ae5a4SJacob Faibussowitsch     break;
1349d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1350d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1351d71ae5a4SJacob Faibussowitsch     break;
1352071fcb05SBarry Smith   case MAT_SORTED_FULL:
1353071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1354071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1355071fcb05SBarry Smith     break;
1356d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1357d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1358d71ae5a4SJacob Faibussowitsch     break;
1359d71ae5a4SJacob Faibussowitsch   default:
1360d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op);
1361a65d3064SKris Buschelman   }
13623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
136317ab2063SBarry Smith }
136417ab2063SBarry Smith 
1365ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1366d71ae5a4SJacob Faibussowitsch {
1367416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1368fdc842d1SBarry Smith   PetscInt           i, j, n, *ai = a->i, *aj = a->j;
1369c898d852SStefano Zampini   PetscScalar       *x;
1370c898d852SStefano Zampini   const PetscScalar *aa;
137117ab2063SBarry Smith 
13723a40ed3dSBarry Smith   PetscFunctionBegin;
13739566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
137408401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1376d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1377d3e70bfaSHong Zhang     PetscInt *diag = a->diag;
13789566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
13792c990fa1SHong Zhang     for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13809566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13819566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13823ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
138335e7444dSHong Zhang   }
138435e7444dSHong Zhang 
13859566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
138635e7444dSHong Zhang   for (i = 0; i < n; i++) {
1387fdc842d1SBarry Smith     x[i] = 0.0;
138835e7444dSHong Zhang     for (j = ai[i]; j < ai[i + 1]; j++) {
138935e7444dSHong Zhang       if (aj[j] == i) {
139035e7444dSHong Zhang         x[i] = aa[j];
139117ab2063SBarry Smith         break;
139217ab2063SBarry Smith       }
139317ab2063SBarry Smith     }
139417ab2063SBarry Smith   }
13959566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
13969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
139817ab2063SBarry Smith }
139917ab2063SBarry Smith 
1400c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1401d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1402d71ae5a4SJacob Faibussowitsch {
1403416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
14045f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1405d9ca1df4SBarry Smith   PetscScalar       *y;
1406d9ca1df4SBarry Smith   const PetscScalar *x;
1407d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
14085c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
14095f22a7b3SSebastian Grimberg   const MatScalar  *v;
1410a77337e4SBarry Smith   PetscScalar       alpha;
1411d9ca1df4SBarry Smith   PetscInt          n, i, j;
1412d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14133447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1414ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14155c897100SBarry Smith #endif
141617ab2063SBarry Smith 
14173a40ed3dSBarry Smith   PetscFunctionBegin;
14189566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14199566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14209566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14225c897100SBarry Smith 
14235c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1424fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14255c897100SBarry Smith #else
14263447b6efSHong Zhang   if (usecprow) {
14273447b6efSHong Zhang     m    = cprow.nrows;
14283447b6efSHong Zhang     ii   = cprow.i;
14297b2bb3b9SHong Zhang     ridx = cprow.rindex;
14303447b6efSHong Zhang   } else {
14313447b6efSHong Zhang     ii = a->i;
14323447b6efSHong Zhang   }
143317ab2063SBarry Smith   for (i = 0; i < m; i++) {
14343447b6efSHong Zhang     idx = a->j + ii[i];
1435fff043a9SJunchao Zhang     v   = aa + ii[i];
14363447b6efSHong Zhang     n   = ii[i + 1] - ii[i];
14373447b6efSHong Zhang     if (usecprow) {
14387b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14393447b6efSHong Zhang     } else {
144017ab2063SBarry Smith       alpha = x[i];
14413447b6efSHong Zhang     }
144204fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
144317ab2063SBarry Smith   }
14445c897100SBarry Smith #endif
14459566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14469566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14479566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14493ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
145017ab2063SBarry Smith }
145117ab2063SBarry Smith 
1452d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1453d71ae5a4SJacob Faibussowitsch {
14545c897100SBarry Smith   PetscFunctionBegin;
14559566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14569566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14585c897100SBarry Smith }
14595c897100SBarry Smith 
1460c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
146178b84d54SShri Abhyankar 
1462d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1463d71ae5a4SJacob Faibussowitsch {
1464416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1465d9fead3dSBarry Smith   PetscScalar       *y;
146654f21887SBarry Smith   const PetscScalar *x;
1467*5914357eSBarry Smith   const MatScalar   *a_a;
1468003131ecSBarry Smith   PetscInt           m = A->rmap->n;
1469*5914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
1470ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
147117ab2063SBarry Smith 
1472b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
147397952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1474fee21e36SBarry Smith #endif
1475fee21e36SBarry Smith 
14763a40ed3dSBarry Smith   PetscFunctionBegin;
1477b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14789566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
14793ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1480b215bc84SStefano Zampini   }
14819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14829566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14839566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1484416022c9SBarry Smith   ii = a->i;
14854eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14869566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
148797952fefSHong Zhang     m    = a->compressedrow.nrows;
148897952fefSHong Zhang     ii   = a->compressedrow.i;
148997952fefSHong Zhang     ridx = a->compressedrow.rindex;
1490*5914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
1491*5914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
1492*5914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
1493*5914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
1494*5914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
1495*5914357eSBarry Smith       PetscScalar        sum = 0.0;
1496003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1497003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
149897952fefSHong Zhang       y[*ridx++] = sum;
149997952fefSHong Zhang     }
150097952fefSHong Zhang   } else { /* do not use compressed row format */
1501b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
1502*5914357eSBarry Smith     fortranmultaij_(&m, x, ii, a->j, a_a, y);
1503b05257ddSBarry Smith #else
1504*5914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
1505*5914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
1506*5914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
1507*5914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
1508*5914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
1509*5914357eSBarry Smith       PetscScalar        sum = 0.0;
1510003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
151117ab2063SBarry Smith       y[i] = sum;
151217ab2063SBarry Smith     }
15138d195f9aSBarry Smith #endif
1514b05257ddSBarry Smith   }
15159566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15169566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15179566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15189566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15193ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
152017ab2063SBarry Smith }
152117ab2063SBarry Smith 
1522ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1523ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1524d71ae5a4SJacob Faibussowitsch {
1525b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1526b434eb95SMatthew G. Knepley   PetscScalar       *y;
1527b434eb95SMatthew G. Knepley   const PetscScalar *x;
1528fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1529b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1530b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1531b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1532b434eb95SMatthew G. Knepley   PetscScalar        sum;
1533b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1534b434eb95SMatthew G. Knepley 
1535b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1536b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1537b434eb95SMatthew G. Knepley #endif
1538b434eb95SMatthew G. Knepley 
1539b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15409566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15419566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15429566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1543b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1544b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1545b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1546b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1547b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1548b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1549b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1550fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1551b434eb95SMatthew G. Knepley       sum = 0.0;
1552b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1553b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1554b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1555b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1556b434eb95SMatthew G. Knepley     }
1557b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15583d3eaba7SBarry Smith     ii = a->i;
1559b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1560b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1561b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1562fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1563b434eb95SMatthew G. Knepley       sum = 0.0;
1564b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1565b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1566b434eb95SMatthew G. Knepley       y[i] = sum;
1567b434eb95SMatthew G. Knepley     }
1568b434eb95SMatthew G. Knepley   }
15699566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15709566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15719566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1574b434eb95SMatthew G. Knepley }
1575b434eb95SMatthew G. Knepley 
1576ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1577ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1578d71ae5a4SJacob Faibussowitsch {
1579b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1580b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1581b434eb95SMatthew G. Knepley   const PetscScalar *x;
1582fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1583b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1584b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1585b434eb95SMatthew G. Knepley   PetscScalar        sum;
1586b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1587b434eb95SMatthew G. Knepley 
1588b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15909566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15919566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1592b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
159348a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1594b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1595b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1596b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1597b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1598b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1599b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1600fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1601b434eb95SMatthew G. Knepley       sum = y[*ridx];
1602b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1603b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1604b434eb95SMatthew G. Knepley     }
1605b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
16063d3eaba7SBarry Smith     ii = a->i;
1607b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1608b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1609b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1610fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1611b434eb95SMatthew G. Knepley       sum = y[i];
1612b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1613b434eb95SMatthew G. Knepley       z[i] = sum;
1614b434eb95SMatthew G. Knepley     }
1615b434eb95SMatthew G. Knepley   }
16169566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16179566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16189566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16199566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1621b434eb95SMatthew G. Knepley }
1622b434eb95SMatthew G. Knepley 
1623c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1624d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1625d71ae5a4SJacob Faibussowitsch {
1626416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1627f15663dcSBarry Smith   PetscScalar       *y, *z;
1628f15663dcSBarry Smith   const PetscScalar *x;
1629*5914357eSBarry Smith   const MatScalar   *a_a;
1630*5914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
1631*5914357eSBarry Smith   PetscInt           m        = A->rmap->n;
1632ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16339ea0dfa2SSatish Balay 
16343a40ed3dSBarry Smith   PetscFunctionBegin;
1635b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16369566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
16373ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1638b215bc84SStefano Zampini   }
16399566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16409566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16419566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16424eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
164348a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
164497952fefSHong Zhang     m    = a->compressedrow.nrows;
164597952fefSHong Zhang     ii   = a->compressedrow.i;
164697952fefSHong Zhang     ridx = a->compressedrow.rindex;
1647*5914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
1648*5914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
1649*5914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
1650*5914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
1651*5914357eSBarry Smith       PetscScalar        sum = y[*ridx];
1652f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
165397952fefSHong Zhang       z[*ridx++] = sum;
165497952fefSHong Zhang     }
165597952fefSHong Zhang   } else { /* do not use compressed row format */
16563d3eaba7SBarry Smith     ii = a->i;
1657f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
1658*5914357eSBarry Smith     fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z);
1659f15663dcSBarry Smith #else
1660*5914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
1661*5914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
1662*5914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
1663*5914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
1664*5914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
1665*5914357eSBarry Smith       PetscScalar        sum = y[i];
1666f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
166717ab2063SBarry Smith       z[i] = sum;
166817ab2063SBarry Smith     }
166902ab625aSSatish Balay #endif
1670f15663dcSBarry Smith   }
16719566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16729566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16739566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16753ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
167617ab2063SBarry Smith }
167717ab2063SBarry Smith 
167817ab2063SBarry Smith /*
167917ab2063SBarry Smith      Adds diagonal pointers to sparse matrix structure.
168017ab2063SBarry Smith */
1681d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
1682d71ae5a4SJacob Faibussowitsch {
1683416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1684d0f46423SBarry Smith   PetscInt    i, j, m = A->rmap->n;
1685c0c07093SJunchao Zhang   PetscBool   alreadySet = PETSC_TRUE;
168617ab2063SBarry Smith 
16873a40ed3dSBarry Smith   PetscFunctionBegin;
168809f38230SBarry Smith   if (!a->diag) {
16899566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &a->diag));
1690c0c07093SJunchao Zhang     alreadySet = PETSC_FALSE;
169109f38230SBarry Smith   }
1692d0f46423SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
1693c0c07093SJunchao Zhang     /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */
1694c0c07093SJunchao Zhang     if (alreadySet) {
1695c0c07093SJunchao Zhang       PetscInt pos = a->diag[i];
1696c0c07093SJunchao Zhang       if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue;
1697c0c07093SJunchao Zhang     }
1698c0c07093SJunchao Zhang 
169909f38230SBarry Smith     a->diag[i] = a->i[i + 1];
1700bfeeae90SHong Zhang     for (j = a->i[i]; j < a->i[i + 1]; j++) {
1701bfeeae90SHong Zhang       if (a->j[j] == i) {
170209f38230SBarry Smith         a->diag[i] = j;
170317ab2063SBarry Smith         break;
170417ab2063SBarry Smith       }
170517ab2063SBarry Smith     }
170617ab2063SBarry Smith   }
17073ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
170817ab2063SBarry Smith }
170917ab2063SBarry Smith 
1710ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1711d71ae5a4SJacob Faibussowitsch {
171261ecd0c6SBarry Smith   Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
171361ecd0c6SBarry Smith   const PetscInt *diag = (const PetscInt *)a->diag;
171461ecd0c6SBarry Smith   const PetscInt *ii   = (const PetscInt *)a->i;
171561ecd0c6SBarry Smith   PetscInt        i, *mdiag = NULL;
171661ecd0c6SBarry Smith   PetscInt        cnt = 0; /* how many diagonals are missing */
171761ecd0c6SBarry Smith 
171861ecd0c6SBarry Smith   PetscFunctionBegin;
171961ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
17209566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
17219566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
17223ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
172361ecd0c6SBarry Smith   }
172461ecd0c6SBarry Smith 
172561ecd0c6SBarry Smith   if (a->diagonaldense) {
172661ecd0c6SBarry Smith     cnt = 0;
172761ecd0c6SBarry Smith   } else {
17289566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
172961ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
1730349d3b71SJunchao Zhang       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
173161ecd0c6SBarry Smith         cnt++;
173261ecd0c6SBarry Smith         mdiag[i] = 1;
173361ecd0c6SBarry Smith       }
173461ecd0c6SBarry Smith     }
173561ecd0c6SBarry Smith   }
173661ecd0c6SBarry Smith   if (!cnt) {
17379566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
173861ecd0c6SBarry Smith   } else {
1739b6f2aa54SBarry Smith     PetscScalar       *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1740b6f2aa54SBarry Smith     PetscInt          *oldj = a->j, *oldi = a->i;
174161ecd0c6SBarry Smith     PetscBool          singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij;
17426ea2a7edSJunchao Zhang     const PetscScalar *Aa;
17436ea2a7edSJunchao Zhang 
17446ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host
17456ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa));
174661ecd0c6SBarry Smith 
174761ecd0c6SBarry Smith     a->a = NULL;
174861ecd0c6SBarry Smith     a->j = NULL;
174961ecd0c6SBarry Smith     a->i = NULL;
175061ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
1751ad540459SPierre Jolivet     for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17529566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
175361ecd0c6SBarry Smith 
175461ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
175561ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
17569566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
175748a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1758447d62f5SStefano Zampini     }
17599566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17609566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
176161ecd0c6SBarry Smith     if (singlemalloc) {
17629566063dSJacob Faibussowitsch       PetscCall(PetscFree3(olda, oldj, oldi));
176361ecd0c6SBarry Smith     } else {
17649566063dSJacob Faibussowitsch       if (free_a) PetscCall(PetscFree(olda));
17659566063dSJacob Faibussowitsch       if (free_ij) PetscCall(PetscFree(oldj));
17669566063dSJacob Faibussowitsch       if (free_ij) PetscCall(PetscFree(oldi));
176761ecd0c6SBarry Smith     }
176861ecd0c6SBarry Smith   }
17699566063dSJacob Faibussowitsch   PetscCall(PetscFree(mdiag));
177061ecd0c6SBarry Smith   a->diagonaldense = PETSC_TRUE;
17713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
177261ecd0c6SBarry Smith }
177361ecd0c6SBarry Smith 
1774be5855fcSBarry Smith /*
1775be5855fcSBarry Smith      Checks for missing diagonals
1776be5855fcSBarry Smith */
1777d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d)
1778d71ae5a4SJacob Faibussowitsch {
1779be5855fcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
17807734d3b5SMatthew G. Knepley   PetscInt   *diag, *ii = a->i, i;
1781be5855fcSBarry Smith 
1782be5855fcSBarry Smith   PetscFunctionBegin;
178309f38230SBarry Smith   *missing = PETSC_FALSE;
17847734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
178509f38230SBarry Smith     *missing = PETSC_TRUE;
178609f38230SBarry Smith     if (d) *d = 0;
17879566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
178809f38230SBarry Smith   } else {
178901445905SHong Zhang     PetscInt n;
179001445905SHong Zhang     n    = PetscMin(A->rmap->n, A->cmap->n);
1791f1e2ffcdSBarry Smith     diag = a->diag;
179201445905SHong Zhang     for (i = 0; i < n; i++) {
17937734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
179409f38230SBarry Smith         *missing = PETSC_TRUE;
179509f38230SBarry Smith         if (d) *d = i;
17969566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i));
1797358d2f5dSShri Abhyankar         break;
179809f38230SBarry Smith       }
1799be5855fcSBarry Smith     }
1800be5855fcSBarry Smith   }
18013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1802be5855fcSBarry Smith }
1803be5855fcSBarry Smith 
18040da83c2eSBarry Smith #include <petscblaslapack.h>
18050da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
18060da83c2eSBarry Smith 
18070da83c2eSBarry Smith /*
18080da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
18090da83c2eSBarry Smith */
1810ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1811d71ae5a4SJacob Faibussowitsch {
18120da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
18130da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
18140da83c2eSBarry Smith   const PetscReal shift = 0.0;
18150da83c2eSBarry Smith   PetscInt        ipvt[5];
18164e208921SJed Brown   PetscCount      flops = 0;
18170da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
18180da83c2eSBarry Smith 
18190da83c2eSBarry Smith   PetscFunctionBegin;
18200da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
18210da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
182208401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1823ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
18249566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
182548a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
18260da83c2eSBarry Smith   ncnt = 0;
18270da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
18280da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
18299566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
18300da83c2eSBarry Smith     switch (bsizes[i]) {
1831d71ae5a4SJacob Faibussowitsch     case 1:
1832d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1833d71ae5a4SJacob Faibussowitsch       break;
18340da83c2eSBarry Smith     case 2:
18359566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
18360da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18379566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
18380da83c2eSBarry Smith       break;
18390da83c2eSBarry Smith     case 3:
18409566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
18410da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18429566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
18430da83c2eSBarry Smith       break;
18440da83c2eSBarry Smith     case 4:
18459566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
18460da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18479566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
18480da83c2eSBarry Smith       break;
18490da83c2eSBarry Smith     case 5:
18509566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
18510da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18529566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
18530da83c2eSBarry Smith       break;
18540da83c2eSBarry Smith     case 6:
18559566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
18560da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18579566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
18580da83c2eSBarry Smith       break;
18590da83c2eSBarry Smith     case 7:
18609566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
18610da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18629566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
18630da83c2eSBarry Smith       break;
18640da83c2eSBarry Smith     default:
18659566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
18660da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18679566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
18680da83c2eSBarry Smith     }
18690da83c2eSBarry Smith     ncnt += bsizes[i];
18700da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
1871baa50dc0SBrad Aagaard     flops += 2 * PetscPowInt64(bsizes[i], 3) / 3;
18720da83c2eSBarry Smith   }
18733ba16761SJacob Faibussowitsch   PetscCall(PetscLogFlops(flops));
187448a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18759566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18770da83c2eSBarry Smith }
18780da83c2eSBarry Smith 
1879422a814eSBarry Smith /*
1880422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1881422a814eSBarry Smith */
1882ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1883d71ae5a4SJacob Faibussowitsch {
188471f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1885d0f46423SBarry Smith   PetscInt         i, *diag, m = A->rmap->n;
18862e5835c6SStefano Zampini   const MatScalar *v;
188754f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
188871f1c65dSBarry Smith 
188971f1c65dSBarry Smith   PetscFunctionBegin;
18903ba16761SJacob Faibussowitsch   if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS);
18919566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
189271f1c65dSBarry Smith   diag = a->diag;
18934dfa11a4SJacob Faibussowitsch   if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); }
18942e5835c6SStefano Zampini 
189571f1c65dSBarry Smith   mdiag = a->mdiag;
189671f1c65dSBarry Smith   idiag = a->idiag;
18979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1898422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
189971f1c65dSBarry Smith     for (i = 0; i < m; i++) {
190071f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1901899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1902899639b0SHong Zhang         if (PetscRealPart(fshift)) {
19039566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
19047b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
19057b6c816cSBarry Smith           A->factorerror_zeropivot_value = 0.0;
19067b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
190798921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
1908899639b0SHong Zhang       }
190971f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
191071f1c65dSBarry Smith     }
19119566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
191271f1c65dSBarry Smith   } else {
191371f1c65dSBarry Smith     for (i = 0; i < m; i++) {
191471f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
191571f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
191671f1c65dSBarry Smith     }
19179566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
191871f1c65dSBarry Smith   }
191971f1c65dSBarry Smith   a->idiagvalid = PETSC_TRUE;
19209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
19213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
192271f1c65dSBarry Smith }
192371f1c65dSBarry Smith 
1924d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1925d71ae5a4SJacob Faibussowitsch {
1926416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1927e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
19282e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
192954f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
19303d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
193197f1f81fSBarry Smith   const PetscInt    *idx, *diag;
193217ab2063SBarry Smith 
19333a40ed3dSBarry Smith   PetscFunctionBegin;
1934b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
19359566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
19363ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1937b215bc84SStefano Zampini   }
1938b965ef7fSBarry Smith   its = its * lits;
193991723122SBarry Smith 
194071f1c65dSBarry Smith   if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
19419566063dSJacob Faibussowitsch   if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift));
194271f1c65dSBarry Smith   a->fshift = fshift;
194371f1c65dSBarry Smith   a->omega  = omega;
1944ed480e8bSBarry Smith 
194571f1c65dSBarry Smith   diag  = a->diag;
194671f1c65dSBarry Smith   t     = a->ssor_work;
1947ed480e8bSBarry Smith   idiag = a->idiag;
194871f1c65dSBarry Smith   mdiag = a->mdiag;
1949ed480e8bSBarry Smith 
19509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
19519566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
19529566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1953ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
195417ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
195517ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1956ed480e8bSBarry Smith     bs = b;
195717ab2063SBarry Smith     for (i = 0; i < m; i++) {
195871f1c65dSBarry Smith       d   = fshift + mdiag[i];
1959416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1960ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19612e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
196217ab2063SBarry Smith       sum = b[i] * d / omega;
1963003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
196417ab2063SBarry Smith       x[i] = sum;
196517ab2063SBarry Smith     }
19669566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19679566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19689566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
19699566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
19703ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
197117ab2063SBarry Smith   }
1972c783ea89SBarry Smith 
197308401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1974f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19754c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1976887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
197717ab2063SBarry Smith 
197817ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
197917ab2063SBarry Smith 
1980887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
198117ab2063SBarry Smith     */
198217ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
198317ab2063SBarry Smith 
198417ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
198517ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1986416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1987ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19882e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
198917ab2063SBarry Smith       sum = b[i];
1990e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1991ed480e8bSBarry Smith       x[i] = sum * idiag[i];
199217ab2063SBarry Smith     }
199317ab2063SBarry Smith 
199417ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19952e5835c6SStefano Zampini     v = aa;
19962205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
199717ab2063SBarry Smith 
199817ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1999ed480e8bSBarry Smith     ts   = t;
2000416022c9SBarry Smith     diag = a->diag;
200117ab2063SBarry Smith     for (i = 0; i < m; i++) {
2002416022c9SBarry Smith       n   = diag[i] - a->i[i];
2003ed480e8bSBarry Smith       idx = a->j + a->i[i];
20042e5835c6SStefano Zampini       v   = aa + a->i[i];
200517ab2063SBarry Smith       sum = t[i];
2006003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
2007ed480e8bSBarry Smith       t[i] = sum * idiag[i];
2008733d66baSBarry Smith       /*  x = x + t */
2009733d66baSBarry Smith       x[i] += t[i];
201017ab2063SBarry Smith     }
201117ab2063SBarry Smith 
20129566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
20139566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
20149566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
20153ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
201617ab2063SBarry Smith   }
201717ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
201817ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
201917ab2063SBarry Smith       for (i = 0; i < m; i++) {
2020416022c9SBarry Smith         n   = diag[i] - a->i[i];
2021ed480e8bSBarry Smith         idx = a->j + a->i[i];
20222e5835c6SStefano Zampini         v   = aa + a->i[i];
202317ab2063SBarry Smith         sum = b[i];
2024e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20255c99c7daSBarry Smith         t[i] = sum;
2026ed480e8bSBarry Smith         x[i] = sum * idiag[i];
202717ab2063SBarry Smith       }
20285c99c7daSBarry Smith       xb = t;
20299566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
20303a40ed3dSBarry Smith     } else xb = b;
203117ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
203217ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2033416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
2034ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
20352e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
203617ab2063SBarry Smith         sum = xb[i];
2037e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20385c99c7daSBarry Smith         if (xb == b) {
2039ed480e8bSBarry Smith           x[i] = sum * idiag[i];
20405c99c7daSBarry Smith         } else {
2041b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
204217ab2063SBarry Smith         }
20435c99c7daSBarry Smith       }
20449566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
204517ab2063SBarry Smith     }
204617ab2063SBarry Smith     its--;
204717ab2063SBarry Smith   }
204817ab2063SBarry Smith   while (its--) {
204917ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
205017ab2063SBarry Smith       for (i = 0; i < m; i++) {
2051b19a5dc2SMark Adams         /* lower */
2052b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
2053ed480e8bSBarry Smith         idx = a->j + a->i[i];
20542e5835c6SStefano Zampini         v   = aa + a->i[i];
205517ab2063SBarry Smith         sum = b[i];
2056e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2057b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
2058b19a5dc2SMark Adams         /* upper */
2059b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
2060b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
20612e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
2062b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2063b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
206417ab2063SBarry Smith       }
2065b19a5dc2SMark Adams       xb = t;
20669566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
2067b19a5dc2SMark Adams     } else xb = b;
206817ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
206917ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2070b19a5dc2SMark Adams         sum = xb[i];
2071b19a5dc2SMark Adams         if (xb == b) {
2072b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
2073416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
2074ed480e8bSBarry Smith           idx = a->j + a->i[i];
20752e5835c6SStefano Zampini           v   = aa + a->i[i];
2076e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2077ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2078b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2079b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2080b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20812e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2082b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2083b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
208417ab2063SBarry Smith         }
2085b19a5dc2SMark Adams       }
2086b19a5dc2SMark Adams       if (xb == b) {
20879566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2088b19a5dc2SMark Adams       } else {
20899566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2090b19a5dc2SMark Adams       }
209117ab2063SBarry Smith     }
209217ab2063SBarry Smith   }
20939566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20949566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20959566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
20963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
209717ab2063SBarry Smith }
209817ab2063SBarry Smith 
2099ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2100d71ae5a4SJacob Faibussowitsch {
2101416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
21024e220ebcSLois Curfman McInnes 
21033a40ed3dSBarry Smith   PetscFunctionBegin;
21044e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
21053966268fSBarry Smith   info->nz_allocated = a->maxnz;
21063966268fSBarry Smith   info->nz_used      = a->nz;
21073966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
21083966268fSBarry Smith   info->assemblies   = A->num_ass;
21093966268fSBarry Smith   info->mallocs      = A->info.mallocs;
21104dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2111d5f3da31SBarry Smith   if (A->factortype) {
21124e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
21134e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
21144e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
21154e220ebcSLois Curfman McInnes   } else {
21164e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
21174e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
21184e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
21194e220ebcSLois Curfman McInnes   }
21203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
212117ab2063SBarry Smith }
212217ab2063SBarry Smith 
2123ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2124d71ae5a4SJacob Faibussowitsch {
2125416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2126c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
212797b48c8fSBarry Smith   const PetscScalar *xx;
21282e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2129c7da8527SEric Chamberland   PetscInt           d = 0;
213017ab2063SBarry Smith 
21313a40ed3dSBarry Smith   PetscFunctionBegin;
213297b48c8fSBarry Smith   if (x && b) {
21339566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21349566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
213597b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2136aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2137447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
213897b48c8fSBarry Smith       bb[rows[i]] = diag * xx[rows[i]];
213997b48c8fSBarry Smith     }
21409566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21419566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
214297b48c8fSBarry Smith   }
214397b48c8fSBarry Smith 
21449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2145a9817697SBarry Smith   if (a->keepnonzeropattern) {
2146f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2147aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21489566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2149f1e2ffcdSBarry Smith     }
2150f4df32b1SMatthew Knepley     if (diag != 0.0) {
2151c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2152c7da8527SEric Chamberland         d = rows[i];
2153447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
215408401ef6SPierre Jolivet         PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
2155c7da8527SEric Chamberland       }
2156f1e2ffcdSBarry Smith       for (i = 0; i < N; i++) {
2157447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
21582e5835c6SStefano Zampini         aa[a->diag[rows[i]]] = diag;
2159f1e2ffcdSBarry Smith       }
2160f1e2ffcdSBarry Smith     }
2161f1e2ffcdSBarry Smith   } else {
2162f4df32b1SMatthew Knepley     if (diag != 0.0) {
216317ab2063SBarry Smith       for (i = 0; i < N; i++) {
2164aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21657ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2166447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2167447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2168447d62f5SStefano Zampini           } else {
2169416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
21702e5835c6SStefano Zampini             aa[a->i[rows[i]]]   = diag;
2171bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2172447d62f5SStefano Zampini           }
2173447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
21749566063dSJacob Faibussowitsch           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
217517ab2063SBarry Smith         }
217617ab2063SBarry Smith       }
21773a40ed3dSBarry Smith     } else {
217817ab2063SBarry Smith       for (i = 0; i < N; i++) {
2179aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2180416022c9SBarry Smith         a->ilen[rows[i]] = 0;
218117ab2063SBarry Smith       }
218217ab2063SBarry Smith     }
2183e56f5c9eSBarry Smith     A->nonzerostate++;
2184f1e2ffcdSBarry Smith   }
21859566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2186dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
218817ab2063SBarry Smith }
218917ab2063SBarry Smith 
2190ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2191d71ae5a4SJacob Faibussowitsch {
21926e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21936e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
21942b40b63fSBarry Smith   PetscBool          missing, *zeroed, vecs = PETSC_FALSE;
21956e169961SBarry Smith   const PetscScalar *xx;
21962e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
21976e169961SBarry Smith 
21986e169961SBarry Smith   PetscFunctionBegin;
21993ba16761SJacob Faibussowitsch   if (!N) PetscFunctionReturn(PETSC_SUCCESS);
22009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
22016e169961SBarry Smith   if (x && b) {
22029566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
22039566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
22042b40b63fSBarry Smith     vecs = PETSC_TRUE;
22056e169961SBarry Smith   }
22069566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
22076e169961SBarry Smith   for (i = 0; i < N; i++) {
2208aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
22098e3a54c0SPierre Jolivet     PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]]));
22102205254eSKarl Rupp 
22116e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
22126e169961SBarry Smith   }
22136e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
22146e169961SBarry Smith     if (!zeroed[i]) {
22156e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
22164cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
22172e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
22182e5835c6SStefano Zampini           aa[j] = 0.0;
22196e169961SBarry Smith         }
22206e169961SBarry Smith       }
22214cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i];
22226e169961SBarry Smith   }
22236e169961SBarry Smith   if (x && b) {
22249566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
22259566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
22266e169961SBarry Smith   }
22279566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
22286e169961SBarry Smith   if (diag != 0.0) {
22299566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d));
22301d5a398dSstefano_zampini     if (missing) {
22311d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
22324cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2233aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
22349566063dSJacob Faibussowitsch         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
22351d5a398dSstefano_zampini       }
22361d5a398dSstefano_zampini     } else {
2237ad540459SPierre Jolivet       for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag;
22386e169961SBarry Smith     }
22391d5a398dSstefano_zampini   }
22409566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2241dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
22423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22436e169961SBarry Smith }
22446e169961SBarry Smith 
2245d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2246d71ae5a4SJacob Faibussowitsch {
2247fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2248fff043a9SJunchao Zhang   const PetscScalar *aa;
224917ab2063SBarry Smith 
22503a40ed3dSBarry Smith   PetscFunctionBegin;
22519566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2252416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
22538e3a54c0SPierre Jolivet   if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]);
225417ab2063SBarry Smith   if (idx) {
22555c0db29aSPierre Jolivet     if (*nz && a->j) *idx = a->j + a->i[row];
2256f4259b30SLisandro Dalcin     else *idx = NULL;
225717ab2063SBarry Smith   }
22589566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
22593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
226017ab2063SBarry Smith }
226117ab2063SBarry Smith 
2262d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2263d71ae5a4SJacob Faibussowitsch {
22643a40ed3dSBarry Smith   PetscFunctionBegin;
22653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
226617ab2063SBarry Smith }
226717ab2063SBarry Smith 
2268ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2269d71ae5a4SJacob Faibussowitsch {
2270416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
22712e5835c6SStefano Zampini   const MatScalar *v;
227236db0b34SBarry Smith   PetscReal        sum = 0.0;
227397f1f81fSBarry Smith   PetscInt         i, j;
227417ab2063SBarry Smith 
22753a40ed3dSBarry Smith   PetscFunctionBegin;
22769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
227717ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2278570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2279570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2280792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2281570b7f6dSBarry Smith #else
2282416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22839371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22849371c9d4SSatish Balay       v++;
228517ab2063SBarry Smith     }
22868f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2287570b7f6dSBarry Smith #endif
22889566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22893a40ed3dSBarry Smith   } else if (type == NORM_1) {
229036db0b34SBarry Smith     PetscReal *tmp;
229197f1f81fSBarry Smith     PetscInt  *jj = a->j;
22929566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp));
2293064f8208SBarry Smith     *nrm = 0.0;
2294416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22959371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22969371c9d4SSatish Balay       v++;
229717ab2063SBarry Smith     }
2298d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2299064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
230017ab2063SBarry Smith     }
23019566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
23029566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
23033a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2304064f8208SBarry Smith     *nrm = 0.0;
2305d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
23068e3a54c0SPierre Jolivet       const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]);
230717ab2063SBarry Smith       sum                   = 0.0;
2308416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
23099371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
23109371c9d4SSatish Balay         v2++;
231117ab2063SBarry Smith       }
2312064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
231317ab2063SBarry Smith     }
23149566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
2315f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
23169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
23173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
231817ab2063SBarry Smith }
231917ab2063SBarry Smith 
2320ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2321d71ae5a4SJacob Faibussowitsch {
23223d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
232354f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
23242e5835c6SStefano Zampini   const MatScalar *va, *vb;
232597f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2326cd0d46ebSvictorle 
2327cd0d46ebSvictorle   PetscFunctionBegin;
23289566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23299566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23305485867bSBarry Smith   if (ma != nb || na != mb) {
23315485867bSBarry Smith     *f = PETSC_FALSE;
23323ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23335485867bSBarry Smith   }
23349566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
23359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
23369371c9d4SSatish Balay   aii = aij->i;
23379371c9d4SSatish Balay   bii = bij->i;
23389371c9d4SSatish Balay   adx = aij->j;
23399371c9d4SSatish Balay   bdx = bij->j;
23409566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23419566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2342cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2343cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2344cd0d46ebSvictorle 
2345cd0d46ebSvictorle   *f = PETSC_TRUE;
2346cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2347cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
234897f1f81fSBarry Smith       PetscInt    idc, idr;
23495485867bSBarry Smith       PetscScalar vc, vr;
2350cd0d46ebSvictorle       /* column/row index/value */
23515485867bSBarry Smith       idc = adx[aptr[i]];
23525485867bSBarry Smith       idr = bdx[bptr[idc]];
23535485867bSBarry Smith       vc  = va[aptr[i]];
23545485867bSBarry Smith       vr  = vb[bptr[idc]];
23555485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
23565485867bSBarry Smith         *f = PETSC_FALSE;
23575485867bSBarry Smith         goto done;
2358cd0d46ebSvictorle       } else {
23595485867bSBarry Smith         aptr[i]++;
23605485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2361cd0d46ebSvictorle       }
2362cd0d46ebSvictorle     }
2363cd0d46ebSvictorle   }
2364cd0d46ebSvictorle done:
23659566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23669566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
23689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
23693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2370cd0d46ebSvictorle }
2371cd0d46ebSvictorle 
2372ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2373d71ae5a4SJacob Faibussowitsch {
23743d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
237554f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
237654f21887SBarry Smith   MatScalar  *va, *vb;
23771cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23781cbb95d3SBarry Smith 
23791cbb95d3SBarry Smith   PetscFunctionBegin;
23809566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23819566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23821cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23831cbb95d3SBarry Smith     *f = PETSC_FALSE;
23843ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23851cbb95d3SBarry Smith   }
23869371c9d4SSatish Balay   aii = aij->i;
23879371c9d4SSatish Balay   bii = bij->i;
23889371c9d4SSatish Balay   adx = aij->j;
23899371c9d4SSatish Balay   bdx = bij->j;
23909371c9d4SSatish Balay   va  = aij->a;
23919371c9d4SSatish Balay   vb  = bij->a;
23929566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23939566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23941cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23951cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23961cbb95d3SBarry Smith 
23971cbb95d3SBarry Smith   *f = PETSC_TRUE;
23981cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
23991cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
24001cbb95d3SBarry Smith       PetscInt    idc, idr;
24011cbb95d3SBarry Smith       PetscScalar vc, vr;
24021cbb95d3SBarry Smith       /* column/row index/value */
24031cbb95d3SBarry Smith       idc = adx[aptr[i]];
24041cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
24051cbb95d3SBarry Smith       vc  = va[aptr[i]];
24061cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
24071cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
24081cbb95d3SBarry Smith         *f = PETSC_FALSE;
24091cbb95d3SBarry Smith         goto done;
24101cbb95d3SBarry Smith       } else {
24111cbb95d3SBarry Smith         aptr[i]++;
24121cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
24131cbb95d3SBarry Smith       }
24141cbb95d3SBarry Smith     }
24151cbb95d3SBarry Smith   }
24161cbb95d3SBarry Smith done:
24179566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
24189566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
24193ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24201cbb95d3SBarry Smith }
24211cbb95d3SBarry Smith 
2422d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2423d71ae5a4SJacob Faibussowitsch {
2424416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2425fff8e43fSBarry Smith   const PetscScalar *l, *r;
2426fff8e43fSBarry Smith   PetscScalar        x;
242754f21887SBarry Smith   MatScalar         *v;
2428fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2429fff8e43fSBarry Smith   const PetscInt    *jj;
243017ab2063SBarry Smith 
24313a40ed3dSBarry Smith   PetscFunctionBegin;
243217ab2063SBarry Smith   if (ll) {
24333ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
24343ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
24359566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
243608401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
24379566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
24389566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
243917ab2063SBarry Smith     for (i = 0; i < m; i++) {
244017ab2063SBarry Smith       x = l[i];
2441416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
24422205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
244317ab2063SBarry Smith     }
24449566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
24459566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
24469566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
244717ab2063SBarry Smith   }
244817ab2063SBarry Smith   if (rr) {
24499566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
245008401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
24519566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
24529566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
24532e5835c6SStefano Zampini     jj = a->j;
24542205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
24559566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
24569566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
24579566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
245817ab2063SBarry Smith   }
24599566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
24603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
246117ab2063SBarry Smith }
246217ab2063SBarry Smith 
2463d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2464d71ae5a4SJacob Faibussowitsch {
2465db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2466d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
246797f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
24685d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
24692e5835c6SStefano Zampini   const PetscScalar *aa;
24705d0c19d7SBarry Smith   PetscInt           nrows, ncols;
247197f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
2472fb3c7e2dSJunchao Zhang   MatScalar         *a_new, *mat_a, *c_a;
2473416022c9SBarry Smith   Mat                C;
2474cdc6f3adSToby Isaac   PetscBool          stride;
247517ab2063SBarry Smith 
24763a40ed3dSBarry Smith   PetscFunctionBegin;
24779566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24789566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24799566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
248017ab2063SBarry Smith 
24819566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2482ff718158SBarry Smith   if (stride) {
24839566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2484ff718158SBarry Smith   } else {
2485ff718158SBarry Smith     first = 0;
2486ff718158SBarry Smith     step  = 0;
2487ff718158SBarry Smith   }
2488fee21e36SBarry Smith   if (stride && step == 1) {
248902834360SBarry Smith     /* special case of contiguous rows */
24909566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
249102834360SBarry Smith     /* loop over new rows determining lens and starting points */
249202834360SBarry Smith     for (i = 0; i < nrows; i++) {
2493bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2494a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2495a91a9bebSLisandro Dalcin       starts[i] = kstart;
249602834360SBarry Smith       for (k = kstart; k < kend; k++) {
2497bfeeae90SHong Zhang         if (aj[k] >= first) {
249802834360SBarry Smith           starts[i] = k;
249902834360SBarry Smith           break;
250002834360SBarry Smith         }
250102834360SBarry Smith       }
2502a2744918SBarry Smith       sum = 0;
250302834360SBarry Smith       while (k < kend) {
2504bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2505a2744918SBarry Smith         sum++;
250602834360SBarry Smith       }
2507a2744918SBarry Smith       lens[i] = sum;
250802834360SBarry Smith     }
250902834360SBarry Smith     /* create submatrix */
2510cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
251197f1f81fSBarry Smith       PetscInt n_cols, n_rows;
25129566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2513aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
25149566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
251508480c60SBarry Smith       C = *B;
25163a40ed3dSBarry Smith     } else {
25173bef6203SJed Brown       PetscInt rbs, cbs;
25189566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25199566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25209566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25219566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25229566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25239566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25249566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
252508480c60SBarry Smith     }
2526db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2527db02288aSLois Curfman McInnes 
252802834360SBarry Smith     /* loop over rows inserting into submatrix */
2529fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C
2530db02288aSLois Curfman McInnes     j_new = c->j;
2531db02288aSLois Curfman McInnes     i_new = c->i;
25329566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
253302834360SBarry Smith     for (i = 0; i < nrows; i++) {
2534a2744918SBarry Smith       ii    = starts[i];
2535a2744918SBarry Smith       lensi = lens[i];
2536810441c8SPierre Jolivet       if (lensi) {
2537ad540459SPierre Jolivet         for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
25389566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2539a2744918SBarry Smith         a_new += lensi;
2540810441c8SPierre Jolivet       }
2541a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2542a2744918SBarry Smith       c->ilen[i]   = lensi;
254302834360SBarry Smith     }
2544fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly
25459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
25469566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
25473a40ed3dSBarry Smith   } else {
25489566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
25499566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
25509566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
25514dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
25526bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
25534dcab191SBarry Smith       smap[icol[i]] = i + 1;
25544dcab191SBarry Smith     }
25554dcab191SBarry Smith 
255602834360SBarry Smith     /* determine lens of each row */
255702834360SBarry Smith     for (i = 0; i < nrows; i++) {
2558bfeeae90SHong Zhang       kstart  = ai[irow[i]];
255902834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
256002834360SBarry Smith       lens[i] = 0;
256102834360SBarry Smith       for (k = kstart; k < kend; k++) {
2562ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
256302834360SBarry Smith       }
256402834360SBarry Smith     }
256517ab2063SBarry Smith     /* Create and fill new matrix */
2566a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2567ace3abfcSBarry Smith       PetscBool equal;
25680f5bd95cSBarry Smith 
256999141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2570aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
25719566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
2572fdfbdca6SPierre Jolivet       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros");
25739566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
257408480c60SBarry Smith       C = *B;
25753a40ed3dSBarry Smith     } else {
25763bef6203SJed Brown       PetscInt rbs, cbs;
25779566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25789566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25799566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25809566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
258137a5e0faSPierre Jolivet       if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs));
25829566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25839566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
258408480c60SBarry Smith     }
25859566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2586fb3c7e2dSJunchao Zhang 
2587f4f49eeaSPierre Jolivet     c = (Mat_SeqAIJ *)C->data;
2588fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C
258917ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
259099141d43SSatish Balay       row      = irow[i];
2591bfeeae90SHong Zhang       kstart   = ai[row];
259299141d43SSatish Balay       kend     = kstart + a->ilen[row];
2593bfeeae90SHong Zhang       mat_i    = c->i[i];
25948e3a54c0SPierre Jolivet       mat_j    = PetscSafePointerPlusOffset(c->j, mat_i);
25958e3a54c0SPierre Jolivet       mat_a    = PetscSafePointerPlusOffset(c_a, mat_i);
259699141d43SSatish Balay       mat_ilen = c->ilen + i;
259717ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2598bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2599ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
26002e5835c6SStefano Zampini           *mat_a++ = aa[k];
260199141d43SSatish Balay           (*mat_ilen)++;
260217ab2063SBarry Smith         }
260317ab2063SBarry Smith       }
260417ab2063SBarry Smith     }
26059566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
260602834360SBarry Smith     /* Free work space */
26079566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
26089566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
26099566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2610cdc6f3adSToby Isaac     /* sort */
2611cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2612cdc6f3adSToby Isaac       PetscInt ilen;
2613cdc6f3adSToby Isaac 
2614cdc6f3adSToby Isaac       mat_i = c->i[i];
26158e3a54c0SPierre Jolivet       mat_j = PetscSafePointerPlusOffset(c->j, mat_i);
26168e3a54c0SPierre Jolivet       mat_a = PetscSafePointerPlusOffset(c_a, mat_i);
2617cdc6f3adSToby Isaac       ilen  = c->ilen[i];
26189566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2619cdc6f3adSToby Isaac     }
2620fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a));
262102834360SBarry Smith   }
26228c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
26239566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2624305c6ccfSStefano Zampini #endif
26259566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
26269566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
262717ab2063SBarry Smith 
26289566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2629416022c9SBarry Smith   *B = C;
26303ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
263117ab2063SBarry Smith }
263217ab2063SBarry Smith 
2633ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2634d71ae5a4SJacob Faibussowitsch {
263582d44351SHong Zhang   Mat B;
263682d44351SHong Zhang 
263782d44351SHong Zhang   PetscFunctionBegin;
2638c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
26399566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
26409566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
26419566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
26429566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
26439566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
264482d44351SHong Zhang     *subMat = B;
2645c2d650bdSHong Zhang   } else {
26469566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2647c2d650bdSHong Zhang   }
26483ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
264982d44351SHong Zhang }
265082d44351SHong Zhang 
2651ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2652d71ae5a4SJacob Faibussowitsch {
265363b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
265463b91edcSBarry Smith   Mat         outA;
2655ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
265663b91edcSBarry Smith 
26573a40ed3dSBarry Smith   PetscFunctionBegin;
265808401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
26591df811f5SHong Zhang 
26609566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
26619566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2662a871dcd8SBarry Smith 
266363b91edcSBarry Smith   outA             = inA;
2664d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26659566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
26669566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
26672205254eSKarl Rupp 
26689566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
26699566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
26702205254eSKarl Rupp 
2671c3122656SLisandro Dalcin   a->row = row;
26722205254eSKarl Rupp 
26739566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
26749566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
26752205254eSKarl Rupp 
2676c3122656SLisandro Dalcin   a->col = col;
267763b91edcSBarry Smith 
267836db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26799566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26809566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2681f0ec6fceSSatish Balay 
268294a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
26839566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work));
268494a9d846SBarry Smith   }
268563b91edcSBarry Smith 
26869566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(inA));
2687137fb511SHong Zhang   if (row_identity && col_identity) {
26889566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2689137fb511SHong Zhang   } else {
26909566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2691137fb511SHong Zhang   }
26923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2693a871dcd8SBarry Smith }
2694a871dcd8SBarry Smith 
2695d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2696d71ae5a4SJacob Faibussowitsch {
2697f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2698dfa0f9e5SStefano Zampini   PetscScalar *v;
2699c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
27003a40ed3dSBarry Smith 
27013a40ed3dSBarry Smith   PetscFunctionBegin;
27029566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
27039566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2704792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
27059566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
27069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
27079566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(inA));
27083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2709f0b747eeSBarry Smith }
2710f0b747eeSBarry Smith 
2711d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2712d71ae5a4SJacob Faibussowitsch {
271316b64355SHong Zhang   PetscInt i;
271416b64355SHong Zhang 
271516b64355SHong Zhang   PetscFunctionBegin;
271616b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
27179566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
271816b64355SHong Zhang 
271948a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
27209566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
272116b64355SHong Zhang 
272216b64355SHong Zhang     if (submatj->rbuf1) {
27239566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
27249566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
272516b64355SHong Zhang     }
272616b64355SHong Zhang 
272748a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
27289566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
27299566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
273016b64355SHong Zhang   }
273116b64355SHong Zhang 
273216b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2733eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&submatj->rmap));
27349566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
27359566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
273616b64355SHong Zhang #else
27379566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
273816b64355SHong Zhang #endif
273916b64355SHong Zhang 
274016b64355SHong Zhang   if (!submatj->allcolumns) {
274116b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2742eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap));
274316b64355SHong Zhang #else
27449566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
274516b64355SHong Zhang #endif
274616b64355SHong Zhang   }
27479566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
274816b64355SHong Zhang 
27499566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
27503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
275116b64355SHong Zhang }
275216b64355SHong Zhang 
2753d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2754d71ae5a4SJacob Faibussowitsch {
275516b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
27565c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
275716b64355SHong Zhang 
275816b64355SHong Zhang   PetscFunctionBegin;
27599566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
27609566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
27613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
276216b64355SHong Zhang }
276316b64355SHong Zhang 
276489a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
2765ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2766d71ae5a4SJacob Faibussowitsch {
27672d033e1fSHong Zhang   PetscInt     i;
27680fb991dcSHong Zhang   Mat          C;
27690fb991dcSHong Zhang   Mat_SeqAIJ  *c;
27700fb991dcSHong Zhang   Mat_SubSppt *submatj;
27712d033e1fSHong Zhang 
27722d033e1fSHong Zhang   PetscFunctionBegin;
27732d033e1fSHong Zhang   for (i = 0; i < n; i++) {
27740fb991dcSHong Zhang     C       = (*mat)[i];
27750fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
27760fb991dcSHong Zhang     submatj = c->submatis1;
27772d033e1fSHong Zhang     if (submatj) {
2778682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
277926cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27809566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27819566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27829566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27833faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27849566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27859566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27869566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2787682e4c99SStefano Zampini       }
27882d033e1fSHong Zhang     } else {
27899566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
27902d033e1fSHong Zhang     }
27912d033e1fSHong Zhang   }
279286e85357SHong Zhang 
279363a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
27949566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
279563a75b2aSHong Zhang 
27969566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
27973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
27982d033e1fSHong Zhang }
27992d033e1fSHong Zhang 
2800ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2801d71ae5a4SJacob Faibussowitsch {
280297f1f81fSBarry Smith   PetscInt i;
2803cddf8d76SBarry Smith 
28043a40ed3dSBarry Smith   PetscFunctionBegin;
280548a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2806cddf8d76SBarry Smith 
280748a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
28083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2809cddf8d76SBarry Smith }
2810cddf8d76SBarry Smith 
2811ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2812d71ae5a4SJacob Faibussowitsch {
2813e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28149a88ca10SBarry Smith   PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
28155d0c19d7SBarry Smith   const PetscInt *idx;
28169a88ca10SBarry Smith   PetscInt        start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1;
2817f1af5d2fSBarry Smith   PetscBT         table;
2818bbd702dbSSatish Balay 
28193a40ed3dSBarry Smith   PetscFunctionBegin;
28209a88ca10SBarry Smith   m  = A->rmap->n / bs;
2821e4d965acSSatish Balay   ai = a->i;
2822bfeeae90SHong Zhang   aj = a->j;
28238a047759SSatish Balay 
282408401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
282506763907SSatish Balay 
28269566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
28279566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
282806763907SSatish Balay 
2829e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2830b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2831e4d965acSSatish Balay     isz = 0;
28329566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2833e4d965acSSatish Balay 
2834e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28359566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
28369566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2837e4d965acSSatish Balay 
28389a88ca10SBarry Smith     if (bs > 1) {
28399a88ca10SBarry Smith       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
28409a88ca10SBarry Smith       for (j = 0; j < n; ++j) {
28419a88ca10SBarry Smith         if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
28429a88ca10SBarry Smith       }
28439a88ca10SBarry Smith       PetscCall(ISRestoreIndices(is[i], &idx));
28449a88ca10SBarry Smith       PetscCall(ISDestroy(&is[i]));
28459a88ca10SBarry Smith 
28469a88ca10SBarry Smith       k = 0;
28479a88ca10SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
28489a88ca10SBarry Smith         n = isz;
28499a88ca10SBarry Smith         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
28509a88ca10SBarry Smith           for (ll = 0; ll < bs; ll++) {
28519a88ca10SBarry Smith             row   = bs * nidx[k] + ll;
28529a88ca10SBarry Smith             start = ai[row];
28539a88ca10SBarry Smith             end   = ai[row + 1];
28549a88ca10SBarry Smith             for (l = start; l < end; l++) {
28559a88ca10SBarry Smith               val = aj[l] / bs;
28569a88ca10SBarry Smith               if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
28579a88ca10SBarry Smith             }
28589a88ca10SBarry Smith           }
28599a88ca10SBarry Smith         }
28609a88ca10SBarry Smith       }
28619a88ca10SBarry Smith       PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i)));
28629a88ca10SBarry Smith     } else {
2863dd097bc3SLois Curfman McInnes       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2864e4d965acSSatish Balay       for (j = 0; j < n; ++j) {
28652205254eSKarl Rupp         if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
28664dcbc457SBarry Smith       }
28679566063dSJacob Faibussowitsch       PetscCall(ISRestoreIndices(is[i], &idx));
28689566063dSJacob Faibussowitsch       PetscCall(ISDestroy(&is[i]));
2869e4d965acSSatish Balay 
287004a348a9SBarry Smith       k = 0;
287104a348a9SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
287204a348a9SBarry Smith         n = isz;
287306763907SSatish Balay         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2874e4d965acSSatish Balay           row   = nidx[k];
2875e4d965acSSatish Balay           start = ai[row];
2876e4d965acSSatish Balay           end   = ai[row + 1];
287704a348a9SBarry Smith           for (l = start; l < end; l++) {
2878efb16452SHong Zhang             val = aj[l];
28792205254eSKarl Rupp             if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2880e4d965acSSatish Balay           }
2881e4d965acSSatish Balay         }
2882e4d965acSSatish Balay       }
28839566063dSJacob Faibussowitsch       PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i)));
2884e4d965acSSatish Balay     }
28859a88ca10SBarry Smith   }
28869566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
28879566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
28883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28894dcbc457SBarry Smith }
289017ab2063SBarry Smith 
2891ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2892d71ae5a4SJacob Faibussowitsch {
28930513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28943b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
28955d0c19d7SBarry Smith   const PetscInt *row, *col;
28965d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
289756cd22aeSBarry Smith   IS              icolp, irowp;
28980298fd71SBarry Smith   PetscInt       *cwork = NULL;
28990298fd71SBarry Smith   PetscScalar    *vwork = NULL;
29000513a670SBarry Smith 
29013a40ed3dSBarry Smith   PetscFunctionBegin;
29029566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
29039566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
29049566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
29059566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
29060513a670SBarry Smith 
29070513a670SBarry Smith   /* determine lengths of permuted rows */
29089566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
29092205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
29109566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
29119566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
29129566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
29139566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
29149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
29159566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
29160513a670SBarry Smith 
29179566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
29180513a670SBarry Smith   for (i = 0; i < m; i++) {
29199566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29202205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
29219566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
29229566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29230513a670SBarry Smith   }
29249566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
29252205254eSKarl Rupp 
29263c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
29272205254eSKarl Rupp 
29288c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
29299566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
29309fe5e383SStefano Zampini #endif
29319566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
29329566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
29339566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
29349566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
29359566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
29369566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
293748a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
29383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29390513a670SBarry Smith }
29400513a670SBarry Smith 
2941d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2942d71ae5a4SJacob Faibussowitsch {
2943cb5b572fSBarry Smith   PetscFunctionBegin;
294433f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
294533f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2946be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2947be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
29482e5835c6SStefano Zampini     const PetscScalar *aa;
2949be6bf707SBarry Smith 
29509566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
295108401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
29529566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n]));
29539566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
29549566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
2955cb5b572fSBarry Smith   } else {
29569566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2957cb5b572fSBarry Smith   }
29583ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2959cb5b572fSBarry Smith }
2960cb5b572fSBarry Smith 
2961d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2962d71ae5a4SJacob Faibussowitsch {
29636c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
29646e111a19SKarl Rupp 
29656c0721eeSBarry Smith   PetscFunctionBegin;
29666c0721eeSBarry Smith   *array = a->a;
29673ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29686c0721eeSBarry Smith }
29696c0721eeSBarry Smith 
2970d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2971d71ae5a4SJacob Faibussowitsch {
29726c0721eeSBarry Smith   PetscFunctionBegin;
2973f38c1e66SStefano Zampini   *array = NULL;
29743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29756c0721eeSBarry Smith }
2976273d9f13SBarry Smith 
29778229c054SShri Abhyankar /*
29788229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29798229c054SShri Abhyankar    have different nonzero structure.
29808229c054SShri Abhyankar */
2981d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2982d71ae5a4SJacob Faibussowitsch {
2983b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2984ec7775f6SShri Abhyankar 
2985ec7775f6SShri Abhyankar   PetscFunctionBegin;
2986ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2987ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
29888e3a54c0SPierre Jolivet     const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]);
2989b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
2990b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
29918af7cee1SJed Brown     nnz[i] = 0;
29928af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
2993b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
2994b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
29958af7cee1SJed Brown       nnz[i]++;
29968af7cee1SJed Brown     }
29978af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
2998ec7775f6SShri Abhyankar   }
29993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3000ec7775f6SShri Abhyankar }
3001ec7775f6SShri Abhyankar 
3002d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
3003d71ae5a4SJacob Faibussowitsch {
3004b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
3005b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
3006b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
3007b264fe52SHong Zhang 
3008b264fe52SHong Zhang   PetscFunctionBegin;
3009b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
30109566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
30113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3012b264fe52SHong Zhang }
3013b264fe52SHong Zhang 
3014d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
3015d71ae5a4SJacob Faibussowitsch {
3016ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
3017ac90fabeSBarry Smith 
3018ac90fabeSBarry Smith   PetscFunctionBegin;
3019134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
3020134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
3021134adf20SPierre Jolivet     if (e) {
30229566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
302381fa06acSBarry Smith       if (e) {
30249566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
3025134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
302681fa06acSBarry Smith       }
302781fa06acSBarry Smith     }
302854c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
302981fa06acSBarry Smith   }
3030ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
30312e5835c6SStefano Zampini     const PetscScalar *xa;
30322e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
303381fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
303481fa06acSBarry Smith 
30359566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
30369566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
30379566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
3038792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
30399566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
30409566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
30419566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
30429566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
30439566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
3044ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
30459566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
3046ac90fabeSBarry Smith   } else {
30478229c054SShri Abhyankar     Mat       B;
30488229c054SShri Abhyankar     PetscInt *nnz;
30499566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
30509566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
30519566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
30529566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
30539566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
30549566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
30559566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
30569566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
30579566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
30589bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
30599566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
3060ac90fabeSBarry Smith   }
30613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3062ac90fabeSBarry Smith }
3063ac90fabeSBarry Smith 
3064d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
3065d71ae5a4SJacob Faibussowitsch {
3066354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3067354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
3068354c94deSBarry Smith   PetscInt     i, nz;
3069354c94deSBarry Smith   PetscScalar *a;
3070354c94deSBarry Smith 
3071354c94deSBarry Smith   PetscFunctionBegin;
3072354c94deSBarry Smith   nz = aij->nz;
30739566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
30742205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
30759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
3076354c94deSBarry Smith #else
3077354c94deSBarry Smith   PetscFunctionBegin;
3078354c94deSBarry Smith #endif
30793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3080354c94deSBarry Smith }
3081354c94deSBarry Smith 
3082ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3083d71ae5a4SJacob Faibussowitsch {
3084e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3085d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3086e34fafa9SBarry Smith   PetscReal        atmp;
3087985db425SBarry Smith   PetscScalar     *x;
3088ce496241SStefano Zampini   const MatScalar *aa, *av;
3089e34fafa9SBarry Smith 
3090e34fafa9SBarry Smith   PetscFunctionBegin;
309128b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
30929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3093ce496241SStefano Zampini   aa = av;
3094e34fafa9SBarry Smith   ai = a->i;
3095e34fafa9SBarry Smith   aj = a->j;
3096e34fafa9SBarry Smith 
30979566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
30989566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
30999566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
310008401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3101e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
31029371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31039371c9d4SSatish Balay     ai++;
3104e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3105985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
31069371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
31079371c9d4SSatish Balay         x[i] = atmp;
31089371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31099371c9d4SSatish Balay       }
31109371c9d4SSatish Balay       aa++;
31119371c9d4SSatish Balay       aj++;
3112985db425SBarry Smith     }
3113985db425SBarry Smith   }
31149566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3117985db425SBarry Smith }
3118985db425SBarry Smith 
3119eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v)
3120eede4a3fSMark Adams {
3121eede4a3fSMark Adams   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3122eede4a3fSMark Adams   PetscInt         i, j, m = A->rmap->n, *ai, ncols, n;
3123eede4a3fSMark Adams   PetscScalar     *x;
3124eede4a3fSMark Adams   const MatScalar *aa, *av;
3125eede4a3fSMark Adams 
3126eede4a3fSMark Adams   PetscFunctionBegin;
3127eede4a3fSMark Adams   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3128eede4a3fSMark Adams   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3129eede4a3fSMark Adams   aa = av;
3130eede4a3fSMark Adams   ai = a->i;
3131eede4a3fSMark Adams 
3132eede4a3fSMark Adams   PetscCall(VecSet(v, 0.0));
3133eede4a3fSMark Adams   PetscCall(VecGetArrayWrite(v, &x));
3134eede4a3fSMark Adams   PetscCall(VecGetLocalSize(v, &n));
3135eede4a3fSMark Adams   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3136eede4a3fSMark Adams   for (i = 0; i < m; i++) {
3137eede4a3fSMark Adams     ncols = ai[1] - ai[0];
3138eede4a3fSMark Adams     ai++;
3139eede4a3fSMark Adams     for (j = 0; j < ncols; j++) {
3140eede4a3fSMark Adams       x[i] += PetscAbsScalar(*aa);
3141eede4a3fSMark Adams       aa++;
3142eede4a3fSMark Adams     }
3143eede4a3fSMark Adams   }
3144eede4a3fSMark Adams   PetscCall(VecRestoreArrayWrite(v, &x));
3145eede4a3fSMark Adams   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3146eede4a3fSMark Adams   PetscFunctionReturn(PETSC_SUCCESS);
3147eede4a3fSMark Adams }
3148eede4a3fSMark Adams 
3149ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3150d71ae5a4SJacob Faibussowitsch {
3151985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3152d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3153985db425SBarry Smith   PetscScalar     *x;
3154ce496241SStefano Zampini   const MatScalar *aa, *av;
3155985db425SBarry Smith 
3156985db425SBarry Smith   PetscFunctionBegin;
315728b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31589566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3159ce496241SStefano Zampini   aa = av;
3160985db425SBarry Smith   ai = a->i;
3161985db425SBarry Smith   aj = a->j;
3162985db425SBarry Smith 
31639566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31649566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31659566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
316608401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3167985db425SBarry Smith   for (i = 0; i < m; i++) {
31689371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31699371c9d4SSatish Balay     ai++;
3170d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31719371c9d4SSatish Balay       x[i] = *aa;
31729371c9d4SSatish Balay       if (idx) idx[i] = 0;
3173985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3174985db425SBarry Smith       x[i] = 0.0;
3175985db425SBarry Smith       if (idx) {
3176985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3177985db425SBarry Smith           if (aj[j] > j) {
3178985db425SBarry Smith             idx[i] = j;
3179985db425SBarry Smith             break;
3180985db425SBarry Smith           }
3181985db425SBarry Smith         }
31821a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31831a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3184985db425SBarry Smith       }
3185985db425SBarry Smith     }
3186985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31879371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31889371c9d4SSatish Balay         x[i] = *aa;
31899371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31909371c9d4SSatish Balay       }
31919371c9d4SSatish Balay       aa++;
31929371c9d4SSatish Balay       aj++;
3193985db425SBarry Smith     }
3194985db425SBarry Smith   }
31959566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3198985db425SBarry Smith }
3199985db425SBarry Smith 
3200ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3201d71ae5a4SJacob Faibussowitsch {
3202c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3203c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3204ce496241SStefano Zampini   PetscScalar     *x;
3205ce496241SStefano Zampini   const MatScalar *aa, *av;
3206c87e5d42SMatthew Knepley 
3207c87e5d42SMatthew Knepley   PetscFunctionBegin;
32089566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3209ce496241SStefano Zampini   aa = av;
3210c87e5d42SMatthew Knepley   ai = a->i;
3211c87e5d42SMatthew Knepley   aj = a->j;
3212c87e5d42SMatthew Knepley 
32139566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
32149566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32159566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
321608401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3217c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
32189371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32199371c9d4SSatish Balay     ai++;
3220f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
32219371c9d4SSatish Balay       x[i] = *aa;
32229371c9d4SSatish Balay       if (idx) idx[i] = 0;
3223f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3224f07e67edSHong Zhang       x[i] = 0.0;
3225f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3226289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3227f07e67edSHong Zhang           if (aj[j] > j) {
3228f07e67edSHong Zhang             idx[i] = j;
32292205254eSKarl Rupp             break;
32302205254eSKarl Rupp           }
3231289a08f5SMatthew Knepley         }
3232f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3233f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3234f07e67edSHong Zhang       }
3235289a08f5SMatthew Knepley     }
3236c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
32379371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
32389371c9d4SSatish Balay         x[i] = *aa;
32399371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32409371c9d4SSatish Balay       }
32419371c9d4SSatish Balay       aa++;
32429371c9d4SSatish Balay       aj++;
3243c87e5d42SMatthew Knepley     }
3244c87e5d42SMatthew Knepley   }
32459566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32469566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32473ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3248c87e5d42SMatthew Knepley }
3249c87e5d42SMatthew Knepley 
3250ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3251d71ae5a4SJacob Faibussowitsch {
3252985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3253d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3254d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3255985db425SBarry Smith   PetscScalar     *x;
3256ce496241SStefano Zampini   const MatScalar *aa, *av;
3257985db425SBarry Smith 
3258985db425SBarry Smith   PetscFunctionBegin;
325928b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
32609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3261ce496241SStefano Zampini   aa = av;
3262985db425SBarry Smith   ai = a->i;
3263985db425SBarry Smith   aj = a->j;
3264985db425SBarry Smith 
32659566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
32669566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32679566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
326808401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3269985db425SBarry Smith   for (i = 0; i < m; i++) {
32709371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32719371c9d4SSatish Balay     ai++;
3272d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
32739371c9d4SSatish Balay       x[i] = *aa;
32749371c9d4SSatish Balay       if (idx) idx[i] = 0;
3275985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3276985db425SBarry Smith       x[i] = 0.0;
3277985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3278985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3279985db425SBarry Smith           if (aj[j] > j) {
3280985db425SBarry Smith             idx[i] = j;
3281985db425SBarry Smith             break;
3282985db425SBarry Smith           }
3283985db425SBarry Smith         }
3284fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3285fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3286985db425SBarry Smith       }
3287985db425SBarry Smith     }
3288985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32899371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32909371c9d4SSatish Balay         x[i] = *aa;
32919371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32929371c9d4SSatish Balay       }
32939371c9d4SSatish Balay       aa++;
32949371c9d4SSatish Balay       aj++;
3295e34fafa9SBarry Smith     }
3296e34fafa9SBarry Smith   }
32979566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3300e34fafa9SBarry Smith }
3301bbead8a2SBarry Smith 
3302ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3303d71ae5a4SJacob Faibussowitsch {
3304bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
330533d57670SJed Brown   PetscInt        i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3306bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
33070da83c2eSBarry Smith   const PetscReal shift = 0.0;
33081a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3309bbead8a2SBarry Smith 
3310bbead8a2SBarry Smith   PetscFunctionBegin;
3311a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
33124a0d0026SBarry Smith   if (a->ibdiagvalid) {
33134a0d0026SBarry Smith     if (values) *values = a->ibdiag;
33143ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
33154a0d0026SBarry Smith   }
33169566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
33174dfa11a4SJacob Faibussowitsch   if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); }
3318bbead8a2SBarry Smith   diag = a->ibdiag;
3319bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3320bbead8a2SBarry Smith   /* factor and invert each block */
3321bbead8a2SBarry Smith   switch (bs) {
3322bbead8a2SBarry Smith   case 1:
3323bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33249566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3325ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3326ec1892c8SHong Zhang         if (allowzeropivot) {
33277b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33287b6c816cSBarry Smith           A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
33297b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
33309566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
333198921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
3332ec1892c8SHong Zhang       }
3333bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3334bbead8a2SBarry Smith     }
3335bbead8a2SBarry Smith     break;
3336bbead8a2SBarry Smith   case 2:
3337bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33389371c9d4SSatish Balay       ij[0] = 2 * i;
33399371c9d4SSatish Balay       ij[1] = 2 * i + 1;
33409566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
33419566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
33427b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33439566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3344bbead8a2SBarry Smith       diag += 4;
3345bbead8a2SBarry Smith     }
3346bbead8a2SBarry Smith     break;
3347bbead8a2SBarry Smith   case 3:
3348bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33499371c9d4SSatish Balay       ij[0] = 3 * i;
33509371c9d4SSatish Balay       ij[1] = 3 * i + 1;
33519371c9d4SSatish Balay       ij[2] = 3 * i + 2;
33529566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
33539566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
33547b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33559566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3356bbead8a2SBarry Smith       diag += 9;
3357bbead8a2SBarry Smith     }
3358bbead8a2SBarry Smith     break;
3359bbead8a2SBarry Smith   case 4:
3360bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33619371c9d4SSatish Balay       ij[0] = 4 * i;
33629371c9d4SSatish Balay       ij[1] = 4 * i + 1;
33639371c9d4SSatish Balay       ij[2] = 4 * i + 2;
33649371c9d4SSatish Balay       ij[3] = 4 * i + 3;
33659566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
33669566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
33677b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33689566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3369bbead8a2SBarry Smith       diag += 16;
3370bbead8a2SBarry Smith     }
3371bbead8a2SBarry Smith     break;
3372bbead8a2SBarry Smith   case 5:
3373bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33749371c9d4SSatish Balay       ij[0] = 5 * i;
33759371c9d4SSatish Balay       ij[1] = 5 * i + 1;
33769371c9d4SSatish Balay       ij[2] = 5 * i + 2;
33779371c9d4SSatish Balay       ij[3] = 5 * i + 3;
33789371c9d4SSatish Balay       ij[4] = 5 * i + 4;
33799566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
33809566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
33817b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33829566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3383bbead8a2SBarry Smith       diag += 25;
3384bbead8a2SBarry Smith     }
3385bbead8a2SBarry Smith     break;
3386bbead8a2SBarry Smith   case 6:
3387bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33889371c9d4SSatish Balay       ij[0] = 6 * i;
33899371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33909371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33919371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33929371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33939371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33949566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33959566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33967b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33979566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3398bbead8a2SBarry Smith       diag += 36;
3399bbead8a2SBarry Smith     }
3400bbead8a2SBarry Smith     break;
3401bbead8a2SBarry Smith   case 7:
3402bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
34039371c9d4SSatish Balay       ij[0] = 7 * i;
34049371c9d4SSatish Balay       ij[1] = 7 * i + 1;
34059371c9d4SSatish Balay       ij[2] = 7 * i + 2;
34069371c9d4SSatish Balay       ij[3] = 7 * i + 3;
34079371c9d4SSatish Balay       ij[4] = 7 * i + 4;
34089371c9d4SSatish Balay       ij[5] = 7 * i + 5;
3409cdd8bf47SJunchao Zhang       ij[6] = 7 * i + 6;
34109566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
34119566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
34127b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34139566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3414bbead8a2SBarry Smith       diag += 49;
3415bbead8a2SBarry Smith     }
3416bbead8a2SBarry Smith     break;
3417bbead8a2SBarry Smith   default:
34189566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3419bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3420ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
34219566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
34229566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
34237b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34249566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3425bbead8a2SBarry Smith       diag += bs2;
3426bbead8a2SBarry Smith     }
34279566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3428bbead8a2SBarry Smith   }
3429bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
34303ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3431bbead8a2SBarry Smith }
3432bbead8a2SBarry Smith 
3433d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3434d71ae5a4SJacob Faibussowitsch {
343573a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3436fff043a9SJunchao Zhang   PetscScalar a, *aa;
343773a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
343873a71a0fSBarry Smith 
343973a71a0fSBarry Smith   PetscFunctionBegin;
344073a71a0fSBarry Smith   if (!x->assembled) {
34419566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
344273a71a0fSBarry Smith     for (i = 0; i < m; i++) {
344373a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
34449566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
344573a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
34469566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
344773a71a0fSBarry Smith       }
344873a71a0fSBarry Smith     }
3449e2ce353bSJunchao Zhang   } else {
34509566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
34519566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
34529566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3453e2ce353bSJunchao Zhang   }
34549566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34559566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
345773a71a0fSBarry Smith }
345873a71a0fSBarry Smith 
3459679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3460d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3461d71ae5a4SJacob Faibussowitsch {
3462679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3463679944adSJunchao Zhang   PetscScalar a;
3464679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3465679944adSJunchao Zhang 
3466679944adSJunchao Zhang   PetscFunctionBegin;
3467679944adSJunchao Zhang   nskip = high - low;
34689566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3469679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3470679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3471679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
34729566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3473679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3474679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
34759566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3476679944adSJunchao Zhang     }
3477e2ce353bSJunchao Zhang   }
34789566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34799566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3481679944adSJunchao Zhang }
3482679944adSJunchao Zhang 
34830a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3484cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3485cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3486cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
348797304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34887c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34897c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3490f4259b30SLisandro Dalcin                                        NULL,
3491f4259b30SLisandro Dalcin                                        NULL,
3492f4259b30SLisandro Dalcin                                        NULL,
3493f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3494cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3495f4259b30SLisandro Dalcin                                        NULL,
349641f059aeSBarry Smith                                        MatSOR_SeqAIJ,
349791e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
349897304618SKris Buschelman                                        /*1 5*/ MatGetInfo_SeqAIJ,
3499cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3500cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3501cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3502cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3503f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3504cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3505cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3506cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3507d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3508f4259b30SLisandro Dalcin                                        NULL,
3509f4259b30SLisandro Dalcin                                        NULL,
3510f4259b30SLisandro Dalcin                                        NULL,
3511f4259b30SLisandro Dalcin                                        NULL,
351226cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
3513f4259b30SLisandro Dalcin                                        NULL,
3514f4259b30SLisandro Dalcin                                        NULL,
3515f4259b30SLisandro Dalcin                                        NULL,
3516f4259b30SLisandro Dalcin                                        NULL,
3517d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3518f4259b30SLisandro Dalcin                                        NULL,
3519f4259b30SLisandro Dalcin                                        NULL,
3520cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3521f4259b30SLisandro Dalcin                                        NULL,
3522d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
35237dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3524cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3525cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3526cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3527d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3528cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
35297d68702bSBarry Smith                                        MatShift_SeqAIJ,
353079299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
35316e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
353273a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
35333b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
35343b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
35353b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3536a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
353793dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3538f4259b30SLisandro Dalcin                                        NULL,
3539f4259b30SLisandro Dalcin                                        NULL,
3540cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3541f4259b30SLisandro Dalcin                                        NULL,
3542f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3543b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3544b9b97703SBarry Smith                                        MatView_SeqAIJ,
3545f4259b30SLisandro Dalcin                                        NULL,
3546f4259b30SLisandro Dalcin                                        NULL,
3547f4259b30SLisandro Dalcin                                        /* 64*/ NULL,
3548321b30b9SSatish Balay                                        MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3549f4259b30SLisandro Dalcin                                        NULL,
3550f4259b30SLisandro Dalcin                                        NULL,
3551f4259b30SLisandro Dalcin                                        NULL,
3552d519adbfSMatthew Knepley                                        /* 69*/ MatGetRowMaxAbs_SeqAIJ,
3553c87e5d42SMatthew Knepley                                        MatGetRowMinAbs_SeqAIJ,
3554f4259b30SLisandro Dalcin                                        NULL,
3555f4259b30SLisandro Dalcin                                        NULL,
3556f4259b30SLisandro Dalcin                                        NULL,
3557f4259b30SLisandro Dalcin                                        /* 74*/ NULL,
35583acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3559f4259b30SLisandro Dalcin                                        NULL,
3560f4259b30SLisandro Dalcin                                        NULL,
3561f4259b30SLisandro Dalcin                                        NULL,
35626ce1633cSBarry Smith                                        /* 79*/ MatFindZeroDiagonals_SeqAIJ,
3563f4259b30SLisandro Dalcin                                        NULL,
3564f4259b30SLisandro Dalcin                                        NULL,
3565f4259b30SLisandro Dalcin                                        NULL,
3566bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
35676cff0a6bSPierre Jolivet                                        /* 84*/ NULL,
35686cff0a6bSPierre Jolivet                                        NULL,
3569f4259b30SLisandro Dalcin                                        NULL,
3570f4259b30SLisandro Dalcin                                        NULL,
3571f4259b30SLisandro Dalcin                                        NULL,
3572f4259b30SLisandro Dalcin                                        /* 89*/ NULL,
3573f4259b30SLisandro Dalcin                                        NULL,
357426be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
3575f4259b30SLisandro Dalcin                                        NULL,
3576f4259b30SLisandro Dalcin                                        NULL,
35778fa4b5a6SHong Zhang                                        /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3578f4259b30SLisandro Dalcin                                        NULL,
3579f4259b30SLisandro Dalcin                                        NULL,
35806fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
3581f4259b30SLisandro Dalcin                                        NULL,
35824222ddf1SHong Zhang                                        /* 99*/ MatProductSetFromOptions_SeqAIJ,
3583f4259b30SLisandro Dalcin                                        NULL,
3584f4259b30SLisandro Dalcin                                        NULL,
358587d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
3586f4259b30SLisandro Dalcin                                        NULL,
3587d519adbfSMatthew Knepley                                        /*104*/ MatSetValuesRow_SeqAIJ,
358899cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3589f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3590f4259b30SLisandro Dalcin                                        NULL,
3591f4259b30SLisandro Dalcin                                        NULL,
3592cbd44569SHong Zhang                                        /*109*/ MatMatSolve_SeqAIJ,
3593f4259b30SLisandro Dalcin                                        NULL,
35942af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3595f4259b30SLisandro Dalcin                                        NULL,
3596599ef60dSHong Zhang                                        MatMissingDiagonal_SeqAIJ,
3597f4259b30SLisandro Dalcin                                        /*114*/ NULL,
3598f4259b30SLisandro Dalcin                                        NULL,
3599f4259b30SLisandro Dalcin                                        NULL,
3600f4259b30SLisandro Dalcin                                        NULL,
3601f4259b30SLisandro Dalcin                                        NULL,
3602f4259b30SLisandro Dalcin                                        /*119*/ NULL,
3603f4259b30SLisandro Dalcin                                        NULL,
3604f4259b30SLisandro Dalcin                                        NULL,
3605f4259b30SLisandro Dalcin                                        NULL,
3606b3a44c85SBarry Smith                                        MatGetMultiProcBlock_SeqAIJ,
36070716a85fSBarry Smith                                        /*124*/ MatFindNonzeroRows_SeqAIJ,
3608a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
360937868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
36100da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
3611f4259b30SLisandro Dalcin                                        NULL,
3612f4259b30SLisandro Dalcin                                        /*129*/ NULL,
3613f4259b30SLisandro Dalcin                                        NULL,
3614f4259b30SLisandro Dalcin                                        NULL,
361575648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3616b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
3617b9af6bddSHong Zhang                                        /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
36182b8ad9a3SHong Zhang                                        MatTransColoringApplyDenToSp_SeqAIJ,
3619f4259b30SLisandro Dalcin                                        NULL,
3620f4259b30SLisandro Dalcin                                        NULL,
36213964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
3622f4259b30SLisandro Dalcin                                        /*139*/ NULL,
3623f4259b30SLisandro Dalcin                                        NULL,
3624f4259b30SLisandro Dalcin                                        NULL,
36253a062f41SBarry Smith                                        MatFDColoringSetUp_SeqXAIJ,
36269c8f2541SHong Zhang                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
36274222ddf1SHong Zhang                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
36284222ddf1SHong Zhang                                        /*145*/ MatDestroySubMatrices_SeqAIJ,
3629f4259b30SLisandro Dalcin                                        NULL,
363072833a62Smarkadams4                                        NULL,
363172833a62Smarkadams4                                        MatCreateGraph_Simple_AIJ,
36322d776b49SBarry Smith                                        NULL,
3633dec0b466SHong Zhang                                        /*150*/ MatTransposeSymbolic_SeqAIJ,
3634eede4a3fSMark Adams                                        MatEliminateZeros_SeqAIJ,
36354cc2b5b5SPierre Jolivet                                        MatGetRowSumAbs_SeqAIJ,
36364cc2b5b5SPierre Jolivet                                        NULL};
363717ab2063SBarry Smith 
3638ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3639d71ae5a4SJacob Faibussowitsch {
3640bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
364197f1f81fSBarry Smith   PetscInt    i, nz, n;
3642bef8e0ddSBarry Smith 
3643bef8e0ddSBarry Smith   PetscFunctionBegin;
3644bef8e0ddSBarry Smith   nz = aij->maxnz;
3645d0f46423SBarry Smith   n  = mat->rmap->n;
3646ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3647bef8e0ddSBarry Smith   aij->nz = nz;
3648ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
36493ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3650bef8e0ddSBarry Smith }
3651bef8e0ddSBarry Smith 
3652a3bb6f32SFande Kong /*
3653ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3654ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3655ddea5d60SJunchao Zhang  */
3656d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3657d71ae5a4SJacob Faibussowitsch {
3658a3bb6f32SFande Kong   Mat_SeqAIJ   *aij = (Mat_SeqAIJ *)mat->data;
3659eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1;
3660eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
366125b670f0SStefano Zampini   PetscInt      gid, lid, i, ec, nz = aij->nz;
366225b670f0SStefano Zampini   PetscInt     *garray, *jj = aij->j;
3663a3bb6f32SFande Kong 
3664a3bb6f32SFande Kong   PetscFunctionBegin;
3665a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
36664f572ea9SToby Isaac   PetscAssertPointer(mapping, 2);
3667a3bb6f32SFande Kong   /* use a table */
3668eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1));
3669a3bb6f32SFande Kong   ec = 0;
367025b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
367125b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
3672eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
3673a3bb6f32SFande Kong     if (!data) {
3674a3bb6f32SFande Kong       /* one based table */
3675c76ffc5fSJacob Faibussowitsch       PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec));
3676a3bb6f32SFande Kong     }
3677a3bb6f32SFande Kong   }
3678a3bb6f32SFande Kong   /* form array of columns we need */
36799566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
3680eec179cfSJacob Faibussowitsch   PetscHashIterBegin(gid1_lid1, tpos);
3681eec179cfSJacob Faibussowitsch   while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
3682eec179cfSJacob Faibussowitsch     PetscHashIterGetKey(gid1_lid1, tpos, gid);
3683eec179cfSJacob Faibussowitsch     PetscHashIterGetVal(gid1_lid1, tpos, lid);
3684eec179cfSJacob Faibussowitsch     PetscHashIterNext(gid1_lid1, tpos);
3685a3bb6f32SFande Kong     gid--;
3686a3bb6f32SFande Kong     lid--;
3687a3bb6f32SFande Kong     garray[lid] = gid;
3688a3bb6f32SFande Kong   }
36899566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
3690eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIClear(gid1_lid1));
3691c76ffc5fSJacob Faibussowitsch   for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1));
3692a3bb6f32SFande Kong   /* compact out the extra columns in B */
369325b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
369425b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
3695eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
3696a3bb6f32SFande Kong     lid--;
369725b670f0SStefano Zampini     jj[i] = lid;
3698a3bb6f32SFande Kong   }
36999566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
3700eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&gid1_lid1));
37019566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
37029566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
37039566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
37043ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3705a3bb6f32SFande Kong }
3706a3bb6f32SFande Kong 
3707bef8e0ddSBarry Smith /*@
3708bef8e0ddSBarry Smith   MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3709bef8e0ddSBarry Smith   in the matrix.
3710bef8e0ddSBarry Smith 
3711bef8e0ddSBarry Smith   Input Parameters:
371211a5261eSBarry Smith + mat     - the `MATSEQAIJ` matrix
3713bef8e0ddSBarry Smith - indices - the column indices
3714bef8e0ddSBarry Smith 
371515091d37SBarry Smith   Level: advanced
371615091d37SBarry Smith 
3717bef8e0ddSBarry Smith   Notes:
3718bef8e0ddSBarry Smith   This can be called if you have precomputed the nonzero structure of the
3719bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
372011a5261eSBarry Smith   of the `MatSetValues()` operation.
3721bef8e0ddSBarry Smith 
3722bef8e0ddSBarry Smith   You MUST have set the correct numbers of nonzeros per row in the call to
372311a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the columns indices MUST be sorted.
3724bef8e0ddSBarry Smith 
372511a5261eSBarry Smith   MUST be called before any calls to `MatSetValues()`
3726bef8e0ddSBarry Smith 
3727b9617806SBarry Smith   The indices should start with zero, not one.
3728b9617806SBarry Smith 
37291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
3730bef8e0ddSBarry Smith @*/
3731d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3732d71ae5a4SJacob Faibussowitsch {
3733bef8e0ddSBarry Smith   PetscFunctionBegin;
37340700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
37354f572ea9SToby Isaac   PetscAssertPointer(indices, 2);
3736cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
37373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3738bef8e0ddSBarry Smith }
3739bef8e0ddSBarry Smith 
3740ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3741d71ae5a4SJacob Faibussowitsch {
3742be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3743d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3744be6bf707SBarry Smith 
3745be6bf707SBarry Smith   PetscFunctionBegin;
374628b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3747be6bf707SBarry Smith 
3748be6bf707SBarry Smith   /* allocate space for values if not already there */
37494dfa11a4SJacob Faibussowitsch   if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }
3750be6bf707SBarry Smith 
3751be6bf707SBarry Smith   /* copy values over */
37529566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
37533ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3754be6bf707SBarry Smith }
3755be6bf707SBarry Smith 
3756be6bf707SBarry Smith /*@
375720f4b53cSBarry Smith   MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
3758be6bf707SBarry Smith   nonlinear portion.
3759be6bf707SBarry Smith 
3760c3339decSBarry Smith   Logically Collect
3761be6bf707SBarry Smith 
376227430b45SBarry Smith   Input Parameter:
376311a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3764be6bf707SBarry Smith 
376515091d37SBarry Smith   Level: advanced
376615091d37SBarry Smith 
37672920cce0SJacob Faibussowitsch   Example Usage:
376827430b45SBarry Smith .vb
37692ef1f0ffSBarry Smith     Using SNES
377027430b45SBarry Smith     Create Jacobian matrix
377127430b45SBarry Smith     Set linear terms into matrix
377227430b45SBarry Smith     Apply boundary conditions to matrix, at this time matrix must have
377327430b45SBarry Smith       final nonzero structure (i.e. setting the nonlinear terms and applying
377427430b45SBarry Smith       boundary conditions again will not change the nonzero structure
377527430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
377627430b45SBarry Smith     MatStoreValues(mat);
377727430b45SBarry Smith     Call SNESSetJacobian() with matrix
377827430b45SBarry Smith     In your Jacobian routine
377927430b45SBarry Smith       MatRetrieveValues(mat);
378027430b45SBarry Smith       Set nonlinear terms in matrix
3781be6bf707SBarry Smith 
378227430b45SBarry Smith     Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
378327430b45SBarry Smith     // build linear portion of Jacobian
378427430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
378527430b45SBarry Smith     MatStoreValues(mat);
378627430b45SBarry Smith     loop over nonlinear iterations
378727430b45SBarry Smith        MatRetrieveValues(mat);
378827430b45SBarry Smith        // call MatSetValues(mat,...) to set nonliner portion of Jacobian
378927430b45SBarry Smith        // call MatAssemblyBegin/End() on matrix
379027430b45SBarry Smith        Solve linear system with Jacobian
379127430b45SBarry Smith     endloop
379227430b45SBarry Smith .ve
3793be6bf707SBarry Smith 
3794be6bf707SBarry Smith   Notes:
3795da81f932SPierre Jolivet   Matrix must already be assembled before calling this routine
379611a5261eSBarry Smith   Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3797be6bf707SBarry Smith   calling this routine.
3798be6bf707SBarry Smith 
37990c468ba9SBarry Smith   When this is called multiple times it overwrites the previous set of stored values
38000c468ba9SBarry Smith   and does not allocated additional space.
38010c468ba9SBarry Smith 
3802fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
3803be6bf707SBarry Smith @*/
3804d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3805d71ae5a4SJacob Faibussowitsch {
3806be6bf707SBarry Smith   PetscFunctionBegin;
38070700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
380828b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
380928b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3810cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
38113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3812be6bf707SBarry Smith }
3813be6bf707SBarry Smith 
3814ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3815d71ae5a4SJacob Faibussowitsch {
3816be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3817d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3818be6bf707SBarry Smith 
3819be6bf707SBarry Smith   PetscFunctionBegin;
382028b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
382128b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3822be6bf707SBarry Smith   /* copy values over */
38239566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
38243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3825be6bf707SBarry Smith }
3826be6bf707SBarry Smith 
3827be6bf707SBarry Smith /*@
382820f4b53cSBarry Smith   MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`
3829be6bf707SBarry Smith 
3830c3339decSBarry Smith   Logically Collect
3831be6bf707SBarry Smith 
38322fe279fdSBarry Smith   Input Parameter:
383311a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3834be6bf707SBarry Smith 
383515091d37SBarry Smith   Level: advanced
383615091d37SBarry Smith 
38371cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
3838be6bf707SBarry Smith @*/
3839d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3840d71ae5a4SJacob Faibussowitsch {
3841be6bf707SBarry Smith   PetscFunctionBegin;
38420700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
384328b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
384428b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3845cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
38463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3847be6bf707SBarry Smith }
3848be6bf707SBarry Smith 
38495d83a8b1SBarry Smith /*@
385011a5261eSBarry Smith   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
38510d15e28bSLois Curfman McInnes   (the default parallel PETSc format).  For good matrix assembly performance
385220f4b53cSBarry Smith   the user should preallocate the matrix storage by setting the parameter `nz`
385320f4b53cSBarry Smith   (or the array `nnz`).
385417ab2063SBarry Smith 
3855d083f849SBarry Smith   Collective
3856db81eaa0SLois Curfman McInnes 
385717ab2063SBarry Smith   Input Parameters:
385811a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF`
385917ab2063SBarry Smith . m    - number of rows
386017ab2063SBarry Smith . n    - number of columns
386117ab2063SBarry Smith . nz   - number of nonzeros per row (same for all rows)
386251c19458SBarry Smith - nnz  - array containing the number of nonzeros in the various rows
38630298fd71SBarry Smith          (possibly different for each row) or NULL
386417ab2063SBarry Smith 
386517ab2063SBarry Smith   Output Parameter:
3866416022c9SBarry Smith . A - the matrix
386717ab2063SBarry Smith 
38682ef1f0ffSBarry Smith   Options Database Keys:
38692ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
38702ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38712ef1f0ffSBarry Smith 
38722ef1f0ffSBarry Smith   Level: intermediate
3873175b88e8SBarry Smith 
3874b259b22eSLois Curfman McInnes   Notes:
387577433607SBarry Smith   It is recommend to use `MatCreateFromOptions()` instead of this routine
387677433607SBarry Smith 
38772ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
387849a6f317SBarry Smith 
38792ef1f0ffSBarry Smith   The `MATSEQAIJ` format, also called
38802ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
38810002213bSLois Curfman McInnes   storage.  That is, the stored row and column indices can begin at
38822ef1f0ffSBarry Smith   either one (as in Fortran) or zero.
388317ab2063SBarry Smith 
388420f4b53cSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
38852ef1f0ffSBarry Smith   Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
388620f4b53cSBarry Smith   allocation.
388717ab2063SBarry Smith 
3888682d7d0cSBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
38894fca80b9SLois Curfman McInnes   improve numerical efficiency of matrix-vector products and solves. We
3890682d7d0cSBarry Smith   search for consecutive rows with the same nonzero structure, thereby
38916c7ebb05SLois Curfman McInnes   reusing matrix information to achieve increased efficiency.
38926c7ebb05SLois Curfman McInnes 
38931cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
389417ab2063SBarry Smith @*/
3895d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3896d71ae5a4SJacob Faibussowitsch {
38973a40ed3dSBarry Smith   PetscFunctionBegin;
38989566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
38999566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
39009566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
39019566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
39023ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3903273d9f13SBarry Smith }
3904273d9f13SBarry Smith 
39055d83a8b1SBarry Smith /*@
3906273d9f13SBarry Smith   MatSeqAIJSetPreallocation - For good matrix assembly performance
3907273d9f13SBarry Smith   the user should preallocate the matrix storage by setting the parameter nz
3908273d9f13SBarry Smith   (or the array nnz).  By setting these parameters accurately, performance
3909273d9f13SBarry Smith   during matrix assembly can be increased by more than a factor of 50.
3910273d9f13SBarry Smith 
3911d083f849SBarry Smith   Collective
3912273d9f13SBarry Smith 
3913273d9f13SBarry Smith   Input Parameters:
39141c4f3114SJed Brown + B   - The matrix
3915273d9f13SBarry Smith . nz  - number of nonzeros per row (same for all rows)
3916273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows
39170298fd71SBarry Smith          (possibly different for each row) or NULL
3918273d9f13SBarry Smith 
39192ef1f0ffSBarry Smith   Options Database Keys:
39202ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
39212ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
39222ef1f0ffSBarry Smith 
39232ef1f0ffSBarry Smith   Level: intermediate
39242ef1f0ffSBarry Smith 
3925273d9f13SBarry Smith   Notes:
39262ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
392749a6f317SBarry Smith 
392811a5261eSBarry Smith   The `MATSEQAIJ` format also called
39292ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
3930273d9f13SBarry Smith   storage.  That is, the stored row and column indices can begin at
3931273d9f13SBarry Smith   either one (as in Fortran) or zero.  See the users' manual for details.
3932273d9f13SBarry Smith 
39332ef1f0ffSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
39342ef1f0ffSBarry Smith   Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
39352ef1f0ffSBarry Smith   allocation.
3936273d9f13SBarry Smith 
393711a5261eSBarry Smith   You can call `MatGetInfo()` to get information on how effective the preallocation was;
3938aa95bbe8SBarry Smith   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3939aa95bbe8SBarry Smith   You can also run with the option -info and look for messages with the string
3940aa95bbe8SBarry Smith   malloc in them to see if additional memory allocation was needed.
3941aa95bbe8SBarry Smith 
394211a5261eSBarry Smith   Developer Notes:
394311a5261eSBarry Smith   Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3944a96a251dSBarry Smith   entries or columns indices
3945a96a251dSBarry Smith 
3946273d9f13SBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
3947273d9f13SBarry Smith   improve numerical efficiency of matrix-vector products and solves. We
3948273d9f13SBarry Smith   search for consecutive rows with the same nonzero structure, thereby
3949273d9f13SBarry Smith   reusing matrix information to achieve increased efficiency.
3950273d9f13SBarry Smith 
39511cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3952db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3953273d9f13SBarry Smith @*/
3954d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3955d71ae5a4SJacob Faibussowitsch {
3956a23d5eceSKris Buschelman   PetscFunctionBegin;
39576ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
39586ba663aaSJed Brown   PetscValidType(B, 1);
3959cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
39603ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3961a23d5eceSKris Buschelman }
3962a23d5eceSKris Buschelman 
3963d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3964d71ae5a4SJacob Faibussowitsch {
3965ad79cf63SBarry Smith   Mat_SeqAIJ *b              = (Mat_SeqAIJ *)B->data;
39662576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
396797f1f81fSBarry Smith   PetscInt    i;
3968273d9f13SBarry Smith 
3969273d9f13SBarry Smith   PetscFunctionBegin;
3970ad79cf63SBarry Smith   if (B->hash_active) {
3971aea10558SJacob Faibussowitsch     B->ops[0] = b->cops;
3972ad79cf63SBarry Smith     PetscCall(PetscHMapIJVDestroy(&b->ht));
3973ad79cf63SBarry Smith     PetscCall(PetscFree(b->dnz));
3974ad79cf63SBarry Smith     B->hash_active = PETSC_FALSE;
3975ad79cf63SBarry Smith   }
39762576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3977a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3978c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3979c461c341SBarry Smith     nz             = 0;
3980c461c341SBarry Smith   }
39819566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
39829566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3983899cda47SBarry Smith 
3984435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
398508401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
3986cf9c20a2SJed Brown   if (PetscUnlikelyDebug(nnz)) {
3987d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
398808401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
398908401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3990b73539f3SBarry Smith     }
3991b73539f3SBarry Smith   }
3992b73539f3SBarry Smith 
3993273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
3994ab93d7beSBarry Smith   if (!skipallocation) {
39954dfa11a4SJacob Faibussowitsch     if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); }
3996071fcb05SBarry Smith     if (!b->ilen) {
3997071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
39989566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
3999071fcb05SBarry Smith     } else {
40009566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
40012ee49352SLisandro Dalcin     }
4002aa624791SPierre Jolivet     if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre));
4003273d9f13SBarry Smith     if (!nnz) {
4004435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
4005c62bd62aSJed Brown       else if (nz < 0) nz = 1;
40065d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
4007d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
4008c43c4a61SBarry Smith       PetscCall(PetscIntMultError(nz, B->rmap->n, &nz));
4009273d9f13SBarry Smith     } else {
4010c73702f5SBarry Smith       PetscInt64 nz64 = 0;
40119371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
40129371c9d4SSatish Balay         b->imax[i] = nnz[i];
40139371c9d4SSatish Balay         nz64 += nnz[i];
40149371c9d4SSatish Balay       }
40159566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
4016273d9f13SBarry Smith     }
4017ab93d7beSBarry Smith 
4018273d9f13SBarry Smith     /* allocate the matrix space */
401953dd7562SDmitry Karpeev     /* FIXME: should B's old memory be unlogged? */
40209566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
4021396832f4SHong Zhang     if (B->structure_only) {
40229566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz, &b->j));
40239566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i));
4024396832f4SHong Zhang     } else {
40259566063dSJacob Faibussowitsch       PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i));
4026396832f4SHong Zhang     }
4027bfeeae90SHong Zhang     b->i[0] = 0;
4028ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
4029396832f4SHong Zhang     if (B->structure_only) {
4030396832f4SHong Zhang       b->singlemalloc = PETSC_FALSE;
4031396832f4SHong Zhang       b->free_a       = PETSC_FALSE;
4032396832f4SHong Zhang     } else {
4033273d9f13SBarry Smith       b->singlemalloc = PETSC_TRUE;
4034e6b907acSBarry Smith       b->free_a       = PETSC_TRUE;
4035396832f4SHong Zhang     }
4036e6b907acSBarry Smith     b->free_ij = PETSC_TRUE;
4037c461c341SBarry Smith   } else {
4038e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
4039e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
4040c461c341SBarry Smith   }
4041273d9f13SBarry Smith 
4042846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
4043846b4da1SFande Kong     /* reserve user-requested sparsity */
40449566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
4045846b4da1SFande Kong   }
4046846b4da1SFande Kong 
4047273d9f13SBarry Smith   b->nz               = 0;
4048273d9f13SBarry Smith   b->maxnz            = nz;
4049273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
40501baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
4051cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
4052cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
40535519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
40545519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
40555519a089SJose E. Roman   */
40565519a089SJose E. Roman   B->nonzerostate++;
40573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4058273d9f13SBarry Smith }
4059273d9f13SBarry Smith 
4060ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
4061d71ae5a4SJacob Faibussowitsch {
4062846b4da1SFande Kong   Mat_SeqAIJ *a;
4063a5bbaf83SFande Kong   PetscInt    i;
40641f14be2bSBarry Smith   PetscBool   skipreset;
4065846b4da1SFande Kong 
4066846b4da1SFande Kong   PetscFunctionBegin;
4067846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
406814d0e64fSAlex Lindsay 
406914d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
40703ba16761SJacob Faibussowitsch   if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS);
407114d0e64fSAlex Lindsay 
4072846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
40732c814fdeSFande Kong   /* if no saved info, we error out */
407428b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
40752c814fdeSFande Kong 
40761f14be2bSBarry Smith   PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation ");
40772c814fdeSFande Kong 
40781f14be2bSBarry Smith   PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset));
40791f14be2bSBarry Smith   if (!skipreset) {
40809566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
40819566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
4082846b4da1SFande Kong     a->i[0] = 0;
4083ad540459SPierre Jolivet     for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
4084846b4da1SFande Kong     A->preallocated     = PETSC_TRUE;
4085846b4da1SFande Kong     a->nz               = 0;
4086846b4da1SFande Kong     a->maxnz            = a->i[A->rmap->n];
4087846b4da1SFande Kong     A->info.nz_unneeded = (double)a->maxnz;
4088846b4da1SFande Kong     A->was_assembled    = PETSC_FALSE;
4089846b4da1SFande Kong     A->assembled        = PETSC_FALSE;
40901f14be2bSBarry Smith   }
40913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4092846b4da1SFande Kong }
4093846b4da1SFande Kong 
409458d36128SBarry Smith /*@
409511a5261eSBarry Smith   MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4096a1661176SMatthew Knepley 
4097a1661176SMatthew Knepley   Input Parameters:
4098a1661176SMatthew Knepley + B - the matrix
4099d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero)
4100d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row
4101d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided
4102a1661176SMatthew Knepley 
4103a1661176SMatthew Knepley   Level: developer
4104a1661176SMatthew Knepley 
41056a9b8d82SBarry Smith   Notes:
41062ef1f0ffSBarry Smith   The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
410758d36128SBarry Smith 
41086a9b8d82SBarry Smith   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
41096a9b8d82SBarry Smith   structure will be the union of all the previous nonzero structures.
41106a9b8d82SBarry Smith 
41116a9b8d82SBarry Smith   Developer Notes:
41122ef1f0ffSBarry Smith   An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and
41132ef1f0ffSBarry Smith   then just copies the `v` values directly with `PetscMemcpy()`.
41146a9b8d82SBarry Smith 
411511a5261eSBarry Smith   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
41166a9b8d82SBarry Smith 
4117fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()`
4118a1661176SMatthew Knepley @*/
4119d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4120d71ae5a4SJacob Faibussowitsch {
4121a1661176SMatthew Knepley   PetscFunctionBegin;
41220700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
41236ba663aaSJed Brown   PetscValidType(B, 1);
4124cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
41253ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4126a1661176SMatthew Knepley }
4127a1661176SMatthew Knepley 
4128ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4129d71ae5a4SJacob Faibussowitsch {
4130a1661176SMatthew Knepley   PetscInt  i;
4131a1661176SMatthew Knepley   PetscInt  m, n;
4132a1661176SMatthew Knepley   PetscInt  nz;
41336a9b8d82SBarry Smith   PetscInt *nnz;
4134a1661176SMatthew Knepley 
4135a1661176SMatthew Knepley   PetscFunctionBegin;
4136aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4137779a8d59SSatish Balay 
41389566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
41399566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4140779a8d59SSatish Balay 
41419566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
41429566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4143a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4144b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
414508401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4146a1661176SMatthew Knepley     nnz[i] = nz;
4147a1661176SMatthew Knepley   }
41489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
41499566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4150a1661176SMatthew Knepley 
41518e3a54c0SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES));
4152a1661176SMatthew Knepley 
41539566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
41549566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4155a1661176SMatthew Knepley 
41569566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
41573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4158a1661176SMatthew Knepley }
4159a1661176SMatthew Knepley 
4160ad7e164aSPierre Jolivet /*@
41612ef1f0ffSBarry Smith   MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`.
4162ad7e164aSPierre Jolivet 
4163ad7e164aSPierre Jolivet   Input Parameters:
4164ad7e164aSPierre Jolivet + A     - left-hand side matrix
4165ad7e164aSPierre Jolivet . B     - right-hand side matrix
416611a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4167ad7e164aSPierre Jolivet 
4168ad7e164aSPierre Jolivet   Output Parameter:
41692ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B`
4170ad7e164aSPierre Jolivet 
4171ad7e164aSPierre Jolivet   Level: intermediate
4172ad7e164aSPierre Jolivet 
417311a5261eSBarry Smith   Note:
417411a5261eSBarry Smith   `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`.
4175ad7e164aSPierre Jolivet 
41761cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4177ad7e164aSPierre Jolivet @*/
4178d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4179d71ae5a4SJacob Faibussowitsch {
4180ad7e164aSPierre Jolivet   PetscFunctionBegin;
4181ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4182ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4183ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4184ad7e164aSPierre Jolivet   PetscValidType(B, 2);
41854f572ea9SToby Isaac   PetscAssertPointer(C, 4);
4186ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4187ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4188ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4189ad7e164aSPierre Jolivet   }
4190cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
41913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4192ad7e164aSPierre Jolivet }
4193ad7e164aSPierre Jolivet 
4194ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4195d71ae5a4SJacob Faibussowitsch {
4196ad7e164aSPierre Jolivet   Mat                newmat;
4197ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4198ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4199ad7e164aSPierre Jolivet   PetscScalar       *v;
4200fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4201ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4202ad7e164aSPierre Jolivet   PetscBool          flg;
4203ad7e164aSPierre Jolivet 
4204ad7e164aSPierre Jolivet   PetscFunctionBegin;
420528b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
420628b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
420728b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
420828b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
42099566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
421028b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4211aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4212ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
42139566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
42149566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
42159566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
42169566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4217ad7e164aSPierre Jolivet     i[0] = 0;
4218ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4219ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4220ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4221ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4222ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4223ad7e164aSPierre Jolivet         }
4224ad7e164aSPierre Jolivet       }
4225ad7e164aSPierre Jolivet     }
42269566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4227ad7e164aSPierre Jolivet     *C = newmat;
42289566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4229ad7e164aSPierre Jolivet     nnz = 0;
4230ad7e164aSPierre Jolivet   }
42319566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
42329566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
42339566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4234ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4235ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4236ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4237ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4238ad7e164aSPierre Jolivet       }
4239ad7e164aSPierre Jolivet     }
4240ad7e164aSPierre Jolivet   }
42419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
42429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
42439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
42443ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4245ad7e164aSPierre Jolivet }
4246ad7e164aSPierre Jolivet 
4247c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4248af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4249170fe5c8SBarry Smith 
4250170fe5c8SBarry Smith /*
4251170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4252170fe5c8SBarry Smith 
4253170fe5c8SBarry Smith                n                       p                          p
42542da392ccSBarry Smith         [             ]       [             ]         [                 ]
42552da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
42562da392ccSBarry Smith         [             ]       [             ]         [                 ]
4257170fe5c8SBarry Smith 
4258170fe5c8SBarry Smith */
4259d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4260d71ae5a4SJacob Faibussowitsch {
4261170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4262170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4263170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
426486214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4265170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4266170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4267170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
426886214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
426986214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4270170fe5c8SBarry Smith 
4271170fe5c8SBarry Smith   PetscFunctionBegin;
4272d0f46423SBarry Smith   m = A->rmap->n;
4273d0f46423SBarry Smith   n = A->cmap->n;
4274d0f46423SBarry Smith   p = B->cmap->n;
4275170fe5c8SBarry Smith   a = sub_a->v;
4276170fe5c8SBarry Smith   b = sub_b->a;
4277170fe5c8SBarry Smith   c = sub_c->v;
427886214ceeSStefano Zampini   if (clda == m) {
42799566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
428086214ceeSStefano Zampini   } else {
428186214ceeSStefano Zampini     for (j = 0; j < p; j++)
42829371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
428386214ceeSStefano Zampini   }
4284170fe5c8SBarry Smith   ii  = sub_b->i;
4285170fe5c8SBarry Smith   idx = sub_b->j;
4286170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4287170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4288170fe5c8SBarry Smith     while (q-- > 0) {
428986214ceeSStefano Zampini       c_q = c + clda * (*idx);
429086214ceeSStefano Zampini       a_q = a + alda * i;
4291854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4292170fe5c8SBarry Smith       idx++;
4293170fe5c8SBarry Smith       b++;
4294170fe5c8SBarry Smith     }
4295170fe5c8SBarry Smith   }
42963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4297170fe5c8SBarry Smith }
4298170fe5c8SBarry Smith 
4299d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4300d71ae5a4SJacob Faibussowitsch {
4301d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
430286214ceeSStefano Zampini   PetscBool cisdense;
4303170fe5c8SBarry Smith 
4304170fe5c8SBarry Smith   PetscFunctionBegin;
430508401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
43069566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
43079566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
4308d5e393b6SSuyash Tandon   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, ""));
430948a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
43109566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4311d73949e8SHong Zhang 
43124222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
43133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4314170fe5c8SBarry Smith }
4315170fe5c8SBarry Smith 
43160bad9183SKris Buschelman /*MC
4317fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
43180bad9183SKris Buschelman    based on compressed sparse row format.
43190bad9183SKris Buschelman 
43202ef1f0ffSBarry Smith    Options Database Key:
43210bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
43220bad9183SKris Buschelman 
43230bad9183SKris Buschelman    Level: beginner
43240bad9183SKris Buschelman 
43250cd7f59aSBarry Smith    Notes:
43262ef1f0ffSBarry Smith     `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values,
43270cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
43280cd7f59aSBarry Smith     in the matrix
43290cd7f59aSBarry Smith 
    `MatSetOption`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored
43320cd7f59aSBarry Smith 
433311a5261eSBarry Smith   Developer Note:
43342ef1f0ffSBarry Smith     It would be nice if all matrix formats supported passing `NULL` in for the numerical values
43350cd7f59aSBarry Smith 
43361cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
43370bad9183SKris Buschelman M*/
43380bad9183SKris Buschelman 
4339ccd284c7SBarry Smith /*MC
4340ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4341ccd284c7SBarry Smith 
434211a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
434311a5261eSBarry Smith    and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
434411a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4345ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4346ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4347ccd284c7SBarry Smith 
43482ef1f0ffSBarry Smith    Options Database Key:
434911a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`
4350ccd284c7SBarry Smith 
43512ef1f0ffSBarry Smith   Level: beginner
43522ef1f0ffSBarry Smith 
435311a5261eSBarry Smith    Note:
435411a5261eSBarry Smith    Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when
4355ccd284c7SBarry Smith    enough exist.
4356ccd284c7SBarry Smith 
43571cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
4358ccd284c7SBarry Smith M*/
4359ccd284c7SBarry Smith 
4360ccd284c7SBarry Smith /*MC
4361ccd284c7SBarry Smith    MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.
4362ccd284c7SBarry Smith 
43632ef1f0ffSBarry Smith    Options Database Key:
43642ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`
43652ef1f0ffSBarry Smith 
43662ef1f0ffSBarry Smith   Level: beginner
43672ef1f0ffSBarry Smith 
43682ef1f0ffSBarry Smith    Note:
436911a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
437011a5261eSBarry Smith    and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
437111a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4372ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4373ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4374ccd284c7SBarry Smith 
.seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
4376ccd284c7SBarry Smith M*/
4377ccd284c7SBarry Smith 
43787906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
43797906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
43807906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
43817906f579SHong Zhang #endif
4382d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
4383d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4384d24d4204SJose E. Roman #endif
43857906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
43867906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
43877906f579SHong Zhang #endif
43887906f579SHong Zhang 
4389d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4390c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
43914222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
43927906f579SHong Zhang 
43938c778c55SBarry Smith /*@C
439411a5261eSBarry Smith   MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
43958c778c55SBarry Smith 
43968c778c55SBarry Smith   Not Collective
43978c778c55SBarry Smith 
43988c778c55SBarry Smith   Input Parameter:
4399fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44008c778c55SBarry Smith 
44018c778c55SBarry Smith   Output Parameter:
44028c778c55SBarry Smith . array - pointer to the data
44038c778c55SBarry Smith 
44048c778c55SBarry Smith   Level: intermediate
44058c778c55SBarry Smith 
4406fe59aa6dSJacob Faibussowitsch   Fortran Notes:
44070ab4885dSBarry Smith   `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()`
44080ab4885dSBarry Smith 
44091cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
44108c778c55SBarry Smith @*/
44115d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[])
4412d71ae5a4SJacob Faibussowitsch {
4413d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44148c778c55SBarry Smith 
44158c778c55SBarry Smith   PetscFunctionBegin;
4416d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
44179566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4418d67d9f35SJunchao Zhang   } else {
4419d67d9f35SJunchao Zhang     *array = aij->a;
4420d67d9f35SJunchao Zhang   }
44213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4422d67d9f35SJunchao Zhang }
4423d67d9f35SJunchao Zhang 
4424d67d9f35SJunchao Zhang /*@C
442511a5261eSBarry Smith   MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4426d67d9f35SJunchao Zhang 
4427d67d9f35SJunchao Zhang   Not Collective
4428d67d9f35SJunchao Zhang 
4429d67d9f35SJunchao Zhang   Input Parameters:
4430fe59aa6dSJacob Faibussowitsch + A     - a `MATSEQAIJ` matrix
4431d67d9f35SJunchao Zhang - array - pointer to the data
4432d67d9f35SJunchao Zhang 
4433d67d9f35SJunchao Zhang   Level: intermediate
4434d67d9f35SJunchao Zhang 
4435fe59aa6dSJacob Faibussowitsch   Fortran Notes:
44360ab4885dSBarry Smith   `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()`
44370ab4885dSBarry Smith 
44381cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()`
4439d67d9f35SJunchao Zhang @*/
44405d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[])
4441d71ae5a4SJacob Faibussowitsch {
4442d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4443d67d9f35SJunchao Zhang 
4444d67d9f35SJunchao Zhang   PetscFunctionBegin;
4445d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
44469566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4447d67d9f35SJunchao Zhang   } else {
4448d67d9f35SJunchao Zhang     *array = NULL;
4449d67d9f35SJunchao Zhang   }
44509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
44519566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
44523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44538c778c55SBarry Smith }
44548c778c55SBarry Smith 
445521e72a00SBarry Smith /*@C
445611a5261eSBarry Smith   MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
44578f1ea47aSStefano Zampini 
44580ab4885dSBarry Smith   Not Collective; No Fortran Support
44598f1ea47aSStefano Zampini 
44608f1ea47aSStefano Zampini   Input Parameter:
4461fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44628f1ea47aSStefano Zampini 
44638f1ea47aSStefano Zampini   Output Parameter:
44648f1ea47aSStefano Zampini . array - pointer to the data
44658f1ea47aSStefano Zampini 
44668f1ea47aSStefano Zampini   Level: intermediate
44678f1ea47aSStefano Zampini 
44681cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
44698f1ea47aSStefano Zampini @*/
44705d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[])
4471d71ae5a4SJacob Faibussowitsch {
4472d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44738f1ea47aSStefano Zampini 
44748f1ea47aSStefano Zampini   PetscFunctionBegin;
4475d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
44769566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4477d67d9f35SJunchao Zhang   } else {
4478d67d9f35SJunchao Zhang     *array = aij->a;
4479d67d9f35SJunchao Zhang   }
44803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44818f1ea47aSStefano Zampini }
44828f1ea47aSStefano Zampini 
44838f1ea47aSStefano Zampini /*@C
448411a5261eSBarry Smith   MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
44858f1ea47aSStefano Zampini 
44860ab4885dSBarry Smith   Not Collective; No Fortran Support
44878f1ea47aSStefano Zampini 
44888f1ea47aSStefano Zampini   Input Parameter:
4489fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44908f1ea47aSStefano Zampini 
44918f1ea47aSStefano Zampini   Output Parameter:
44928f1ea47aSStefano Zampini . array - pointer to the data
44938f1ea47aSStefano Zampini 
44948f1ea47aSStefano Zampini   Level: intermediate
44958f1ea47aSStefano Zampini 
44961cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
44978f1ea47aSStefano Zampini @*/
44985d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[])
4499d71ae5a4SJacob Faibussowitsch {
4500d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
45018f1ea47aSStefano Zampini 
45028f1ea47aSStefano Zampini   PetscFunctionBegin;
4503d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
45049566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4505d67d9f35SJunchao Zhang   } else {
4506d67d9f35SJunchao Zhang     *array = NULL;
4507d67d9f35SJunchao Zhang   }
45083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4509d67d9f35SJunchao Zhang }
4510d67d9f35SJunchao Zhang 
4511d67d9f35SJunchao Zhang /*@C
451211a5261eSBarry Smith   MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4513d67d9f35SJunchao Zhang 
45140ab4885dSBarry Smith   Not Collective; No Fortran Support
4515d67d9f35SJunchao Zhang 
4516d67d9f35SJunchao Zhang   Input Parameter:
4517fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
4518d67d9f35SJunchao Zhang 
4519d67d9f35SJunchao Zhang   Output Parameter:
4520d67d9f35SJunchao Zhang . array - pointer to the data
4521d67d9f35SJunchao Zhang 
4522d67d9f35SJunchao Zhang   Level: intermediate
4523d67d9f35SJunchao Zhang 
45241cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
4525d67d9f35SJunchao Zhang @*/
45265d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[])
4527d71ae5a4SJacob Faibussowitsch {
4528d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4529d67d9f35SJunchao Zhang 
4530d67d9f35SJunchao Zhang   PetscFunctionBegin;
4531d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
45329566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4533d67d9f35SJunchao Zhang   } else {
4534d67d9f35SJunchao Zhang     *array = aij->a;
4535d67d9f35SJunchao Zhang   }
45369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
45379566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
45383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4539d67d9f35SJunchao Zhang }
4540d67d9f35SJunchao Zhang 
4541d67d9f35SJunchao Zhang /*@C
4542d67d9f35SJunchao Zhang   MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead
4543d67d9f35SJunchao Zhang 
45440ab4885dSBarry Smith   Not Collective; No Fortran Support
4545d67d9f35SJunchao Zhang 
4546d67d9f35SJunchao Zhang   Input Parameter:
4547fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix
4548d67d9f35SJunchao Zhang 
4549d67d9f35SJunchao Zhang   Output Parameter:
4550d67d9f35SJunchao Zhang . array - pointer to the data
4551d67d9f35SJunchao Zhang 
4552d67d9f35SJunchao Zhang   Level: intermediate
4553d67d9f35SJunchao Zhang 
45541cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
4555d67d9f35SJunchao Zhang @*/
45565d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[])
4557d71ae5a4SJacob Faibussowitsch {
4558d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4559d67d9f35SJunchao Zhang 
4560d67d9f35SJunchao Zhang   PetscFunctionBegin;
4561d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
45629566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4563d67d9f35SJunchao Zhang   } else {
4564d67d9f35SJunchao Zhang     *array = NULL;
4565d67d9f35SJunchao Zhang   }
45663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45678f1ea47aSStefano Zampini }
45688f1ea47aSStefano Zampini 
45698f1ea47aSStefano Zampini /*@C
457011a5261eSBarry Smith   MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
45717ee59b9bSJunchao Zhang 
45720ab4885dSBarry Smith   Not Collective; No Fortran Support
45737ee59b9bSJunchao Zhang 
45747ee59b9bSJunchao Zhang   Input Parameter:
457511a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses
45767ee59b9bSJunchao Zhang 
45777ee59b9bSJunchao Zhang   Output Parameters:
45787ee59b9bSJunchao Zhang + i     - row map array of the matrix
45797ee59b9bSJunchao Zhang . j     - column index array of the matrix
45807ee59b9bSJunchao Zhang . a     - data array of the matrix
4581fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays
45827ee59b9bSJunchao Zhang 
4583fe59aa6dSJacob Faibussowitsch   Level: developer
45842ef1f0ffSBarry Smith 
45857ee59b9bSJunchao Zhang   Notes:
45862ef1f0ffSBarry Smith   Any of the output parameters can be `NULL`, in which case the corresponding value is not returned.
45877ee59b9bSJunchao Zhang   If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
45887ee59b9bSJunchao Zhang 
45897ee59b9bSJunchao Zhang   One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
45902ef1f0ffSBarry Smith   If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix.
45917ee59b9bSJunchao Zhang 
45921cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45937ee59b9bSJunchao Zhang @*/
45945d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype)
4595d71ae5a4SJacob Faibussowitsch {
45967ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
45977ee59b9bSJunchao Zhang 
45987ee59b9bSJunchao Zhang   PetscFunctionBegin;
45997ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
46007ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
46017ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
46027ee59b9bSJunchao Zhang   } else {
46037ee59b9bSJunchao Zhang     if (i) *i = aij->i;
46047ee59b9bSJunchao Zhang     if (j) *j = aij->j;
46057ee59b9bSJunchao Zhang     if (a) *a = aij->a;
46067ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
46077ee59b9bSJunchao Zhang   }
46083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
46097ee59b9bSJunchao Zhang }
46107ee59b9bSJunchao Zhang 
4611cc4c1da9SBarry Smith /*@
461221e72a00SBarry Smith   MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
461321e72a00SBarry Smith 
461421e72a00SBarry Smith   Not Collective
461521e72a00SBarry Smith 
461621e72a00SBarry Smith   Input Parameter:
4617fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
461821e72a00SBarry Smith 
461921e72a00SBarry Smith   Output Parameter:
462021e72a00SBarry Smith . nz - the maximum number of nonzeros in any row
462121e72a00SBarry Smith 
462221e72a00SBarry Smith   Level: intermediate
462321e72a00SBarry Smith 
46241cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
462521e72a00SBarry Smith @*/
4626d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4627d71ae5a4SJacob Faibussowitsch {
462821e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
462921e72a00SBarry Smith 
463021e72a00SBarry Smith   PetscFunctionBegin;
463121e72a00SBarry Smith   *nz = aij->rmax;
46323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
463321e72a00SBarry Smith }
463421e72a00SBarry Smith 
46352c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data)
46362c4ab24aSJunchao Zhang {
46372c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data;
46384d86920dSPierre Jolivet 
46392c4ab24aSJunchao Zhang   PetscFunctionBegin;
46402c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->perm));
46412c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->jmap));
46422c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo));
46432c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
46442c4ab24aSJunchao Zhang }
46452c4ab24aSJunchao Zhang 
4646d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4647d71ae5a4SJacob Faibussowitsch {
4648394ed5ebSJunchao Zhang   MPI_Comm             comm;
4649394ed5ebSJunchao Zhang   PetscInt            *i, *j;
46500d88f7f4SJunchao Zhang   PetscInt             M, N, row, iprev;
4651394ed5ebSJunchao Zhang   PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4652394ed5ebSJunchao Zhang   PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
4653394ed5ebSJunchao Zhang   PetscInt            *Aj;
4654394ed5ebSJunchao Zhang   PetscScalar         *Aa;
4655f4f49eeaSPierre Jolivet   Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)mat->data;
4656cbc6b225SStefano Zampini   MatType              rtype;
4657394ed5ebSJunchao Zhang   PetscCount          *perm, *jmap;
46582c4ab24aSJunchao Zhang   PetscContainer       container;
46592c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
46600d88f7f4SJunchao Zhang   PetscBool            isorted;
4661394ed5ebSJunchao Zhang 
4662394ed5ebSJunchao Zhang   PetscFunctionBegin;
46639566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
46649566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4665e8729f6fSJunchao Zhang   i = coo_i;
4666e8729f6fSJunchao Zhang   j = coo_j;
46679566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
46680d88f7f4SJunchao Zhang 
46690d88f7f4SJunchao Zhang   /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */
46700d88f7f4SJunchao Zhang   isorted = PETSC_TRUE;
46710d88f7f4SJunchao Zhang   iprev   = PETSC_INT_MIN;
46720d88f7f4SJunchao Zhang   for (k = 0; k < coo_n; k++) {
4673394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
46740d88f7f4SJunchao Zhang     if (isorted) {
46750d88f7f4SJunchao Zhang       if (i[k] < iprev) isorted = PETSC_FALSE;
46760d88f7f4SJunchao Zhang       else iprev = i[k];
46770d88f7f4SJunchao Zhang     }
4678394ed5ebSJunchao Zhang     perm[k] = k;
4679394ed5ebSJunchao Zhang   }
4680394ed5ebSJunchao Zhang 
46810d88f7f4SJunchao Zhang   /* Sort by row if not already */
46820d88f7f4SJunchao Zhang   if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
4683651b1cf9SStefano Zampini 
4684651b1cf9SStefano Zampini   /* Advance k to the first row with a non-negative index */
4685651b1cf9SStefano Zampini   for (k = 0; k < coo_n; k++)
46869371c9d4SSatish Balay     if (i[k] >= 0) break;
4687394ed5ebSJunchao Zhang   nneg = k;
46889566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4689394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
469035cb6cd3SPierre Jolivet   jmap++;                                           /* Inc jmap by 1 for convenience */
4691394ed5ebSJunchao Zhang 
46929566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(M + 1, &Ai));        /* CSR of A */
46939566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */
4694394ed5ebSJunchao Zhang 
4695651b1cf9SStefano Zampini   /* Support for HYPRE */
4696651b1cf9SStefano Zampini   PetscBool   hypre;
4697651b1cf9SStefano Zampini   const char *name;
4698651b1cf9SStefano Zampini   PetscCall(PetscObjectGetName((PetscObject)mat, &name));
4699651b1cf9SStefano Zampini   PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre));
4700651b1cf9SStefano Zampini 
4701394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
470235cb6cd3SPierre Jolivet   Ai++;  /* Inc by 1 for convenience */
4703394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4704394ed5ebSJunchao Zhang   while (k < coo_n) {
47050d88f7f4SJunchao Zhang     PetscBool strictly_sorted; // this row is strictly sorted?
47060d88f7f4SJunchao Zhang     PetscInt  jprev;
47070d88f7f4SJunchao Zhang 
47080d88f7f4SJunchao Zhang     /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */
4709394ed5ebSJunchao Zhang     row             = i[k];
47100d88f7f4SJunchao Zhang     start           = k;
47110d88f7f4SJunchao Zhang     jprev           = PETSC_INT_MIN;
47120d88f7f4SJunchao Zhang     strictly_sorted = PETSC_TRUE;
47130d88f7f4SJunchao Zhang     while (k < coo_n && i[k] == row) {
47140d88f7f4SJunchao Zhang       if (strictly_sorted) {
47150d88f7f4SJunchao Zhang         if (j[k] <= jprev) strictly_sorted = PETSC_FALSE;
47160d88f7f4SJunchao Zhang         else jprev = j[k];
47170d88f7f4SJunchao Zhang       }
47180d88f7f4SJunchao Zhang       k++;
47190d88f7f4SJunchao Zhang     }
4720394ed5ebSJunchao Zhang     end = k;
47210d88f7f4SJunchao Zhang 
4722651b1cf9SStefano Zampini     /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
4723651b1cf9SStefano Zampini     if (hypre) {
4724651b1cf9SStefano Zampini       PetscInt  minj    = PETSC_MAX_INT;
4725651b1cf9SStefano Zampini       PetscBool hasdiag = PETSC_FALSE;
47260d88f7f4SJunchao Zhang 
47270d88f7f4SJunchao Zhang       if (strictly_sorted) { // fast path to swap the first and the diag
47280d88f7f4SJunchao Zhang         PetscCount tmp;
47290d88f7f4SJunchao Zhang         for (p = start; p < end; p++) {
47300d88f7f4SJunchao Zhang           if (j[p] == row && p != start) {
47310d88f7f4SJunchao Zhang             j[p]        = j[start];
47320d88f7f4SJunchao Zhang             j[start]    = row;
47330d88f7f4SJunchao Zhang             tmp         = perm[start];
47340d88f7f4SJunchao Zhang             perm[start] = perm[p];
47350d88f7f4SJunchao Zhang             perm[p]     = tmp;
47360d88f7f4SJunchao Zhang             break;
47370d88f7f4SJunchao Zhang           }
47380d88f7f4SJunchao Zhang         }
47390d88f7f4SJunchao Zhang       } else {
4740651b1cf9SStefano Zampini         for (p = start; p < end; p++) {
4741651b1cf9SStefano Zampini           hasdiag = (PetscBool)(hasdiag || (j[p] == row));
4742651b1cf9SStefano Zampini           minj    = PetscMin(minj, j[p]);
4743651b1cf9SStefano Zampini         }
47440d88f7f4SJunchao Zhang 
4745651b1cf9SStefano Zampini         if (hasdiag) {
4746651b1cf9SStefano Zampini           for (p = start; p < end; p++) {
4747651b1cf9SStefano Zampini             if (j[p] == minj) j[p] = row;
4748651b1cf9SStefano Zampini             else if (j[p] == row) j[p] = minj;
4749651b1cf9SStefano Zampini           }
4750651b1cf9SStefano Zampini         }
4751651b1cf9SStefano Zampini       }
47520d88f7f4SJunchao Zhang     }
47530d88f7f4SJunchao Zhang     // sort by columns in a row
47540d88f7f4SJunchao Zhang     if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
4755651b1cf9SStefano Zampini 
47560d88f7f4SJunchao Zhang     if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q
47570d88f7f4SJunchao Zhang       for (p = start; p < end; p++, q++) {
47580d88f7f4SJunchao Zhang         Aj[q]   = j[p];
47590d88f7f4SJunchao Zhang         jmap[q] = 1;
47600d88f7f4SJunchao Zhang       }
47610d88f7f4SJunchao Zhang       Ai[row] = end - start;
47620d88f7f4SJunchao Zhang       nnz += Ai[row]; // q is already advanced
47630d88f7f4SJunchao Zhang     } else {
4764394ed5ebSJunchao Zhang       /* Find number of unique col entries in this row */
4765394ed5ebSJunchao Zhang       Aj[q]   = j[start]; /* Log the first nonzero in this row */
4766651b1cf9SStefano Zampini       jmap[q] = 1;        /* Number of repeats of this nonzero entry */
4767394ed5ebSJunchao Zhang       Ai[row] = 1;
4768394ed5ebSJunchao Zhang       nnz++;
4769394ed5ebSJunchao Zhang 
4770394ed5ebSJunchao Zhang       for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4771394ed5ebSJunchao Zhang         if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4772394ed5ebSJunchao Zhang           q++;
4773394ed5ebSJunchao Zhang           jmap[q] = 1;
4774394ed5ebSJunchao Zhang           Aj[q]   = j[p];
4775394ed5ebSJunchao Zhang           Ai[row]++;
4776394ed5ebSJunchao Zhang           nnz++;
4777394ed5ebSJunchao Zhang         } else {
4778394ed5ebSJunchao Zhang           jmap[q]++;
4779394ed5ebSJunchao Zhang         }
4780394ed5ebSJunchao Zhang       }
4781394ed5ebSJunchao Zhang       q++; /* Move to next row and thus next unique nonzero */
4782394ed5ebSJunchao Zhang     }
47830d88f7f4SJunchao Zhang   }
47840d88f7f4SJunchao Zhang 
4785394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4786394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
47870d88f7f4SJunchao Zhang   jmap--; // Back to the beginning of jmap[]
4788394ed5ebSJunchao Zhang   jmap[0] = 0;
4789394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
47900d88f7f4SJunchao Zhang 
4791394ed5ebSJunchao Zhang   if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */
4792394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4793394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4794394ed5ebSJunchao Zhang 
47959566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
47969566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
47979566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4798394ed5ebSJunchao Zhang     jmap = jmap_new;
4799394ed5ebSJunchao Zhang 
48009566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz, &Aj_new));
48019566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
48029566063dSJacob Faibussowitsch     PetscCall(PetscFree(Aj));
4803394ed5ebSJunchao Zhang     Aj = Aj_new;
4804394ed5ebSJunchao Zhang   }
4805394ed5ebSJunchao Zhang 
4806394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4807394ed5ebSJunchao Zhang     PetscCount *perm_new;
4808cbc6b225SStefano Zampini 
48099566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
48109566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
48119566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4812394ed5ebSJunchao Zhang     perm = perm_new;
4813394ed5ebSJunchao Zhang   }
4814394ed5ebSJunchao Zhang 
48159566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
48169566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */
48179566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4818394ed5ebSJunchao Zhang 
4819394ed5ebSJunchao Zhang   seqaij->singlemalloc = PETSC_FALSE;            /* Ai, Aj and Aa are not allocated in one big malloc */
4820394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
48212c4ab24aSJunchao Zhang 
48222c4ab24aSJunchao Zhang   // Put the COO struct in a container and then attach that to the matrix
48232c4ab24aSJunchao Zhang   PetscCall(PetscMalloc1(1, &coo));
48242c4ab24aSJunchao Zhang   coo->nz   = nnz;
48252c4ab24aSJunchao Zhang   coo->n    = coo_n;
48262c4ab24aSJunchao Zhang   coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
48272c4ab24aSJunchao Zhang   coo->jmap = jmap;         // of length nnz+1
48282c4ab24aSJunchao Zhang   coo->perm = perm;
48292c4ab24aSJunchao Zhang   PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container));
48302c4ab24aSJunchao Zhang   PetscCall(PetscContainerSetPointer(container, coo));
48312c4ab24aSJunchao Zhang   PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ));
48322c4ab24aSJunchao Zhang   PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container));
48332c4ab24aSJunchao Zhang   PetscCall(PetscContainerDestroy(&container));
48343ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4835394ed5ebSJunchao Zhang }
4836394ed5ebSJunchao Zhang 
4837d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4838d71ae5a4SJacob Faibussowitsch {
4839394ed5ebSJunchao Zhang   Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
4840394ed5ebSJunchao Zhang   PetscCount           i, j, Annz = aseq->nz;
48412c4ab24aSJunchao Zhang   PetscCount          *perm, *jmap;
4842394ed5ebSJunchao Zhang   PetscScalar         *Aa;
48432c4ab24aSJunchao Zhang   PetscContainer       container;
48442c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4845394ed5ebSJunchao Zhang 
4846394ed5ebSJunchao Zhang   PetscFunctionBegin;
48472c4ab24aSJunchao Zhang   PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
48482c4ab24aSJunchao Zhang   PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
48492c4ab24aSJunchao Zhang   PetscCall(PetscContainerGetPointer(container, (void **)&coo));
48502c4ab24aSJunchao Zhang   perm = coo->perm;
48512c4ab24aSJunchao Zhang   jmap = coo->jmap;
48529566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4853394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4854b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4855b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4856b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4857394ed5ebSJunchao Zhang   }
48589566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
48593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4860394ed5ebSJunchao Zhang }
4861394ed5ebSJunchao Zhang 
486234b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
48635063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *);
486402fe1965SBarry Smith #endif
4865d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4866d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *);
4867d5e393b6SSuyash Tandon #endif
48683d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
48695063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *);
48703d0639e7SStefano Zampini #endif
487102fe1965SBarry Smith 
4872d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4873d71ae5a4SJacob Faibussowitsch {
4874273d9f13SBarry Smith   Mat_SeqAIJ *b;
487538baddfdSBarry Smith   PetscMPIInt size;
4876273d9f13SBarry Smith 
4877273d9f13SBarry Smith   PetscFunctionBegin;
48789566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
487908401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4880273d9f13SBarry Smith 
48814dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
48822205254eSKarl Rupp 
4883b0a32e0cSBarry Smith   B->data   = (void *)b;
4884aea10558SJacob Faibussowitsch   B->ops[0] = MatOps_Values;
4885071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
48862205254eSKarl Rupp 
4887f4259b30SLisandro Dalcin   b->row                = NULL;
4888f4259b30SLisandro Dalcin   b->col                = NULL;
4889f4259b30SLisandro Dalcin   b->icol               = NULL;
4890b810aeb4SBarry Smith   b->reallocs           = 0;
489136db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4892f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4893416022c9SBarry Smith   b->nonew              = 0;
4894f4259b30SLisandro Dalcin   b->diag               = NULL;
4895f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4896f4259b30SLisandro Dalcin   B->spptr              = NULL;
4897f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4898f4259b30SLisandro Dalcin   b->idiag              = NULL;
4899f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4900f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
490171f1c65dSBarry Smith   b->omega              = 1.0;
490271f1c65dSBarry Smith   b->fshift             = 0.0;
490371f1c65dSBarry Smith   b->idiagvalid         = PETSC_FALSE;
4904bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4905a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
490617ab2063SBarry Smith 
49079566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4908d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
49099566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
49109566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4911b3866ffcSBarry Smith #endif
49129566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
49139566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
49149566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
49159566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
49169566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
49179566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
49189566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
49199779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
49209566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4921191b95cbSRichard Tran Mills #endif
492234b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
49239566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
49249566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49259566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
492602fe1965SBarry Smith #endif
4927d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4928d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
4929d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
4930d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
4931d5e393b6SSuyash Tandon #endif
49323d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
49339566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
49343d0639e7SStefano Zampini #endif
49359566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4936af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
49379566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4938af8000cdSHong Zhang #endif
4939d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
49409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4941d24d4204SJose E. Roman #endif
494263c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
49439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
49449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
494563c07aadSStefano Zampini #endif
49469566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
49479566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
49489566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
49499566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
495014e4dea2SJose E. Roman   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ));
49519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
49529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
49539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
49549566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
49559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
49569566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
49579566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49589566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
49599566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
49609566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
49619566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
49629566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
49639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
49643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
496517ab2063SBarry Smith }
496617ab2063SBarry Smith 
4967b24902e0SBarry Smith /*
49683893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4969b24902e0SBarry Smith */
4970d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4971d71ae5a4SJacob Faibussowitsch {
49722a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4973071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
497417ab2063SBarry Smith 
49753a40ed3dSBarry Smith   PetscFunctionBegin;
4976aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4977273d9f13SBarry Smith 
4978d5f3da31SBarry Smith   C->factortype    = A->factortype;
4979f4259b30SLisandro Dalcin   c->row           = NULL;
4980f4259b30SLisandro Dalcin   c->col           = NULL;
4981f4259b30SLisandro Dalcin   c->icol          = NULL;
49826ad4291fSHong Zhang   c->reallocs      = 0;
4983bc43efbbSJunchao Zhang   c->diagonaldense = a->diagonaldense;
498417ab2063SBarry Smith 
498569272f91SPierre Jolivet   C->assembled = A->assembled;
498617ab2063SBarry Smith 
498769272f91SPierre Jolivet   if (A->preallocated) {
49889566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
49899566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4990eec197d1SBarry Smith 
499131fe6a7dSBarry Smith     if (!A->hash_active) {
49929566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->imax));
49939566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
49949566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->ilen));
49959566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));
499617ab2063SBarry Smith 
499717ab2063SBarry Smith       /* allocate the matrix space */
4998f77e22a1SHong Zhang       if (mallocmatspace) {
49999566063dSJacob Faibussowitsch         PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i));
50002205254eSKarl Rupp 
5001f1e2ffcdSBarry Smith         c->singlemalloc = PETSC_TRUE;
50022205254eSKarl Rupp 
50039566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->i, a->i, m + 1));
500417ab2063SBarry Smith         if (m > 0) {
50059566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
5006be6bf707SBarry Smith           if (cpvalues == MAT_COPY_VALUES) {
50072e5835c6SStefano Zampini             const PetscScalar *aa;
50082e5835c6SStefano Zampini 
50099566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
50109566063dSJacob Faibussowitsch             PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
50119566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
5012be6bf707SBarry Smith           } else {
50139566063dSJacob Faibussowitsch             PetscCall(PetscArrayzero(c->a, a->i[m]));
501417ab2063SBarry Smith           }
501508480c60SBarry Smith         }
5016f77e22a1SHong Zhang       }
501731fe6a7dSBarry Smith       C->preallocated = PETSC_TRUE;
501831fe6a7dSBarry Smith     } else {
501931fe6a7dSBarry Smith       PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix");
502031fe6a7dSBarry Smith       PetscCall(MatSetUp(C));
502131fe6a7dSBarry Smith     }
502217ab2063SBarry Smith 
50236ad4291fSHong Zhang     c->ignorezeroentries = a->ignorezeroentries;
5024416022c9SBarry Smith     c->roworiented       = a->roworiented;
5025416022c9SBarry Smith     c->nonew             = a->nonew;
5026416022c9SBarry Smith     if (a->diag) {
50279566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &c->diag));
50289566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt)));
5029071fcb05SBarry Smith     } else c->diag = NULL;
50302205254eSKarl Rupp 
5031f4259b30SLisandro Dalcin     c->solve_work         = NULL;
5032f4259b30SLisandro Dalcin     c->saved_values       = NULL;
5033f4259b30SLisandro Dalcin     c->idiag              = NULL;
5034f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
5035a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
5036e6b907acSBarry Smith     c->free_a             = PETSC_TRUE;
5037e6b907acSBarry Smith     c->free_ij            = PETSC_TRUE;
50386ad4291fSHong Zhang 
5039893ad86cSHong Zhang     c->rmax  = a->rmax;
5040416022c9SBarry Smith     c->nz    = a->nz;
50418ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
5042754ec7b1SSatish Balay 
50436ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
50446ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
5045cd6b891eSBarry Smith     if (a->compressedrow.use) {
50466ad4291fSHong Zhang       i = a->compressedrow.nrows;
50479566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
50489566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
50499566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
505027ea64f8SHong Zhang     } else {
505127ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
50520298fd71SBarry Smith       c->compressedrow.i      = NULL;
50530298fd71SBarry Smith       c->compressedrow.rindex = NULL;
50546ad4291fSHong Zhang     }
5055ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
5056e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
50574846f1f5SKris Buschelman 
50589566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
505969272f91SPierre Jolivet   }
50609566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
50613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
506217ab2063SBarry Smith }
506317ab2063SBarry Smith 
5064d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
5065d71ae5a4SJacob Faibussowitsch {
5066b24902e0SBarry Smith   PetscFunctionBegin;
50679566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
50689566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
506948a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
50709566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
50719566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
50723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5073b24902e0SBarry Smith }
5074b24902e0SBarry Smith 
5075d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
5076d71ae5a4SJacob Faibussowitsch {
507752f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
507852f91c60SVaclav Hapla 
507952f91c60SVaclav Hapla   PetscFunctionBegin;
508052f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
508152f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
5082c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
50839566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
50849566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
50859566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
508652f91c60SVaclav Hapla   if (isbinary) {
50879566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
508852f91c60SVaclav Hapla   } else if (ishdf5) {
508952f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
50909566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
509152f91c60SVaclav Hapla #else
509252f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
509352f91c60SVaclav Hapla #endif
509452f91c60SVaclav Hapla   } else {
509598921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
509652f91c60SVaclav Hapla   }
50973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
509852f91c60SVaclav Hapla }
509952f91c60SVaclav Hapla 
5100d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
5101d71ae5a4SJacob Faibussowitsch {
51023ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
51033ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
5104fbdbba38SShri Abhyankar 
5105fbdbba38SShri Abhyankar   PetscFunctionBegin;
51069566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
5107bbead8a2SBarry Smith 
51083ea6fe3dSLisandro Dalcin   /* read in matrix header */
51099566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
511008401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
51119371c9d4SSatish Balay   M  = header[1];
51129371c9d4SSatish Balay   N  = header[2];
51139371c9d4SSatish Balay   nz = header[3];
511408401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
511508401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
511608401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
5117fbdbba38SShri Abhyankar 
51183ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
51199566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
51203ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
51213ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
51223ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
51233ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
51243ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
51259566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
51269566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
51273ea6fe3dSLisandro Dalcin 
51283ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
51299566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5130aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51313ea6fe3dSLisandro Dalcin 
5132fbdbba38SShri Abhyankar   /* read in row lengths */
51339566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
51349566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
51353ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
51369371c9d4SSatish Balay   sum = 0;
51379371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
513808401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
51393ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
51409566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
51419566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5142aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51433ea6fe3dSLisandro Dalcin   /* store row lengths */
51449566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
51459566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
5146fbdbba38SShri Abhyankar 
51473ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
51489371c9d4SSatish Balay   a->i[0] = 0;
51499371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
51503ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
51519566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
51523ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
51539566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
5154fbdbba38SShri Abhyankar 
51559566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
51569566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
51573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5158fbdbba38SShri Abhyankar }
5159fbdbba38SShri Abhyankar 
5160d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
5161d71ae5a4SJacob Faibussowitsch {
51627264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
5163fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
5164eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5165eeffb40dSHong Zhang   PetscInt k;
5166eeffb40dSHong Zhang #endif
51677264ac53SSatish Balay 
51683a40ed3dSBarry Smith   PetscFunctionBegin;
5169bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
5170d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
5171ca44d042SBarry Smith     *flg = PETSC_FALSE;
51723ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
5173bcd2baecSBarry Smith   }
51747264ac53SSatish Balay 
51757264ac53SSatish Balay   /* if the a->i are the same */
51769566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
51773ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
51787264ac53SSatish Balay 
51797264ac53SSatish Balay   /* if a->j are the same */
51809566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
51813ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
5182bcd2baecSBarry Smith 
51839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
51849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5185bcd2baecSBarry Smith   /* if a->a are the same */
5186eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5187eeffb40dSHong Zhang   for (k = 0; k < a->nz; k++) {
5188fff043a9SJunchao Zhang     if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) {
5189eeffb40dSHong Zhang       *flg = PETSC_FALSE;
51903ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
5191eeffb40dSHong Zhang     }
5192eeffb40dSHong Zhang   }
5193eeffb40dSHong Zhang #else
51949566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
5195eeffb40dSHong Zhang #endif
51969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
51979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
51983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51997264ac53SSatish Balay }
520036db0b34SBarry Smith 
520105869f15SSatish Balay /*@
520211a5261eSBarry Smith   MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
520336db0b34SBarry Smith   provided by the user.
520436db0b34SBarry Smith 
5205d083f849SBarry Smith   Collective
520636db0b34SBarry Smith 
520736db0b34SBarry Smith   Input Parameters:
520836db0b34SBarry Smith + comm - must be an MPI communicator of size 1
520936db0b34SBarry Smith . m    - number of rows
521036db0b34SBarry Smith . n    - number of columns
5211483a2f95SBarry Smith . i    - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
521236db0b34SBarry Smith . j    - column indices
521336db0b34SBarry Smith - a    - matrix values
521436db0b34SBarry Smith 
521536db0b34SBarry Smith   Output Parameter:
521636db0b34SBarry Smith . mat - the matrix
521736db0b34SBarry Smith 
521836db0b34SBarry Smith   Level: intermediate
521936db0b34SBarry Smith 
522036db0b34SBarry Smith   Notes:
52212ef1f0ffSBarry Smith   The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
5222292fb18eSBarry Smith   once the matrix is destroyed and not before
522336db0b34SBarry Smith 
522436db0b34SBarry Smith   You cannot set new nonzero locations into this matrix, that will generate an error.
522536db0b34SBarry Smith 
52262ef1f0ffSBarry Smith   The `i` and `j` indices are 0 based
522736db0b34SBarry Smith 
5228a4552177SSatish Balay   The format which is used for the sparse matrix input, is equivalent to a
5229a4552177SSatish Balay   row-major ordering.. i.e for the following matrix, the input data expected is
52308eef79e4SBarry Smith   as shown
52312ef1f0ffSBarry Smith .vb
52322ef1f0ffSBarry Smith         1 0 0
52332ef1f0ffSBarry Smith         2 0 3
52342ef1f0ffSBarry Smith         4 5 6
5235a4552177SSatish Balay 
52362ef1f0ffSBarry Smith         i =  {0,1,3,6}  [size = nrow+1  = 3+1]
52372ef1f0ffSBarry Smith         j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
52382ef1f0ffSBarry Smith         v =  {1,2,3,4,5,6}  [size = 6]
52392ef1f0ffSBarry Smith .ve
5240a4552177SSatish Balay 
52411cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
524236db0b34SBarry Smith @*/
5243d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5244d71ae5a4SJacob Faibussowitsch {
5245cbcfb4deSHong Zhang   PetscInt    ii;
524636db0b34SBarry Smith   Mat_SeqAIJ *aij;
5247cbcfb4deSHong Zhang   PetscInt    jj;
524836db0b34SBarry Smith 
524936db0b34SBarry Smith   PetscFunctionBegin;
5250aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
52519566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52529566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52539566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
52549566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52559566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5256ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
52579566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
52589566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5259ab93d7beSBarry Smith 
526036db0b34SBarry Smith   aij->i            = i;
526136db0b34SBarry Smith   aij->j            = j;
526236db0b34SBarry Smith   aij->a            = a;
526336db0b34SBarry Smith   aij->singlemalloc = PETSC_FALSE;
526436db0b34SBarry Smith   aij->nonew        = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5265e6b907acSBarry Smith   aij->free_a       = PETSC_FALSE;
5266e6b907acSBarry Smith   aij->free_ij      = PETSC_FALSE;
526736db0b34SBarry Smith 
5268cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
526936db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
527076bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5271aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
52729985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
527308401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
527408401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
52759985e31cSBarry Smith       }
527636db0b34SBarry Smith     }
527776bd3646SJed Brown   }
527876bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
527936db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
528008401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5281da0802e2SStefano Zampini       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1);
528236db0b34SBarry Smith     }
528376bd3646SJed Brown   }
528436db0b34SBarry Smith 
52859566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52869566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
528836db0b34SBarry Smith }
5289cbc6b225SStefano Zampini 
5290f62e3866SBarry Smith /*@
529111a5261eSBarry Smith   MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
52928a0b0e6bSVictor Minden   provided by the user.
52938a0b0e6bSVictor Minden 
5294d083f849SBarry Smith   Collective
52958a0b0e6bSVictor Minden 
52968a0b0e6bSVictor Minden   Input Parameters:
52978a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1
52988a0b0e6bSVictor Minden . m    - number of rows
52998a0b0e6bSVictor Minden . n    - number of columns
53008a0b0e6bSVictor Minden . i    - row indices
53018a0b0e6bSVictor Minden . j    - column indices
53021230e6d1SVictor Minden . a    - matrix values
53031230e6d1SVictor Minden . nz   - number of nonzeros
53042ef1f0ffSBarry Smith - idx  - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
53058a0b0e6bSVictor Minden 
53068a0b0e6bSVictor Minden   Output Parameter:
53078a0b0e6bSVictor Minden . mat - the matrix
53088a0b0e6bSVictor Minden 
53098a0b0e6bSVictor Minden   Level: intermediate
53108a0b0e6bSVictor Minden 
5311f62e3866SBarry Smith   Example:
5312f62e3866SBarry Smith   For the following matrix, the input data expected is as shown (using 0 based indexing)
53139e99939fSJunchao Zhang .vb
53148a0b0e6bSVictor Minden         1 0 0
53158a0b0e6bSVictor Minden         2 0 3
53168a0b0e6bSVictor Minden         4 5 6
53178a0b0e6bSVictor Minden 
53188a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
53198a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
53208a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
53219e99939fSJunchao Zhang .ve
5322fe59aa6dSJacob Faibussowitsch 
53232ef1f0ffSBarry Smith   Note:
5324d7547e51SJunchao Zhang   Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5325d7547e51SJunchao Zhang   and are particularly useful in iterative applications.
53268a0b0e6bSVictor Minden 
53271cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
53288a0b0e6bSVictor Minden @*/
5329d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx)
5330d71ae5a4SJacob Faibussowitsch {
5331d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
53328a0b0e6bSVictor Minden 
53338a0b0e6bSVictor Minden   PetscFunctionBegin;
53349566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5335ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
53369566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
53379566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
53389566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
53399566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
53401230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
53411230e6d1SVictor Minden     if (idx) {
53421230e6d1SVictor Minden       row = i[ii] - 1;
53431230e6d1SVictor Minden       col = j[ii] - 1;
53441230e6d1SVictor Minden     } else {
53451230e6d1SVictor Minden       row = i[ii];
53461230e6d1SVictor Minden       col = j[ii];
53478a0b0e6bSVictor Minden     }
53489566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
53498a0b0e6bSVictor Minden   }
53509566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
53519566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
53529566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
53533ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53548a0b0e6bSVictor Minden }
535536db0b34SBarry Smith 
5356d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A)
5357d71ae5a4SJacob Faibussowitsch {
5358acf2f550SJed Brown   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
5359acf2f550SJed Brown 
5360acf2f550SJed Brown   PetscFunctionBegin;
5361acf2f550SJed Brown   a->idiagvalid  = PETSC_FALSE;
5362acf2f550SJed Brown   a->ibdiagvalid = PETSC_FALSE;
53632205254eSKarl Rupp 
53649566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A));
53653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5366acf2f550SJed Brown }
5367acf2f550SJed Brown 
5368d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
5369d71ae5a4SJacob Faibussowitsch {
53709c8f2541SHong Zhang   PetscFunctionBegin;
53719566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
53723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53739c8f2541SHong Zhang }
53749c8f2541SHong Zhang 
537581824310SBarry Smith /*
537653dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
537753dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
537853dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
537953dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
538053dd7562SDmitry Karpeev  */
5381d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5382d71ae5a4SJacob Faibussowitsch {
538353dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
538453dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
538553dd7562SDmitry Karpeev   PetscBool       seqaij;
538653dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
538753dd7562SDmitry Karpeev   PetscScalar     v;
538853dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
538953dd7562SDmitry Karpeev 
539053dd7562SDmitry Karpeev   PetscFunctionBegin;
53913ba16761SJacob Faibussowitsch   if (!B) PetscFunctionReturn(PETSC_SUCCESS);
539253dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
53939566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
539428b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
539553dd7562SDmitry Karpeev   if (rowemb) {
53969566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
539708401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
539853dd7562SDmitry Karpeev   } else {
539908401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
540053dd7562SDmitry Karpeev   }
540153dd7562SDmitry Karpeev   if (colemb) {
54029566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
540308401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
540453dd7562SDmitry Karpeev   } else {
540508401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
540653dd7562SDmitry Karpeev   }
540753dd7562SDmitry Karpeev 
5408f4f49eeaSPierre Jolivet   Baij = (Mat_SeqAIJ *)B->data;
540953dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
54109566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5411ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
54129566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
54139566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
541453dd7562SDmitry Karpeev   }
541548a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
541653dd7562SDmitry Karpeev   count      = 0;
541753dd7562SDmitry Karpeev   rowindices = NULL;
541853dd7562SDmitry Karpeev   colindices = NULL;
541948a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
542048a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
542153dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
542253dd7562SDmitry Karpeev     PetscInt row;
542353dd7562SDmitry Karpeev     row = i;
542453dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
542553dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
542653dd7562SDmitry Karpeev       PetscInt col;
542753dd7562SDmitry Karpeev       col = Baij->j[count];
542853dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
542953dd7562SDmitry Karpeev       v = Baij->a[count];
54309566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
543153dd7562SDmitry Karpeev       ++count;
543253dd7562SDmitry Karpeev     }
543353dd7562SDmitry Karpeev   }
543453dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
543553dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
543653dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
543753dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
543853dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
54393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
544053dd7562SDmitry Karpeev }
544153dd7562SDmitry Karpeev 
544258c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep)
5443dec0b466SHong Zhang {
5444dec0b466SHong Zhang   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
5445dec0b466SHong Zhang   MatScalar  *aa = a->a;
5446dec0b466SHong Zhang   PetscInt    m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k;
5447dec0b466SHong Zhang   PetscInt   *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0;
5448dec0b466SHong Zhang 
5449dec0b466SHong Zhang   PetscFunctionBegin;
5450dec0b466SHong Zhang   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix");
5451dec0b466SHong Zhang   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
5452dec0b466SHong Zhang   for (i = 1; i <= m; i++) {
5453dec0b466SHong Zhang     /* move each nonzero entry back by the amount of zero slots (fshift) before it*/
5454dec0b466SHong Zhang     for (k = ai[i - 1]; k < ai[i]; k++) {
545558c11ad4SPierre Jolivet       if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++;
5456dec0b466SHong Zhang       else {
5457dec0b466SHong Zhang         if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1));
5458dec0b466SHong Zhang         aa[k - fshift] = aa[k];
5459dec0b466SHong Zhang         aj[k - fshift] = aj[k];
5460dec0b466SHong Zhang       }
5461dec0b466SHong Zhang     }
5462dec0b466SHong Zhang     ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration
5463dec0b466SHong Zhang     fshift_prev = fshift;
5464dec0b466SHong Zhang     /* reset ilen and imax for each row */
5465dec0b466SHong Zhang     ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1];
5466dec0b466SHong Zhang     a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0);
5467dec0b466SHong Zhang     rmax = PetscMax(rmax, ailen[i - 1]);
5468dec0b466SHong Zhang   }
5469312eded4SPierre Jolivet   if (fshift) {
5470dec0b466SHong Zhang     if (m) {
5471dec0b466SHong Zhang       ai[m] -= fshift;
5472dec0b466SHong Zhang       a->nz = ai[m];
5473dec0b466SHong Zhang     }
5474dec0b466SHong Zhang     PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz));
5475312eded4SPierre Jolivet     A->nonzerostate++;
5476dec0b466SHong Zhang     A->info.nz_unneeded += (PetscReal)fshift;
5477dec0b466SHong Zhang     a->rmax = rmax;
5478dec0b466SHong Zhang     if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A));
5479dec0b466SHong Zhang     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
5480dec0b466SHong Zhang     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
5481312eded4SPierre Jolivet   }
54823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5483dec0b466SHong Zhang }
5484dec0b466SHong Zhang 
54854099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
54864099cc6bSBarry Smith 
5487cc4c1da9SBarry Smith /*@
548811a5261eSBarry Smith   MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
54894099cc6bSBarry Smith 
5490c3339decSBarry Smith   Collective
54914099cc6bSBarry Smith 
54924099cc6bSBarry Smith   Input Parameters:
54934099cc6bSBarry Smith + mat    - the matrix object
54944099cc6bSBarry Smith - matype - matrix type
54954099cc6bSBarry Smith 
54964099cc6bSBarry Smith   Options Database Key:
54974e187271SRichard Tran Mills . -mat_seqaij_type  <method> - for example seqaijcrl
54984099cc6bSBarry Smith 
54994099cc6bSBarry Smith   Level: intermediate
55004099cc6bSBarry Smith 
5501fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`
55024099cc6bSBarry Smith @*/
5503d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5504d71ae5a4SJacob Faibussowitsch {
55054099cc6bSBarry Smith   PetscBool sametype;
55065f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
55074099cc6bSBarry Smith 
55084099cc6bSBarry Smith   PetscFunctionBegin;
55094099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
55109566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
55113ba16761SJacob Faibussowitsch   if (sametype) PetscFunctionReturn(PETSC_SUCCESS);
55124099cc6bSBarry Smith 
55139566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
55146adde796SStefano Zampini   PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
55159566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
55163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55174099cc6bSBarry Smith }
55184099cc6bSBarry Smith 
55194099cc6bSBarry Smith /*@C
552011a5261eSBarry Smith   MatSeqAIJRegister -  - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices
55214099cc6bSBarry Smith 
5522cc4c1da9SBarry Smith   Not Collective, No Fortran Support
55234099cc6bSBarry Smith 
55244099cc6bSBarry Smith   Input Parameters:
5525fe59aa6dSJacob Faibussowitsch + sname    - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
55264099cc6bSBarry Smith - function - routine to convert to subtype
55274099cc6bSBarry Smith 
55282ef1f0ffSBarry Smith   Level: advanced
55292ef1f0ffSBarry Smith 
55304099cc6bSBarry Smith   Notes:
553111a5261eSBarry Smith   `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers.
55324099cc6bSBarry Smith 
55334099cc6bSBarry Smith   Then, your matrix can be chosen with the procedural interface at runtime via the option
55344099cc6bSBarry Smith $     -mat_seqaij_type my_mat
55354099cc6bSBarry Smith 
55361cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()`
55374099cc6bSBarry Smith @*/
5538d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
5539d71ae5a4SJacob Faibussowitsch {
55404099cc6bSBarry Smith   PetscFunctionBegin;
55419566063dSJacob Faibussowitsch   PetscCall(MatInitializePackage());
55429566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
55433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55444099cc6bSBarry Smith }
55454099cc6bSBarry Smith 
55464099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
55474099cc6bSBarry Smith 
55484099cc6bSBarry Smith /*@C
554911a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
55504099cc6bSBarry Smith 
55514099cc6bSBarry Smith   Not Collective
55524099cc6bSBarry Smith 
55534099cc6bSBarry Smith   Level: advanced
55544099cc6bSBarry Smith 
55552ef1f0ffSBarry Smith   Note:
55562ef1f0ffSBarry Smith   This registers the versions of `MATSEQAIJ` for GPUs
55572ef1f0ffSBarry Smith 
55581cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()`
55594099cc6bSBarry Smith @*/
5560d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5561d71ae5a4SJacob Faibussowitsch {
55624099cc6bSBarry Smith   PetscFunctionBegin;
55633ba16761SJacob Faibussowitsch   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS);
55644099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
55654099cc6bSBarry Smith 
55669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
55679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
55689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
55699779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
55709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5571485f9817SRichard Tran Mills #endif
55725063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
55739566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
55745063d097SStefano Zampini #endif
5575d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
5576d5e393b6SSuyash Tandon   PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
5577d5e393b6SSuyash Tandon #endif
55785063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
55799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
55805063d097SStefano Zampini #endif
55814099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
55829566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
55834099cc6bSBarry Smith #endif
55843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55854099cc6bSBarry Smith }
558653dd7562SDmitry Karpeev 
/*
    Special version of MatSetValues for SeqAIJ matrices that is called directly from Fortran
*/
#if defined(PETSC_HAVE_FORTRAN_CAPS)
  #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
#elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
  #define matsetvaluesseqaij_ matsetvaluesseqaij
#endif

/*
   The Fortran entry point below returns void and reports failure through its _ierr argument, so the
   error macros are redefined here to store the error code in *_ierr and then return without a value.
*/

/* Identical to PetscCallVoid, except it assigns to *_ierr */
#undef PetscCall
#define PetscCall(...) \
  do { \
    PetscErrorCode ierr_msv_seqaij = __VA_ARGS__; \
    if (PetscUnlikely(ierr_msv_seqaij)) { \
      *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_seqaij, PETSC_ERROR_REPEAT, " "); \
      return; \
    } \
  } while (0)

/* Raises a new error: records it in *_ierr and leaves the enclosing void function */
#undef SETERRQ
#define SETERRQ(comm, ierr, ...) \
  do { \
    *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
    return; \
  } while (0)
561681824310SBarry Smith 
5617d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5618d71ae5a4SJacob Faibussowitsch {
561981824310SBarry Smith   Mat         A = *AA;
562081824310SBarry Smith   PetscInt    m = *mm, n = *nn;
562181824310SBarry Smith   InsertMode  is = *isis;
562281824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
562381824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
562481824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
562581824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
562654f21887SBarry Smith   MatScalar  *ap, value, *aa;
5627ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5628ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
562981824310SBarry Smith 
563081824310SBarry Smith   PetscFunctionBegin;
56314994cf47SJed Brown   MatCheckPreallocated(A, 1);
563281824310SBarry Smith   imax  = a->imax;
563381824310SBarry Smith   ai    = a->i;
563481824310SBarry Smith   ailen = a->ilen;
563581824310SBarry Smith   aj    = a->j;
563681824310SBarry Smith   aa    = a->a;
563781824310SBarry Smith 
563881824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
563981824310SBarry Smith     row = im[k];
564081824310SBarry Smith     if (row < 0) continue;
56415f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
56429371c9d4SSatish Balay     rp   = aj + ai[row];
56439371c9d4SSatish Balay     ap   = aa + ai[row];
56449371c9d4SSatish Balay     rmax = imax[row];
56459371c9d4SSatish Balay     nrow = ailen[row];
564681824310SBarry Smith     low  = 0;
564781824310SBarry Smith     high = nrow;
564881824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
564981824310SBarry Smith       if (in[l] < 0) continue;
56505f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
565181824310SBarry Smith       col = in[l];
56522205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
56532205254eSKarl Rupp       else value = v[k + l * m];
56542205254eSKarl Rupp 
565581824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
565681824310SBarry Smith 
56572205254eSKarl Rupp       if (col <= lastcol) low = 0;
56582205254eSKarl Rupp       else high = nrow;
565981824310SBarry Smith       lastcol = col;
566081824310SBarry Smith       while (high - low > 5) {
566181824310SBarry Smith         t = (low + high) / 2;
566281824310SBarry Smith         if (rp[t] > col) high = t;
566381824310SBarry Smith         else low = t;
566481824310SBarry Smith       }
566581824310SBarry Smith       for (i = low; i < high; i++) {
566681824310SBarry Smith         if (rp[i] > col) break;
566781824310SBarry Smith         if (rp[i] == col) {
566881824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
566981824310SBarry Smith           else ap[i] = value;
567081824310SBarry Smith           goto noinsert;
567181824310SBarry Smith         }
567281824310SBarry Smith       }
567381824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
567481824310SBarry Smith       if (nonew == 1) goto noinsert;
56755f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5676fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
56779371c9d4SSatish Balay       N = nrow++ - 1;
56789371c9d4SSatish Balay       a->nz++;
56799371c9d4SSatish Balay       high++;
568081824310SBarry Smith       /* shift up all the later entries in this row */
568181824310SBarry Smith       for (ii = N; ii >= i; ii--) {
568281824310SBarry Smith         rp[ii + 1] = rp[ii];
568381824310SBarry Smith         ap[ii + 1] = ap[ii];
568481824310SBarry Smith       }
568581824310SBarry Smith       rp[i] = col;
568681824310SBarry Smith       ap[i] = value;
568781824310SBarry Smith     noinsert:;
568881824310SBarry Smith       low = i + 1;
568981824310SBarry Smith     }
569081824310SBarry Smith     ailen[row] = nrow;
569181824310SBarry Smith   }
569281824310SBarry Smith   PetscFunctionReturnVoid();
569381824310SBarry Smith }
569498921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No
569598921bdaSJacob Faibussowitsch  * other PETSc functions should be defined past this point, as it is impossible to recover the
569698921bdaSJacob Faibussowitsch  * original definitions */
56979566063dSJacob Faibussowitsch #undef PetscCall
569898921bdaSJacob Faibussowitsch #undef SETERRQ
5699