xref: /petsc/src/mat/impls/aij/seq/aij.c (revision e3c720941f06ea1a5bfc20f190bf798d81831d82)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
1226cec326SBarry Smith #define TYPE AIJ
1326cec326SBarry Smith #define TYPE_BS
1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
1626cec326SBarry Smith #undef TYPE
1726cec326SBarry Smith #undef TYPE_BS
1826cec326SBarry Smith 
19d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
20d71ae5a4SJacob Faibussowitsch {
214099cc6bSBarry Smith   PetscBool flg;
224099cc6bSBarry Smith   char      type[256];
234099cc6bSBarry Smith 
244099cc6bSBarry Smith   PetscFunctionBegin;
25d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
269566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
279566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
28d0609cedSBarry Smith   PetscOptionsEnd();
293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
304099cc6bSBarry Smith }
314099cc6bSBarry Smith 
32d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
33d71ae5a4SJacob Faibussowitsch {
340716a85fSBarry Smith   PetscInt    i, m, n;
350716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
360716a85fSBarry Smith 
370716a85fSBarry Smith   PetscFunctionBegin;
389566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
399566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
400716a85fSBarry Smith   if (type == NORM_2) {
41ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
420716a85fSBarry Smith   } else if (type == NORM_1) {
43ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
440716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
45ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
46857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
47ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
48857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
49ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
506adde796SStefano Zampini   } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type");
510716a85fSBarry Smith 
520716a85fSBarry Smith   if (type == NORM_2) {
53a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
54857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
55a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
560716a85fSBarry Smith   }
573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
580716a85fSBarry Smith }
590716a85fSBarry Smith 
60d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
61d71ae5a4SJacob Faibussowitsch {
623a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
633a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
643a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
653a062f41SBarry Smith   PetscInt       *rows;
663a062f41SBarry Smith 
673a062f41SBarry Smith   PetscFunctionBegin;
683a062f41SBarry Smith   for (i = 0; i < m; i++) {
69ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
703a062f41SBarry Smith   }
719566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
723a062f41SBarry Smith   cnt = 0;
733a062f41SBarry Smith   for (i = 0; i < m; i++) {
743a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
753a062f41SBarry Smith       rows[cnt] = i;
763a062f41SBarry Smith       cnt++;
773a062f41SBarry Smith     }
783a062f41SBarry Smith   }
799566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
813a062f41SBarry Smith }
823a062f41SBarry Smith 
83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
84d71ae5a4SJacob Faibussowitsch {
856ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
86fff043a9SJunchao Zhang   const MatScalar *aa;
876ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
88b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
896ce1633cSBarry Smith   PetscInt        *rows;
906ce1633cSBarry Smith 
916ce1633cSBarry Smith   PetscFunctionBegin;
929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
939566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
946ce1633cSBarry Smith   diag = a->diag;
956ce1633cSBarry Smith   for (i = 0; i < m; i++) {
96ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
976ce1633cSBarry Smith   }
989566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
996ce1633cSBarry Smith   cnt = 0;
1006ce1633cSBarry Smith   for (i = 0; i < m; i++) {
101ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
1026ce1633cSBarry Smith   }
103f1f41ecbSJed Brown   *nrows = cnt;
104f1f41ecbSJed Brown   *zrows = rows;
1059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
107f1f41ecbSJed Brown }
108f1f41ecbSJed Brown 
109d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
110d71ae5a4SJacob Faibussowitsch {
111f1f41ecbSJed Brown   PetscInt nrows, *rows;
112f1f41ecbSJed Brown 
113f1f41ecbSJed Brown   PetscFunctionBegin;
1140298fd71SBarry Smith   *zrows = NULL;
1159566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1169566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1186ce1633cSBarry Smith }
1196ce1633cSBarry Smith 
120d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
121d71ae5a4SJacob Faibussowitsch {
122b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
123b3a44c85SBarry Smith   const MatScalar *aa;
124b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
125b3a44c85SBarry Smith   const PetscInt  *ii;
126b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
127b3a44c85SBarry Smith 
128b3a44c85SBarry Smith   PetscFunctionBegin;
1299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
130f4259b30SLisandro Dalcin   *keptrows = NULL;
131b3a44c85SBarry Smith   ii        = a->i;
132b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
133b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
134b3a44c85SBarry Smith     if (!n) {
135b3a44c85SBarry Smith       cnt++;
136b3a44c85SBarry Smith       goto ok1;
137b3a44c85SBarry Smith     }
1382e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
139b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
140b3a44c85SBarry Smith     }
141b3a44c85SBarry Smith     cnt++;
142b3a44c85SBarry Smith   ok1:;
143b3a44c85SBarry Smith   }
1442e5835c6SStefano Zampini   if (!cnt) {
1459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1463ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1472e5835c6SStefano Zampini   }
1489566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
149b3a44c85SBarry Smith   cnt = 0;
150b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
151b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
152b3a44c85SBarry Smith     if (!n) continue;
1532e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
154b3a44c85SBarry Smith       if (aa[j] != 0.0) {
155b3a44c85SBarry Smith         rows[cnt++] = i;
156b3a44c85SBarry Smith         break;
157b3a44c85SBarry Smith       }
158b3a44c85SBarry Smith     }
159b3a44c85SBarry Smith   }
1609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1619566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
1623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
163b3a44c85SBarry Smith }
164b3a44c85SBarry Smith 
165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
166d71ae5a4SJacob Faibussowitsch {
16779299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)Y->data;
16899e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16999e65526SBarry Smith   const PetscInt    *diag;
1702e5835c6SStefano Zampini   MatScalar         *aa;
17199e65526SBarry Smith   const PetscScalar *v;
172ace3abfcSBarry Smith   PetscBool          missing;
17379299369SBarry Smith 
17479299369SBarry Smith   PetscFunctionBegin;
17509f38230SBarry Smith   if (Y->assembled) {
1769566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL));
17709f38230SBarry Smith     if (!missing) {
17879299369SBarry Smith       diag = aij->diag;
1799566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1809566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
18179299369SBarry Smith       if (is == INSERT_VALUES) {
182ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
18379299369SBarry Smith       } else {
184ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
18579299369SBarry Smith       }
1869566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1879566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
1883ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
18979299369SBarry Smith     }
1909566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
19109f38230SBarry Smith   }
1929566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
1933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
19409f38230SBarry Smith }
19579299369SBarry Smith 
196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
197d71ae5a4SJacob Faibussowitsch {
198416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19997f1f81fSBarry Smith   PetscInt    i, ishift;
20017ab2063SBarry Smith 
2013a40ed3dSBarry Smith   PetscFunctionBegin;
202f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
2033ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
204bfeeae90SHong Zhang   ishift = 0;
205b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
2069566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
207bfeeae90SHong Zhang   } else if (oshift == 1) {
2081a83f524SJed Brown     PetscInt *tia;
209d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2103b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2119566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2121a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2131a83f524SJed Brown     *ia = tia;
214ecc77c7aSBarry Smith     if (ja) {
2151a83f524SJed Brown       PetscInt *tja;
2169566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2171a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2181a83f524SJed Brown       *ja = tja;
219ecc77c7aSBarry Smith     }
2206945ee14SBarry Smith   } else {
221ecc77c7aSBarry Smith     *ia = a->i;
222ecc77c7aSBarry Smith     if (ja) *ja = a->j;
223a2ce50c7SBarry Smith   }
2243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225a2744918SBarry Smith }
226a2744918SBarry Smith 
227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
228d71ae5a4SJacob Faibussowitsch {
2293a40ed3dSBarry Smith   PetscFunctionBegin;
2303ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
231b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2329566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2339566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
234bcd2baecSBarry Smith   }
2353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23617ab2063SBarry Smith }
23717ab2063SBarry Smith 
238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
239d71ae5a4SJacob Faibussowitsch {
2403b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
241d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
24297f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2433b2fbd54SBarry Smith 
2443a40ed3dSBarry Smith   PetscFunctionBegin;
245899cda47SBarry Smith   *nn = n;
2463ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2473b2fbd54SBarry Smith   if (symmetric) {
2489566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2493b2fbd54SBarry Smith   } else {
2509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2533b2fbd54SBarry Smith     jj = a->j;
254ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2553b2fbd54SBarry Smith     cia[0] = oshift;
256ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2579566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2583b2fbd54SBarry Smith     jj = a->j;
259a93ec695SBarry Smith     for (row = 0; row < m; row++) {
260a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
261a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
262bfeeae90SHong Zhang         col = *jj++;
2632205254eSKarl Rupp 
2643b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2653b2fbd54SBarry Smith       }
2663b2fbd54SBarry Smith     }
2679566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2689371c9d4SSatish Balay     *ia = cia;
2699371c9d4SSatish Balay     *ja = cja;
2703b2fbd54SBarry Smith   }
2713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2723b2fbd54SBarry Smith }
2733b2fbd54SBarry Smith 
274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
275d71ae5a4SJacob Faibussowitsch {
2763a40ed3dSBarry Smith   PetscFunctionBegin;
2773ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2783b2fbd54SBarry Smith 
2799566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2809566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2823b2fbd54SBarry Smith }
2833b2fbd54SBarry Smith 
2847cee066cSHong Zhang /*
2857cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2867cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
287040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2887cee066cSHong Zhang */
289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
290d71ae5a4SJacob Faibussowitsch {
2917cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2927cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
293071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2947cee066cSHong Zhang   PetscInt       *cspidx;
295071fcb05SBarry Smith   const PetscInt *jj;
2967cee066cSHong Zhang 
2977cee066cSHong Zhang   PetscFunctionBegin;
2987cee066cSHong Zhang   *nn = n;
2993ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
300625f6d37SHong Zhang 
3019566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
3029566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
3039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
3049566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
3057cee066cSHong Zhang   jj = a->j;
306ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
3077cee066cSHong Zhang   cia[0] = oshift;
308ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3099566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3107cee066cSHong Zhang   jj = a->j;
3117cee066cSHong Zhang   for (row = 0; row < m; row++) {
3127cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3137cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3147cee066cSHong Zhang       col         = *jj++;
315071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
316071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
317071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3187cee066cSHong Zhang     }
3197cee066cSHong Zhang   }
3209566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
321071fcb05SBarry Smith   *ia    = cia;
322071fcb05SBarry Smith   *ja    = cja;
3237cee066cSHong Zhang   *spidx = cspidx;
3243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3257cee066cSHong Zhang }
3267cee066cSHong Zhang 
327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
328d71ae5a4SJacob Faibussowitsch {
3297cee066cSHong Zhang   PetscFunctionBegin;
3309566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3319566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3337cee066cSHong Zhang }
3347cee066cSHong Zhang 
335d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
336d71ae5a4SJacob Faibussowitsch {
33787d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33887d4246cSBarry Smith   PetscInt    *ai = a->i;
339fff043a9SJunchao Zhang   PetscScalar *aa;
34087d4246cSBarry Smith 
34187d4246cSBarry Smith   PetscFunctionBegin;
3429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3439566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34687d4246cSBarry Smith }
34787d4246cSBarry Smith 
348bd04181cSBarry Smith /*
349bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
350bd04181cSBarry Smith 
351bd04181cSBarry Smith       -   a single row of values is set with each call
352bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
353bd04181cSBarry Smith       -   the values are always added to the matrix, not set
354bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
355bd04181cSBarry Smith 
3561f763a69SBarry Smith      This does NOT assume the global column indices are sorted
357bd04181cSBarry Smith 
3581f763a69SBarry Smith */
359bd04181cSBarry Smith 
360af0996ceSBarry Smith #include <petsc/private/isimpl.h>
361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
362d71ae5a4SJacob Faibussowitsch {
363189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3641f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3651f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3661f763a69SBarry Smith   PetscInt        lastcol = -1;
367fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
368189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
369189e4007SBarry Smith 
370fff043a9SJunchao Zhang   PetscFunctionBegin;
3719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
372f38dd0b8SBarry Smith   row  = ridx[im[0]];
3731f763a69SBarry Smith   rp   = aj + ai[row];
3741f763a69SBarry Smith   ap   = aa + ai[row];
3751f763a69SBarry Smith   nrow = ailen[row];
376189e4007SBarry Smith   low  = 0;
377189e4007SBarry Smith   high = nrow;
378189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
379189e4007SBarry Smith     col   = cidx[in[l]];
380f38dd0b8SBarry Smith     value = v[l];
381189e4007SBarry Smith 
382189e4007SBarry Smith     if (col <= lastcol) low = 0;
383189e4007SBarry Smith     else high = nrow;
384189e4007SBarry Smith     lastcol = col;
385189e4007SBarry Smith     while (high - low > 5) {
386189e4007SBarry Smith       t = (low + high) / 2;
387189e4007SBarry Smith       if (rp[t] > col) high = t;
388189e4007SBarry Smith       else low = t;
389189e4007SBarry Smith     }
390189e4007SBarry Smith     for (i = low; i < high; i++) {
391189e4007SBarry Smith       if (rp[i] == col) {
3921f763a69SBarry Smith         ap[i] += value;
393189e4007SBarry Smith         low = i + 1;
3941f763a69SBarry Smith         break;
395189e4007SBarry Smith       }
396189e4007SBarry Smith     }
397189e4007SBarry Smith   }
3989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3993ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
400189e4007SBarry Smith }
401189e4007SBarry Smith 
/*
   MatSetValues_SeqAIJ - Inserts or adds an m-by-n block of values into rows im[] and columns in[]
   of a SeqAIJ matrix.

   Negative row or column indices are skipped. A row index >= A->rmap->n or a column index
   >= A->cmap->n raises PETSC_ERR_ARG_OUTOFRANGE.

   v is read as v[l + k*n] when a->roworiented is set and as v[k + l*m] otherwise; when v is NULL
   (or A->structure_only is set) `value` is not updated and keeps its initial 0.0.

   A location already present in the row is overwritten, or accumulated for ADD_VALUES. A location
   that is not present is inserted at the index where the search stopped, unless a->nonew == 1
   (silently dropped) or a->nonew == -1 (error). Each insertion increments a->nz and
   A->nonzerostate; the row length a->ilen[row] is written back after the row is processed.
*/
402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
403d71ae5a4SJacob Faibussowitsch {
404416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
405e2ee6c50SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
40697f1f81fSBarry Smith   PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
407e2ee6c50SBarry Smith   PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1;
408ce496241SStefano Zampini   MatScalar  *ap = NULL, value = 0.0, *aa;
409ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
410ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
41117ab2063SBarry Smith 
4123a40ed3dSBarry Smith   PetscFunctionBegin;
4139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
41417ab2063SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
415416022c9SBarry Smith     row = im[k];
4165ef9f2a5SBarry Smith     if (row < 0) continue;
4176bdcaf15SBarry Smith     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
/* rp/ap point at the column indices / values of this row; ap stays NULL for structure-only matrices */
418720833daSHong Zhang     rp = aj + ai[row];
419876c6284SHong Zhang     if (!A->structure_only) ap = aa + ai[row];
/* rmax is the space reserved for the row (imax), nrow the number of entries currently used (ilen) */
4209371c9d4SSatish Balay     rmax = imax[row];
4219371c9d4SSatish Balay     nrow = ailen[row];
422416022c9SBarry Smith     low  = 0;
423c71e6ed7SBarry Smith     high = nrow;
42417ab2063SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
4255ef9f2a5SBarry Smith       if (in[l] < 0) continue;
4266bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
427bfeeae90SHong Zhang       col = in[l];
428071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
/* with ignorezeroentries, adding an off-diagonal zero is a no-op and is skipped before any search */
429071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
43036db0b34SBarry Smith 
/* keep the lower bound from the previous column while columns increase; otherwise restart from the row start */
4312205254eSKarl Rupp       if (col <= lastcol) low = 0;
4322205254eSKarl Rupp       else high = nrow;
433e2ee6c50SBarry Smith       lastcol = col;
/* bisection until at most 5 candidates remain, followed by a linear scan of [low, high) */
434416022c9SBarry Smith       while (high - low > 5) {
435416022c9SBarry Smith         t = (low + high) / 2;
436416022c9SBarry Smith         if (rp[t] > col) high = t;
437416022c9SBarry Smith         else low = t;
43817ab2063SBarry Smith       }
439416022c9SBarry Smith       for (i = low; i < high; i++) {
/* leaving the scan here keeps i at the insertion position for a new entry */
44017ab2063SBarry Smith         if (rp[i] > col) break;
44117ab2063SBarry Smith         if (rp[i] == col) {
442876c6284SHong Zhang           if (!A->structure_only) {
4430c0d7e18SFande Kong             if (is == ADD_VALUES) {
4440c0d7e18SFande Kong               ap[i] += value;
4450c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4469371c9d4SSatish Balay             } else ap[i] = value;
447720833daSHong Zhang           }
448e44c0bd4SBarry Smith           low = i + 1;
44917ab2063SBarry Smith           goto noinsert;
45017ab2063SBarry Smith         }
45117ab2063SBarry Smith       }
/* the location does not exist yet: decide whether a new nonzero may be created */
452dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
453c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
45408401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
/* NOTE(review): the reallocation macros are defined outside this file section; presumably they enlarge the storage when nrow has reached rmax and refresh the local pointers passed to them - confirm in aij.h */
455720833daSHong Zhang       if (A->structure_only) {
456876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
457720833daSHong Zhang       } else {
458fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
459720833daSHong Zhang       }
/* N is the index of the last entry in use before the insertion; nrow then counts the new entry */
4609371c9d4SSatish Balay       N = nrow++ - 1;
4619371c9d4SSatish Balay       a->nz++;
4629371c9d4SSatish Balay       high++;
463416022c9SBarry Smith       /* shift up all the later entries in this row */
4649566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
46517ab2063SBarry Smith       rp[i] = col;
466580bdb30SBarry Smith       if (!A->structure_only) {
4679566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
468580bdb30SBarry Smith         ap[i] = value;
469580bdb30SBarry Smith       }
470416022c9SBarry Smith       low = i + 1;
/* the nonzero pattern changed */
471e56f5c9eSBarry Smith       A->nonzerostate++;
472e44c0bd4SBarry Smith     noinsert:;
47317ab2063SBarry Smith     }
47417ab2063SBarry Smith     ailen[row] = nrow;
47517ab2063SBarry Smith   }
4769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
4773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
47817ab2063SBarry Smith }
47917ab2063SBarry Smith 
480d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
481d71ae5a4SJacob Faibussowitsch {
48219b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
48319b08ed1SBarry Smith   PetscInt   *rp, k, row;
48419b08ed1SBarry Smith   PetscInt   *ai = a->i;
48519b08ed1SBarry Smith   PetscInt   *aj = a->j;
486fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
48719b08ed1SBarry Smith 
48819b08ed1SBarry Smith   PetscFunctionBegin;
48928b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
49008401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
491fff043a9SJunchao Zhang 
4929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
49319b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
49419b08ed1SBarry Smith     row = im[k];
49519b08ed1SBarry Smith     rp  = aj + ai[row];
49619b08ed1SBarry Smith     ap  = aa + ai[row];
49719b08ed1SBarry Smith 
4989566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
49919b08ed1SBarry Smith     if (!A->structure_only) {
50019b08ed1SBarry Smith       if (v) {
5019566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
50219b08ed1SBarry Smith         v += n;
50319b08ed1SBarry Smith       } else {
5049566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
50519b08ed1SBarry Smith       }
50619b08ed1SBarry Smith     }
50719b08ed1SBarry Smith     a->ilen[row]  = n;
50819b08ed1SBarry Smith     a->imax[row]  = n;
50919b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
51019b08ed1SBarry Smith     a->nz += n;
51119b08ed1SBarry Smith   }
5129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51419b08ed1SBarry Smith }
51519b08ed1SBarry Smith 
51619b08ed1SBarry Smith /*@
51719b08ed1SBarry Smith     MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51819b08ed1SBarry Smith 
51919b08ed1SBarry Smith   Input Parameters:
52011a5261eSBarry Smith +  A - the `MATSEQAIJ` matrix
52119b08ed1SBarry Smith -  nztotal - bound on the number of nonzeros
52219b08ed1SBarry Smith 
52319b08ed1SBarry Smith   Level: advanced
52419b08ed1SBarry Smith 
52519b08ed1SBarry Smith   Notes:
52619b08ed1SBarry Smith     This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
52711a5261eSBarry Smith     Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52819b08ed1SBarry Smith     as always with multiple matrix assemblies.
52919b08ed1SBarry Smith 
5301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
53119b08ed1SBarry Smith @*/
53219b08ed1SBarry Smith 
533d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
534d71ae5a4SJacob Faibussowitsch {
53519b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
53619b08ed1SBarry Smith 
53719b08ed1SBarry Smith   PetscFunctionBegin;
5389566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5399566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
54019b08ed1SBarry Smith   a->maxnz = nztotal;
5414dfa11a4SJacob Faibussowitsch   if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); }
54219b08ed1SBarry Smith   if (!a->ilen) {
5439566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
54419b08ed1SBarry Smith   } else {
5459566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
54619b08ed1SBarry Smith   }
54719b08ed1SBarry Smith 
54819b08ed1SBarry Smith   /* allocate the matrix space */
54919b08ed1SBarry Smith   if (A->structure_only) {
5509566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nztotal, &a->j));
5519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i));
55219b08ed1SBarry Smith   } else {
5539566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i));
55419b08ed1SBarry Smith   }
55519b08ed1SBarry Smith   a->i[0] = 0;
55619b08ed1SBarry Smith   if (A->structure_only) {
55719b08ed1SBarry Smith     a->singlemalloc = PETSC_FALSE;
55819b08ed1SBarry Smith     a->free_a       = PETSC_FALSE;
55919b08ed1SBarry Smith   } else {
56019b08ed1SBarry Smith     a->singlemalloc = PETSC_TRUE;
56119b08ed1SBarry Smith     a->free_a       = PETSC_TRUE;
56219b08ed1SBarry Smith   }
56319b08ed1SBarry Smith   a->free_ij        = PETSC_TRUE;
56419b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
56519b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
5663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
56719b08ed1SBarry Smith }
56819b08ed1SBarry Smith 
569d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
570d71ae5a4SJacob Faibussowitsch {
571071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
572071fcb05SBarry Smith   PetscInt   *rp, k, row;
573071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
574071fcb05SBarry Smith   PetscInt   *aj = a->j;
575fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
576071fcb05SBarry Smith 
577071fcb05SBarry Smith   PetscFunctionBegin;
5789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
579071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
580071fcb05SBarry Smith     row = im[k];
5816bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
582071fcb05SBarry Smith     rp = aj + ai[row];
583071fcb05SBarry Smith     ap = aa + ai[row];
58448a46eb9SPierre Jolivet     if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
585071fcb05SBarry Smith     if (!A->structure_only) {
586071fcb05SBarry Smith       if (v) {
5879566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
588071fcb05SBarry Smith         v += n;
589071fcb05SBarry Smith       } else {
5909566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
591071fcb05SBarry Smith       }
592071fcb05SBarry Smith     }
593071fcb05SBarry Smith     ailen[row] = n;
594071fcb05SBarry Smith     a->nz += n;
595071fcb05SBarry Smith   }
5969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
598071fcb05SBarry Smith }
599071fcb05SBarry Smith 
600d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
601d71ae5a4SJacob Faibussowitsch {
6027eb43aa7SLois Curfman McInnes   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
60397f1f81fSBarry Smith   PetscInt        *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
60497f1f81fSBarry Smith   PetscInt        *ai = a->i, *ailen = a->ilen;
6054e208921SJed Brown   const MatScalar *ap, *aa;
6067eb43aa7SLois Curfman McInnes 
6073a40ed3dSBarry Smith   PetscFunctionBegin;
6084e208921SJed Brown   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
6097eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6107eb43aa7SLois Curfman McInnes     row = im[k];
6119371c9d4SSatish Balay     if (row < 0) {
6129371c9d4SSatish Balay       v += n;
6139371c9d4SSatish Balay       continue;
6149371c9d4SSatish Balay     } /* negative row */
61554c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6169371c9d4SSatish Balay     rp   = aj + ai[row];
6179371c9d4SSatish Balay     ap   = aa + ai[row];
6187eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6197eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6209371c9d4SSatish Balay       if (in[l] < 0) {
6219371c9d4SSatish Balay         v++;
6229371c9d4SSatish Balay         continue;
6239371c9d4SSatish Balay       } /* negative column */
62454c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
625bfeeae90SHong Zhang       col  = in[l];
6269371c9d4SSatish Balay       high = nrow;
6279371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6287eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6297eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6307eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6317eb43aa7SLois Curfman McInnes         else low = t;
6327eb43aa7SLois Curfman McInnes       }
6337eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6347eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6357eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
636b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6377eb43aa7SLois Curfman McInnes           goto finished;
6387eb43aa7SLois Curfman McInnes         }
6397eb43aa7SLois Curfman McInnes       }
64097e567efSBarry Smith       *v++ = 0.0;
6417eb43aa7SLois Curfman McInnes     finished:;
6427eb43aa7SLois Curfman McInnes     }
6437eb43aa7SLois Curfman McInnes   }
6444e208921SJed Brown   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
6453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6467eb43aa7SLois Curfman McInnes }
6477eb43aa7SLois Curfman McInnes 
648d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
649d71ae5a4SJacob Faibussowitsch {
6503ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
651c898d852SStefano Zampini   const PetscScalar *av;
6523ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6533ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
65417ab2063SBarry Smith 
6553a40ed3dSBarry Smith   PetscFunctionBegin;
6569566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6572205254eSKarl Rupp 
6583ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6593ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6603ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6613ea6fe3dSLisandro Dalcin   nz = A->nz;
662416022c9SBarry Smith 
6633ea6fe3dSLisandro Dalcin   /* write matrix header */
6643ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6659371c9d4SSatish Balay   header[1] = M;
6669371c9d4SSatish Balay   header[2] = N;
6679371c9d4SSatish Balay   header[3] = nz;
6689566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
669416022c9SBarry Smith 
6703ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6719566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6723ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
6739566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6749566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6753ea6fe3dSLisandro Dalcin   /* store column indices */
6769566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
677416022c9SBarry Smith   /* store nonzero values */
6789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6799566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
681b37d52dbSMark F. Adams 
6823ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6839566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
68517ab2063SBarry Smith }
686416022c9SBarry Smith 
687d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
688d71ae5a4SJacob Faibussowitsch {
6897dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6907dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6917dc0baabSHong Zhang 
6927dc0baabSHong Zhang   PetscFunctionBegin;
6939566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6947dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6959566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
69648a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6979566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6987dc0baabSHong Zhang   }
6999566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
7003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
7017dc0baabSHong Zhang }
7027dc0baabSHong Zhang 
70309573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer);
704cd155464SBarry Smith 
705d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
706d71ae5a4SJacob Faibussowitsch {
707416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
708c898d852SStefano Zampini   const PetscScalar *av;
70960e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
710e060cb09SBarry Smith   const char        *name;
711f3ef73ceSBarry Smith   PetscViewerFormat  format;
71217ab2063SBarry Smith 
7133a40ed3dSBarry Smith   PetscFunctionBegin;
7147dc0baabSHong Zhang   if (A->structure_only) {
7159566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7163ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
7177dc0baabSHong Zhang   }
71843e49210SHong Zhang 
7199566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
7203ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
7212e5835c6SStefano Zampini 
722c898d852SStefano Zampini   /* trigger copy to CPU if needed */
7239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
72571c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
72697f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
72760e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
728c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
729d00d2cf4SBarry Smith       nofinalvalue = 1;
730d00d2cf4SBarry Smith     }
7319566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7329566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7339566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
734fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7359566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
736fbfe6fa7SJed Brown #else
7379566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
738fbfe6fa7SJed Brown #endif
7399566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
74017ab2063SBarry Smith 
74117ab2063SBarry Smith     for (i = 0; i < m; i++) {
74260e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
743aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7449566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
74517ab2063SBarry Smith #else
7469566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
74717ab2063SBarry Smith #endif
74817ab2063SBarry Smith       }
74917ab2063SBarry Smith     }
750d00d2cf4SBarry Smith     if (nofinalvalue) {
751c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7529566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
753c337ccceSJed Brown #else
7549566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
755c337ccceSJed Brown #endif
756d00d2cf4SBarry Smith     }
7579566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7589566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7599566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
760fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
7619566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
76244cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7639566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
76460e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
765aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
76636db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7679566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76836db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7699566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
77036db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7719566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7726831982aSBarry Smith         }
77344cd7ae7SLois Curfman McInnes #else
7749566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
77544cd7ae7SLois Curfman McInnes #endif
77644cd7ae7SLois Curfman McInnes       }
7779566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77844cd7ae7SLois Curfman McInnes     }
7799566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
780fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
78197f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7829566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7839566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
784496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
785496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
78660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
787496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
788aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78936db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
790496be53dSLois Curfman McInnes #else
791496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
792496be53dSLois Curfman McInnes #endif
793496be53dSLois Curfman McInnes         }
794496be53dSLois Curfman McInnes       }
795496be53dSLois Curfman McInnes     }
7962e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7979566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
7982e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7992205254eSKarl Rupp       if (i + 4 < m) {
8009566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
8012205254eSKarl Rupp       } else if (i + 3 < m) {
8029566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
8032205254eSKarl Rupp       } else if (i + 2 < m) {
8049566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
8052205254eSKarl Rupp       } else if (i + 1 < m) {
8069566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
8072205254eSKarl Rupp       } else if (i < m) {
8089566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8092205254eSKarl Rupp       } else {
8109566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8112205254eSKarl Rupp       }
812496be53dSLois Curfman McInnes     }
8139566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8149566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
815496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8179566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
818496be53dSLois Curfman McInnes       }
8199566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
820496be53dSLois Curfman McInnes     }
8219566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
822496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
82360e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
824496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
825aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
82648a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
827496be53dSLois Curfman McInnes #else
8289566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
829496be53dSLois Curfman McInnes #endif
830496be53dSLois Curfman McInnes         }
831496be53dSLois Curfman McInnes       }
8329566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
833496be53dSLois Curfman McInnes     }
8349566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
835fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
83697f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
83787828ca2SBarry Smith     PetscScalar value;
83868f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83968f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
84068f1ed48SBarry Smith 
84168f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
84268f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
84368f1ed48SBarry Smith         realonly = PETSC_FALSE;
84468f1ed48SBarry Smith         break;
84568f1ed48SBarry Smith       }
84668f1ed48SBarry Smith     }
84768f1ed48SBarry Smith #endif
84802594712SBarry Smith 
8499566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
85002594712SBarry Smith     for (i = 0; i < m; i++) {
85102594712SBarry Smith       jcnt = 0;
852d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
853e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
85402594712SBarry Smith           value = a->a[cnt++];
855e24b481bSBarry Smith           jcnt++;
85602594712SBarry Smith         } else {
85702594712SBarry Smith           value = 0.0;
85802594712SBarry Smith         }
859aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
86068f1ed48SBarry Smith         if (realonly) {
8619566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
86268f1ed48SBarry Smith         } else {
8639566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
86468f1ed48SBarry Smith         }
86502594712SBarry Smith #else
8669566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
86702594712SBarry Smith #endif
86802594712SBarry Smith       }
8699566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
87002594712SBarry Smith     }
8719566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8723c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
873150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8749566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8769566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8773c215bfdSMatthew Knepley #else
8789566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8793c215bfdSMatthew Knepley #endif
8809566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8813c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
88260e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8833c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8849566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8853c215bfdSMatthew Knepley #else
8869566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8873c215bfdSMatthew Knepley #endif
8883c215bfdSMatthew Knepley       }
8893c215bfdSMatthew Knepley     }
8909566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8913a40ed3dSBarry Smith   } else {
8929566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
893d5f3da31SBarry Smith     if (A->factortype) {
89416cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8959566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
89616cd7e1dSShri Abhyankar         /* L part */
89760e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
89916cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9009566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
90116cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9029566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
90316cd7e1dSShri Abhyankar           } else {
9049566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
90516cd7e1dSShri Abhyankar           }
90616cd7e1dSShri Abhyankar #else
9079566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90816cd7e1dSShri Abhyankar #endif
90916cd7e1dSShri Abhyankar         }
91016cd7e1dSShri Abhyankar         /* diagonal */
91116cd7e1dSShri Abhyankar         j = a->diag[i];
91216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
91316cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
9149566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j])));
91516cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9169566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j]))));
91716cd7e1dSShri Abhyankar         } else {
9189566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j])));
91916cd7e1dSShri Abhyankar         }
92016cd7e1dSShri Abhyankar #else
9219566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j])));
92216cd7e1dSShri Abhyankar #endif
92316cd7e1dSShri Abhyankar 
92416cd7e1dSShri Abhyankar         /* U part */
92560e0710aSBarry Smith         for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
92616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
92716cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9289566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
92916cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9309566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
93116cd7e1dSShri Abhyankar           } else {
9329566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
93316cd7e1dSShri Abhyankar           }
93416cd7e1dSShri Abhyankar #else
9359566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
93616cd7e1dSShri Abhyankar #endif
93716cd7e1dSShri Abhyankar         }
9389566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
93916cd7e1dSShri Abhyankar       }
94016cd7e1dSShri Abhyankar     } else {
94117ab2063SBarry Smith       for (i = 0; i < m; i++) {
9429566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
94360e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
944aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
94536db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9469566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
94736db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9489566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9493a40ed3dSBarry Smith           } else {
9509566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
95117ab2063SBarry Smith           }
95217ab2063SBarry Smith #else
9539566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
95417ab2063SBarry Smith #endif
95517ab2063SBarry Smith         }
9569566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
95717ab2063SBarry Smith       }
95816cd7e1dSShri Abhyankar     }
9599566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
96017ab2063SBarry Smith   }
9619566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
963416022c9SBarry Smith }
964416022c9SBarry Smith 
9659804daf3SBarry Smith #include <petscdraw.h>
966d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
967d71ae5a4SJacob Faibussowitsch {
968480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
969416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
970383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
971383922c3SLisandro Dalcin   int                color;
972b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
973b0a32e0cSBarry Smith   PetscViewer        viewer;
974f3ef73ceSBarry Smith   PetscViewerFormat  format;
975fff043a9SJunchao Zhang   const PetscScalar *aa;
976cddf8d76SBarry Smith 
9773a40ed3dSBarry Smith   PetscFunctionBegin;
9789566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9799566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9809566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
981383922c3SLisandro Dalcin 
982416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
984fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
985d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9860513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
987b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
988416022c9SBarry Smith     for (i = 0; i < m; i++) {
9899371c9d4SSatish Balay       y_l = m - i - 1.0;
9909371c9d4SSatish Balay       y_r = y_l + 1.0;
991bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9929371c9d4SSatish Balay         x_l = a->j[j];
9939371c9d4SSatish Balay         x_r = x_l + 1.0;
994fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9959566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
996cddf8d76SBarry Smith       }
997cddf8d76SBarry Smith     }
998b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
999cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10009371c9d4SSatish Balay       y_l = m - i - 1.0;
10019371c9d4SSatish Balay       y_r = y_l + 1.0;
1002bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10039371c9d4SSatish Balay         x_l = a->j[j];
10049371c9d4SSatish Balay         x_r = x_l + 1.0;
1005fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
10069566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1007cddf8d76SBarry Smith       }
1008cddf8d76SBarry Smith     }
1009b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1010cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10119371c9d4SSatish Balay       y_l = m - i - 1.0;
10129371c9d4SSatish Balay       y_r = y_l + 1.0;
1013bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10149371c9d4SSatish Balay         x_l = a->j[j];
10159371c9d4SSatish Balay         x_r = x_l + 1.0;
1016fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10179566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1018416022c9SBarry Smith       }
1019416022c9SBarry Smith     }
1020d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10210513a670SBarry Smith   } else {
10220513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10230513a670SBarry Smith     /* first determine max of all nonzero values */
1024b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1025383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1026b0a32e0cSBarry Smith     PetscDraw popup;
10270513a670SBarry Smith 
10280513a670SBarry Smith     for (i = 0; i < nz; i++) {
1029fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10300513a670SBarry Smith     }
1031383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10329566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10339566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1034383922c3SLisandro Dalcin 
1035d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10360513a670SBarry Smith     for (i = 0; i < m; i++) {
1037383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1038383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1039bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1040383922c3SLisandro Dalcin         x_l   = a->j[j];
1041383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1042fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10439566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10440513a670SBarry Smith         count++;
10450513a670SBarry Smith       }
10460513a670SBarry Smith     }
1047d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10480513a670SBarry Smith   }
10499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
10503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1051480ef9eaSBarry Smith }
1052cddf8d76SBarry Smith 
10539804daf3SBarry Smith #include <petscdraw.h>
1054d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1055d71ae5a4SJacob Faibussowitsch {
1056b0a32e0cSBarry Smith   PetscDraw draw;
105736db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1058ace3abfcSBarry Smith   PetscBool isnull;
1059480ef9eaSBarry Smith 
1060480ef9eaSBarry Smith   PetscFunctionBegin;
10619566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10629566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
10633ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
1064480ef9eaSBarry Smith 
10659371c9d4SSatish Balay   xr = A->cmap->n;
10669371c9d4SSatish Balay   yr = A->rmap->n;
10679371c9d4SSatish Balay   h  = yr / 10.0;
10689371c9d4SSatish Balay   w  = xr / 10.0;
10699371c9d4SSatish Balay   xr += w;
10709371c9d4SSatish Balay   yr += h;
10719371c9d4SSatish Balay   xl = -w;
10729371c9d4SSatish Balay   yl = -h;
10739566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10749566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10759566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10769566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10779566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10783ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1079416022c9SBarry Smith }
1080416022c9SBarry Smith 
1081d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1082d71ae5a4SJacob Faibussowitsch {
1083ace3abfcSBarry Smith   PetscBool iascii, isbinary, isdraw;
1084416022c9SBarry Smith 
10853a40ed3dSBarry Smith   PetscFunctionBegin;
10869566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii));
10879566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10889566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10891baa6e33SBarry Smith   if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10901baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10911baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10929566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
109417ab2063SBarry Smith }
109519bcc07fSBarry Smith 
1096d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1097d71ae5a4SJacob Faibussowitsch {
1098416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1099580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
1100d0f46423SBarry Smith   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0;
110154f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
11023447b6efSHong Zhang   PetscReal   ratio = 0.6;
110317ab2063SBarry Smith 
11043a40ed3dSBarry Smith   PetscFunctionBegin;
11053ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
11069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
1107b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
1108b215bc84SStefano Zampini     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */
11099566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11103ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1111b215bc84SStefano Zampini   }
111217ab2063SBarry Smith 
111343ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
111417ab2063SBarry Smith   for (i = 1; i < m; i++) {
1115416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
111617ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
111794a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111817ab2063SBarry Smith     if (fshift) {
1119bfeeae90SHong Zhang       ip = aj + ai[i];
1120bfeeae90SHong Zhang       ap = aa + ai[i];
112117ab2063SBarry Smith       N  = ailen[i];
11229566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
112348a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
112417ab2063SBarry Smith     }
112517ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
112617ab2063SBarry Smith   }
112717ab2063SBarry Smith   if (m) {
112817ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112917ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
113017ab2063SBarry Smith   }
113117ab2063SBarry Smith   /* reset ilen and imax for each row */
11327b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1133396832f4SHong Zhang   if (A->structure_only) {
11349566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11359566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1136396832f4SHong Zhang   } else { /* !A->structure_only */
113717ab2063SBarry Smith     for (i = 0; i < m; i++) {
113817ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11397b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
114017ab2063SBarry Smith     }
1141396832f4SHong Zhang   }
1142bfeeae90SHong Zhang   a->nz = ai[m];
1143aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
114417ab2063SBarry Smith 
11459566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
11469566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11479566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11489566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11492205254eSKarl Rupp 
11508e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1151dd5f02e7SSatish Balay   a->reallocs         = 0;
11526712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
115336db0b34SBarry Smith   a->rmax             = rmax;
11544e220ebcSLois Curfman McInnes 
115548a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11569566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
115817ab2063SBarry Smith }
115917ab2063SBarry Smith 
1160d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1161d71ae5a4SJacob Faibussowitsch {
116299cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
116399cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11642e5835c6SStefano Zampini   MatScalar  *aa;
116599cafbc1SBarry Smith 
116699cafbc1SBarry Smith   PetscFunctionBegin;
11679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
116899cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
117299cafbc1SBarry Smith }
117399cafbc1SBarry Smith 
1174d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1175d71ae5a4SJacob Faibussowitsch {
117699cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
117799cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11782e5835c6SStefano Zampini   MatScalar  *aa;
117999cafbc1SBarry Smith 
118099cafbc1SBarry Smith   PetscFunctionBegin;
11819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
118299cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11839566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
118699cafbc1SBarry Smith }
118799cafbc1SBarry Smith 
1188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1189d71ae5a4SJacob Faibussowitsch {
1190fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1191fff043a9SJunchao Zhang   MatScalar  *aa;
11923a40ed3dSBarry Smith 
11933a40ed3dSBarry Smith   PetscFunctionBegin;
11949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
11959566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
11969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
11979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
119917ab2063SBarry Smith }
1200416022c9SBarry Smith 
1201d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1202d71ae5a4SJacob Faibussowitsch {
1203416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1204d5d45c9bSBarry Smith 
12053a40ed3dSBarry Smith   PetscFunctionBegin;
1206b4e2f619SBarry Smith   if (A->hash_active) {
1207*e3c72094SPierre Jolivet     A->ops[0] = a->cops;
1208b4e2f619SBarry Smith     PetscCall(PetscHMapIJVDestroy(&a->ht));
1209b4e2f619SBarry Smith     PetscCall(PetscFree(a->dnz));
1210b4e2f619SBarry Smith     A->hash_active = PETSC_FALSE;
1211b4e2f619SBarry Smith   }
1212b4e2f619SBarry Smith 
1213aa482453SBarry Smith #if defined(PETSC_USE_LOG)
12143ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz));
121517ab2063SBarry Smith #endif
12169566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12179566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12189566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12199566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12209566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12219566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12229566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12239566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12249566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12259566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12269566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12279566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
12289566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12299566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
12309566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1231901853e0SKris Buschelman 
12326718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12336718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12346718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12356718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12366718818eSStefano Zampini      due to different matrix sizes */
12379566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12386718818eSStefano Zampini 
12399566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12402e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12412e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12459566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12469566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12479566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12482e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12492e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12502e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12512e956fe4SStefano Zampini #endif
12524222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12549566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12564222ddf1SHong Zhang #endif
1257d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
1258d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL));
1259d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL));
1260d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL));
1261d5e393b6SSuyash Tandon #endif
12623d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12639566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12643d0639e7SStefano Zampini #endif
12659566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1266af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12679566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1268af8000cdSHong Zhang #endif
1269d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
12709566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1271d24d4204SJose E. Roman #endif
127263c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12739566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12749566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
127563c07aadSStefano Zampini #endif
12769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
12789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
12799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
12802e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
12819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
12829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
12839566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
12849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
12859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
12869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
12879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
12889566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
12899566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
12909566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
12912e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
12922e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
12932e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
12942e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
12952e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
12962e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
12972e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
12983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
129917ab2063SBarry Smith }
130017ab2063SBarry Smith 
1301d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1302d71ae5a4SJacob Faibussowitsch {
1303416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
13043a40ed3dSBarry Smith 
13053a40ed3dSBarry Smith   PetscFunctionBegin;
1306a65d3064SKris Buschelman   switch (op) {
1307d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1308d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1309d71ae5a4SJacob Faibussowitsch     break;
1310d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1311d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1312d71ae5a4SJacob Faibussowitsch     break;
1313d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1314d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1315d71ae5a4SJacob Faibussowitsch     break;
1316d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1317d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1318d71ae5a4SJacob Faibussowitsch     break;
1319d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1320d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1321d71ae5a4SJacob Faibussowitsch     break;
1322d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1323d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1324d71ae5a4SJacob Faibussowitsch     break;
1325d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1326d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1327d71ae5a4SJacob Faibussowitsch     break;
13283d472b54SHong Zhang   case MAT_SPD:
1329b1646e73SJed Brown   case MAT_SYMMETRIC:
1330b1646e73SJed Brown   case MAT_STRUCTURALLY_SYMMETRIC:
1331b1646e73SJed Brown   case MAT_HERMITIAN:
1332b1646e73SJed Brown   case MAT_SYMMETRY_ETERNAL:
1333957cac9fSHong Zhang   case MAT_STRUCTURE_ONLY:
1334b94d7dedSBarry Smith   case MAT_STRUCTURAL_SYMMETRY_ETERNAL:
1335b94d7dedSBarry Smith   case MAT_SPD_ETERNAL:
1336b94d7dedSBarry Smith     /* if the diagonal matrix is square it inherits some of the properties above */
13375021d80fSJed Brown     break;
13388c78258cSHong Zhang   case MAT_FORCE_DIAGONAL_ENTRIES:
1339a65d3064SKris Buschelman   case MAT_IGNORE_OFF_PROC_ENTRIES:
1340d71ae5a4SJacob Faibussowitsch   case MAT_USE_HASH_TABLE:
1341d71ae5a4SJacob Faibussowitsch     PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op]));
1342d71ae5a4SJacob Faibussowitsch     break;
1343d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1344d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1345d71ae5a4SJacob Faibussowitsch     break;
1346d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1347d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1348d71ae5a4SJacob Faibussowitsch     break;
1349071fcb05SBarry Smith   case MAT_SORTED_FULL:
1350071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1351071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1352071fcb05SBarry Smith     break;
1353d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1354d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1355d71ae5a4SJacob Faibussowitsch     break;
1356d71ae5a4SJacob Faibussowitsch   default:
1357d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op);
1358a65d3064SKris Buschelman   }
13593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
136017ab2063SBarry Smith }
136117ab2063SBarry Smith 
1362d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1363d71ae5a4SJacob Faibussowitsch {
1364416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1365fdc842d1SBarry Smith   PetscInt           i, j, n, *ai = a->i, *aj = a->j;
1366c898d852SStefano Zampini   PetscScalar       *x;
1367c898d852SStefano Zampini   const PetscScalar *aa;
136817ab2063SBarry Smith 
13693a40ed3dSBarry Smith   PetscFunctionBegin;
13709566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
137108401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1373d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1374d3e70bfaSHong Zhang     PetscInt *diag = a->diag;
13759566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
13762c990fa1SHong Zhang     for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13779566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13789566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13793ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
138035e7444dSHong Zhang   }
138135e7444dSHong Zhang 
13829566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
138335e7444dSHong Zhang   for (i = 0; i < n; i++) {
1384fdc842d1SBarry Smith     x[i] = 0.0;
138535e7444dSHong Zhang     for (j = ai[i]; j < ai[i + 1]; j++) {
138635e7444dSHong Zhang       if (aj[j] == i) {
138735e7444dSHong Zhang         x[i] = aa[j];
138817ab2063SBarry Smith         break;
138917ab2063SBarry Smith       }
139017ab2063SBarry Smith     }
139117ab2063SBarry Smith   }
13929566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
13939566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13943ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
139517ab2063SBarry Smith }
139617ab2063SBarry Smith 
1397c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1398d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1399d71ae5a4SJacob Faibussowitsch {
1400416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
14015f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1402d9ca1df4SBarry Smith   PetscScalar       *y;
1403d9ca1df4SBarry Smith   const PetscScalar *x;
1404d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
14055c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
14065f22a7b3SSebastian Grimberg   const MatScalar  *v;
1407a77337e4SBarry Smith   PetscScalar       alpha;
1408d9ca1df4SBarry Smith   PetscInt          n, i, j;
1409d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14103447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1411ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14125c897100SBarry Smith #endif
141317ab2063SBarry Smith 
14143a40ed3dSBarry Smith   PetscFunctionBegin;
14159566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14169566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14179566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14189566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14195c897100SBarry Smith 
14205c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1421fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14225c897100SBarry Smith #else
14233447b6efSHong Zhang   if (usecprow) {
14243447b6efSHong Zhang     m    = cprow.nrows;
14253447b6efSHong Zhang     ii   = cprow.i;
14267b2bb3b9SHong Zhang     ridx = cprow.rindex;
14273447b6efSHong Zhang   } else {
14283447b6efSHong Zhang     ii = a->i;
14293447b6efSHong Zhang   }
143017ab2063SBarry Smith   for (i = 0; i < m; i++) {
14313447b6efSHong Zhang     idx = a->j + ii[i];
1432fff043a9SJunchao Zhang     v   = aa + ii[i];
14333447b6efSHong Zhang     n   = ii[i + 1] - ii[i];
14343447b6efSHong Zhang     if (usecprow) {
14357b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14363447b6efSHong Zhang     } else {
143717ab2063SBarry Smith       alpha = x[i];
14383447b6efSHong Zhang     }
143904fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
144017ab2063SBarry Smith   }
14415c897100SBarry Smith #endif
14429566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14439566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14449566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14459566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
144717ab2063SBarry Smith }
144817ab2063SBarry Smith 
1449d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1450d71ae5a4SJacob Faibussowitsch {
14515c897100SBarry Smith   PetscFunctionBegin;
14529566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14539566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14543ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14555c897100SBarry Smith }
14565c897100SBarry Smith 
1457c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
145878b84d54SShri Abhyankar 
1459d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1460d71ae5a4SJacob Faibussowitsch {
1461416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1462d9fead3dSBarry Smith   PetscScalar       *y;
146354f21887SBarry Smith   const PetscScalar *x;
1464fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1465003131ecSBarry Smith   PetscInt           m = A->rmap->n;
14660298fd71SBarry Smith   const PetscInt    *aj, *ii, *ridx = NULL;
14677b083b7cSBarry Smith   PetscInt           n, i;
1468362ced78SSatish Balay   PetscScalar        sum;
1469ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
147017ab2063SBarry Smith 
1471b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
147297952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1473fee21e36SBarry Smith #endif
1474fee21e36SBarry Smith 
14753a40ed3dSBarry Smith   PetscFunctionBegin;
1476b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14779566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
14783ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1479b215bc84SStefano Zampini   }
14809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14819566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14829566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1483416022c9SBarry Smith   ii = a->i;
14844eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14859566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
148697952fefSHong Zhang     m    = a->compressedrow.nrows;
148797952fefSHong Zhang     ii   = a->compressedrow.i;
148897952fefSHong Zhang     ridx = a->compressedrow.rindex;
148997952fefSHong Zhang     for (i = 0; i < m; i++) {
149097952fefSHong Zhang       n   = ii[i + 1] - ii[i];
149197952fefSHong Zhang       aj  = a->j + ii[i];
1492fff043a9SJunchao Zhang       aa  = a_a + ii[i];
149397952fefSHong Zhang       sum = 0.0;
1494003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1495003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
149697952fefSHong Zhang       y[*ridx++] = sum;
149797952fefSHong Zhang     }
149897952fefSHong Zhang   } else { /* do not use compressed row format */
1499b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
15003d3eaba7SBarry Smith     aj = a->j;
1501fff043a9SJunchao Zhang     aa = a_a;
1502b05257ddSBarry Smith     fortranmultaij_(&m, x, ii, aj, aa, y);
1503b05257ddSBarry Smith #else
150417ab2063SBarry Smith     for (i = 0; i < m; i++) {
1505003131ecSBarry Smith       n   = ii[i + 1] - ii[i];
1506003131ecSBarry Smith       aj  = a->j + ii[i];
1507fff043a9SJunchao Zhang       aa  = a_a + ii[i];
150817ab2063SBarry Smith       sum = 0.0;
1509003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
151017ab2063SBarry Smith       y[i] = sum;
151117ab2063SBarry Smith     }
15128d195f9aSBarry Smith #endif
1513b05257ddSBarry Smith   }
15149566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15159566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15169566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15179566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
151917ab2063SBarry Smith }
152017ab2063SBarry Smith 
1521d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1522d71ae5a4SJacob Faibussowitsch {
1523b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1524b434eb95SMatthew G. Knepley   PetscScalar       *y;
1525b434eb95SMatthew G. Knepley   const PetscScalar *x;
1526fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1527b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1528b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1529b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1530b434eb95SMatthew G. Knepley   PetscScalar        sum;
1531b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1532b434eb95SMatthew G. Knepley 
1533b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1534b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1535b434eb95SMatthew G. Knepley #endif
1536b434eb95SMatthew G. Knepley 
1537b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15389566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15399566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15409566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1541b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1542b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1543b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1544b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1545b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1546b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1547b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1548fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1549b434eb95SMatthew G. Knepley       sum = 0.0;
1550b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1551b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1552b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1553b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1554b434eb95SMatthew G. Knepley     }
1555b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15563d3eaba7SBarry Smith     ii = a->i;
1557b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1558b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1559b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1560fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1561b434eb95SMatthew G. Knepley       sum = 0.0;
1562b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1563b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1564b434eb95SMatthew G. Knepley       y[i] = sum;
1565b434eb95SMatthew G. Knepley     }
1566b434eb95SMatthew G. Knepley   }
15679566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15689566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15699566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1572b434eb95SMatthew G. Knepley }
1573b434eb95SMatthew G. Knepley 
1574d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1575d71ae5a4SJacob Faibussowitsch {
1576b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1577b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1578b434eb95SMatthew G. Knepley   const PetscScalar *x;
1579fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1580b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1581b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1582b434eb95SMatthew G. Knepley   PetscScalar        sum;
1583b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1584b434eb95SMatthew G. Knepley 
1585b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15869566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15879566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15889566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1589b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
159048a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1591b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1592b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1593b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1594b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1595b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1596b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1597fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1598b434eb95SMatthew G. Knepley       sum = y[*ridx];
1599b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1600b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1601b434eb95SMatthew G. Knepley     }
1602b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
16033d3eaba7SBarry Smith     ii = a->i;
1604b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1605b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1606b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1607fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1608b434eb95SMatthew G. Knepley       sum = y[i];
1609b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1610b434eb95SMatthew G. Knepley       z[i] = sum;
1611b434eb95SMatthew G. Knepley     }
1612b434eb95SMatthew G. Knepley   }
16139566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16149566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16159566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1618b434eb95SMatthew G. Knepley }
1619b434eb95SMatthew G. Knepley 
1620c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1621d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1622d71ae5a4SJacob Faibussowitsch {
1623416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1624f15663dcSBarry Smith   PetscScalar       *y, *z;
1625f15663dcSBarry Smith   const PetscScalar *x;
1626fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1627d9ca1df4SBarry Smith   const PetscInt    *aj, *ii, *ridx = NULL;
1628d9ca1df4SBarry Smith   PetscInt           m = A->rmap->n, n, i;
1629362ced78SSatish Balay   PetscScalar        sum;
1630ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16319ea0dfa2SSatish Balay 
16323a40ed3dSBarry Smith   PetscFunctionBegin;
1633b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16349566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
16353ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1636b215bc84SStefano Zampini   }
16379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16389566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16399566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16404eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
164148a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
164297952fefSHong Zhang     m    = a->compressedrow.nrows;
164397952fefSHong Zhang     ii   = a->compressedrow.i;
164497952fefSHong Zhang     ridx = a->compressedrow.rindex;
164597952fefSHong Zhang     for (i = 0; i < m; i++) {
164697952fefSHong Zhang       n   = ii[i + 1] - ii[i];
164797952fefSHong Zhang       aj  = a->j + ii[i];
1648fff043a9SJunchao Zhang       aa  = a_a + ii[i];
164997952fefSHong Zhang       sum = y[*ridx];
1650f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
165197952fefSHong Zhang       z[*ridx++] = sum;
165297952fefSHong Zhang     }
165397952fefSHong Zhang   } else { /* do not use compressed row format */
16543d3eaba7SBarry Smith     ii = a->i;
1655f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
16563d3eaba7SBarry Smith     aj = a->j;
1657fff043a9SJunchao Zhang     aa = a_a;
1658f15663dcSBarry Smith     fortranmultaddaij_(&m, x, ii, aj, aa, y, z);
1659f15663dcSBarry Smith #else
166017ab2063SBarry Smith     for (i = 0; i < m; i++) {
1661f15663dcSBarry Smith       n   = ii[i + 1] - ii[i];
1662f15663dcSBarry Smith       aj  = a->j + ii[i];
1663fff043a9SJunchao Zhang       aa  = a_a + ii[i];
166417ab2063SBarry Smith       sum = y[i];
1665f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
166617ab2063SBarry Smith       z[i] = sum;
166717ab2063SBarry Smith     }
166802ab625aSSatish Balay #endif
1669f15663dcSBarry Smith   }
16709566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16719566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16729566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16739566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
167517ab2063SBarry Smith }
167617ab2063SBarry Smith 
167717ab2063SBarry Smith /*
167817ab2063SBarry Smith      Adds diagonal pointers to sparse matrix structure.
167917ab2063SBarry Smith */
1680d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
1681d71ae5a4SJacob Faibussowitsch {
1682416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1683d0f46423SBarry Smith   PetscInt    i, j, m = A->rmap->n;
1684c0c07093SJunchao Zhang   PetscBool   alreadySet = PETSC_TRUE;
168517ab2063SBarry Smith 
16863a40ed3dSBarry Smith   PetscFunctionBegin;
168709f38230SBarry Smith   if (!a->diag) {
16889566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &a->diag));
1689c0c07093SJunchao Zhang     alreadySet = PETSC_FALSE;
169009f38230SBarry Smith   }
1691d0f46423SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
1692c0c07093SJunchao Zhang     /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */
1693c0c07093SJunchao Zhang     if (alreadySet) {
1694c0c07093SJunchao Zhang       PetscInt pos = a->diag[i];
1695c0c07093SJunchao Zhang       if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue;
1696c0c07093SJunchao Zhang     }
1697c0c07093SJunchao Zhang 
169809f38230SBarry Smith     a->diag[i] = a->i[i + 1];
1699bfeeae90SHong Zhang     for (j = a->i[i]; j < a->i[i + 1]; j++) {
1700bfeeae90SHong Zhang       if (a->j[j] == i) {
170109f38230SBarry Smith         a->diag[i] = j;
170217ab2063SBarry Smith         break;
170317ab2063SBarry Smith       }
170417ab2063SBarry Smith     }
170517ab2063SBarry Smith   }
17063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
170717ab2063SBarry Smith }
170817ab2063SBarry Smith 
1709d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1710d71ae5a4SJacob Faibussowitsch {
171161ecd0c6SBarry Smith   Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
171261ecd0c6SBarry Smith   const PetscInt *diag = (const PetscInt *)a->diag;
171361ecd0c6SBarry Smith   const PetscInt *ii   = (const PetscInt *)a->i;
171461ecd0c6SBarry Smith   PetscInt        i, *mdiag = NULL;
171561ecd0c6SBarry Smith   PetscInt        cnt = 0; /* how many diagonals are missing */
171661ecd0c6SBarry Smith 
171761ecd0c6SBarry Smith   PetscFunctionBegin;
171861ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
17199566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
17209566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
17213ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
172261ecd0c6SBarry Smith   }
172361ecd0c6SBarry Smith 
172461ecd0c6SBarry Smith   if (a->diagonaldense) {
172561ecd0c6SBarry Smith     cnt = 0;
172661ecd0c6SBarry Smith   } else {
17279566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
172861ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
1729349d3b71SJunchao Zhang       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
173061ecd0c6SBarry Smith         cnt++;
173161ecd0c6SBarry Smith         mdiag[i] = 1;
173261ecd0c6SBarry Smith       }
173361ecd0c6SBarry Smith     }
173461ecd0c6SBarry Smith   }
173561ecd0c6SBarry Smith   if (!cnt) {
17369566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
173761ecd0c6SBarry Smith   } else {
1738b6f2aa54SBarry Smith     PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1739b6f2aa54SBarry Smith     PetscInt    *oldj = a->j, *oldi = a->i;
174061ecd0c6SBarry Smith     PetscBool    singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij;
174161ecd0c6SBarry Smith 
174261ecd0c6SBarry Smith     a->a = NULL;
174361ecd0c6SBarry Smith     a->j = NULL;
174461ecd0c6SBarry Smith     a->i = NULL;
174561ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
1746ad540459SPierre Jolivet     for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17479566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
174861ecd0c6SBarry Smith 
174961ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
175061ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
17519566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
175248a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1753447d62f5SStefano Zampini     }
17549566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17559566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
175661ecd0c6SBarry Smith     if (singlemalloc) {
17579566063dSJacob Faibussowitsch       PetscCall(PetscFree3(olda, oldj, oldi));
175861ecd0c6SBarry Smith     } else {
17599566063dSJacob Faibussowitsch       if (free_a) PetscCall(PetscFree(olda));
17609566063dSJacob Faibussowitsch       if (free_ij) PetscCall(PetscFree(oldj));
17619566063dSJacob Faibussowitsch       if (free_ij) PetscCall(PetscFree(oldi));
176261ecd0c6SBarry Smith     }
176361ecd0c6SBarry Smith   }
17649566063dSJacob Faibussowitsch   PetscCall(PetscFree(mdiag));
176561ecd0c6SBarry Smith   a->diagonaldense = PETSC_TRUE;
17663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
176761ecd0c6SBarry Smith }
176861ecd0c6SBarry Smith 
1769be5855fcSBarry Smith /*
1770be5855fcSBarry Smith      Checks for missing diagonals
1771be5855fcSBarry Smith */
1772d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d)
1773d71ae5a4SJacob Faibussowitsch {
1774be5855fcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
17757734d3b5SMatthew G. Knepley   PetscInt   *diag, *ii = a->i, i;
1776be5855fcSBarry Smith 
1777be5855fcSBarry Smith   PetscFunctionBegin;
177809f38230SBarry Smith   *missing = PETSC_FALSE;
17797734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
178009f38230SBarry Smith     *missing = PETSC_TRUE;
178109f38230SBarry Smith     if (d) *d = 0;
17829566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
178309f38230SBarry Smith   } else {
178401445905SHong Zhang     PetscInt n;
178501445905SHong Zhang     n    = PetscMin(A->rmap->n, A->cmap->n);
1786f1e2ffcdSBarry Smith     diag = a->diag;
178701445905SHong Zhang     for (i = 0; i < n; i++) {
17887734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
178909f38230SBarry Smith         *missing = PETSC_TRUE;
179009f38230SBarry Smith         if (d) *d = i;
17919566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i));
1792358d2f5dSShri Abhyankar         break;
179309f38230SBarry Smith       }
1794be5855fcSBarry Smith     }
1795be5855fcSBarry Smith   }
17963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1797be5855fcSBarry Smith }
1798be5855fcSBarry Smith 
17990da83c2eSBarry Smith #include <petscblaslapack.h>
18000da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
18010da83c2eSBarry Smith 
18020da83c2eSBarry Smith /*
18030da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
18040da83c2eSBarry Smith */
1805d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1806d71ae5a4SJacob Faibussowitsch {
18070da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
18080da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
18090da83c2eSBarry Smith   const PetscReal shift = 0.0;
18100da83c2eSBarry Smith   PetscInt        ipvt[5];
18114e208921SJed Brown   PetscCount      flops = 0;
18120da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
18130da83c2eSBarry Smith 
18140da83c2eSBarry Smith   PetscFunctionBegin;
18150da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
18160da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
181708401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1818ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
18199566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
182048a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
18210da83c2eSBarry Smith   ncnt = 0;
18220da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
18230da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
18249566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
18250da83c2eSBarry Smith     switch (bsizes[i]) {
1826d71ae5a4SJacob Faibussowitsch     case 1:
1827d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1828d71ae5a4SJacob Faibussowitsch       break;
18290da83c2eSBarry Smith     case 2:
18309566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
18310da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18329566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
18330da83c2eSBarry Smith       break;
18340da83c2eSBarry Smith     case 3:
18359566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
18360da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18379566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
18380da83c2eSBarry Smith       break;
18390da83c2eSBarry Smith     case 4:
18409566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
18410da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18429566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
18430da83c2eSBarry Smith       break;
18440da83c2eSBarry Smith     case 5:
18459566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
18460da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18479566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
18480da83c2eSBarry Smith       break;
18490da83c2eSBarry Smith     case 6:
18509566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
18510da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18529566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
18530da83c2eSBarry Smith       break;
18540da83c2eSBarry Smith     case 7:
18559566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
18560da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18579566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
18580da83c2eSBarry Smith       break;
18590da83c2eSBarry Smith     default:
18609566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
18610da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18629566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
18630da83c2eSBarry Smith     }
18640da83c2eSBarry Smith     ncnt += bsizes[i];
18650da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
18664e208921SJed Brown     flops += 2 * PetscPowInt(bsizes[i], 3) / 3;
18670da83c2eSBarry Smith   }
18683ba16761SJacob Faibussowitsch   PetscCall(PetscLogFlops(flops));
186948a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18709566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18720da83c2eSBarry Smith }
18730da83c2eSBarry Smith 
1874422a814eSBarry Smith /*
1875422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1876422a814eSBarry Smith */
1877d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1878d71ae5a4SJacob Faibussowitsch {
187971f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1880d0f46423SBarry Smith   PetscInt         i, *diag, m = A->rmap->n;
18812e5835c6SStefano Zampini   const MatScalar *v;
188254f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
188371f1c65dSBarry Smith 
188471f1c65dSBarry Smith   PetscFunctionBegin;
18853ba16761SJacob Faibussowitsch   if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS);
18869566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
188771f1c65dSBarry Smith   diag = a->diag;
18884dfa11a4SJacob Faibussowitsch   if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); }
18892e5835c6SStefano Zampini 
189071f1c65dSBarry Smith   mdiag = a->mdiag;
189171f1c65dSBarry Smith   idiag = a->idiag;
18929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1893422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
189471f1c65dSBarry Smith     for (i = 0; i < m; i++) {
189571f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1896899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1897899639b0SHong Zhang         if (PetscRealPart(fshift)) {
18989566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
18997b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
19007b6c816cSBarry Smith           A->factorerror_zeropivot_value = 0.0;
19017b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
190298921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
1903899639b0SHong Zhang       }
190471f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
190571f1c65dSBarry Smith     }
19069566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
190771f1c65dSBarry Smith   } else {
190871f1c65dSBarry Smith     for (i = 0; i < m; i++) {
190971f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
191071f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
191171f1c65dSBarry Smith     }
19129566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
191371f1c65dSBarry Smith   }
191471f1c65dSBarry Smith   a->idiagvalid = PETSC_TRUE;
19159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
19163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
191771f1c65dSBarry Smith }
191871f1c65dSBarry Smith 
1919c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h>
1920d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1921d71ae5a4SJacob Faibussowitsch {
1922416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1923e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
19242e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
192554f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
19263d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
192797f1f81fSBarry Smith   const PetscInt    *idx, *diag;
192817ab2063SBarry Smith 
19293a40ed3dSBarry Smith   PetscFunctionBegin;
1930b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
19319566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
19323ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1933b215bc84SStefano Zampini   }
1934b965ef7fSBarry Smith   its = its * lits;
193591723122SBarry Smith 
193671f1c65dSBarry Smith   if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
19379566063dSJacob Faibussowitsch   if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift));
193871f1c65dSBarry Smith   a->fshift = fshift;
193971f1c65dSBarry Smith   a->omega  = omega;
1940ed480e8bSBarry Smith 
194171f1c65dSBarry Smith   diag  = a->diag;
194271f1c65dSBarry Smith   t     = a->ssor_work;
1943ed480e8bSBarry Smith   idiag = a->idiag;
194471f1c65dSBarry Smith   mdiag = a->mdiag;
1945ed480e8bSBarry Smith 
19469566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
19479566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
19489566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1949ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
195017ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
195117ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1952ed480e8bSBarry Smith     bs = b;
195317ab2063SBarry Smith     for (i = 0; i < m; i++) {
195471f1c65dSBarry Smith       d   = fshift + mdiag[i];
1955416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1956ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19572e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
195817ab2063SBarry Smith       sum = b[i] * d / omega;
1959003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
196017ab2063SBarry Smith       x[i] = sum;
196117ab2063SBarry Smith     }
19629566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19639566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19649566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
19659566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
19663ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
196717ab2063SBarry Smith   }
1968c783ea89SBarry Smith 
196908401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1970f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19714c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1972887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
197317ab2063SBarry Smith 
197417ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
197517ab2063SBarry Smith 
1976887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
197717ab2063SBarry Smith     */
197817ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
197917ab2063SBarry Smith 
198017ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
198117ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1982416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1983ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19842e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
198517ab2063SBarry Smith       sum = b[i];
1986e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1987ed480e8bSBarry Smith       x[i] = sum * idiag[i];
198817ab2063SBarry Smith     }
198917ab2063SBarry Smith 
199017ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19912e5835c6SStefano Zampini     v = aa;
19922205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
199317ab2063SBarry Smith 
199417ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1995ed480e8bSBarry Smith     ts   = t;
1996416022c9SBarry Smith     diag = a->diag;
199717ab2063SBarry Smith     for (i = 0; i < m; i++) {
1998416022c9SBarry Smith       n   = diag[i] - a->i[i];
1999ed480e8bSBarry Smith       idx = a->j + a->i[i];
20002e5835c6SStefano Zampini       v   = aa + a->i[i];
200117ab2063SBarry Smith       sum = t[i];
2002003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
2003ed480e8bSBarry Smith       t[i] = sum * idiag[i];
2004733d66baSBarry Smith       /*  x = x + t */
2005733d66baSBarry Smith       x[i] += t[i];
200617ab2063SBarry Smith     }
200717ab2063SBarry Smith 
20089566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
20099566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
20109566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
20113ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
201217ab2063SBarry Smith   }
201317ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
201417ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
201517ab2063SBarry Smith       for (i = 0; i < m; i++) {
2016416022c9SBarry Smith         n   = diag[i] - a->i[i];
2017ed480e8bSBarry Smith         idx = a->j + a->i[i];
20182e5835c6SStefano Zampini         v   = aa + a->i[i];
201917ab2063SBarry Smith         sum = b[i];
2020e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20215c99c7daSBarry Smith         t[i] = sum;
2022ed480e8bSBarry Smith         x[i] = sum * idiag[i];
202317ab2063SBarry Smith       }
20245c99c7daSBarry Smith       xb = t;
20259566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
20263a40ed3dSBarry Smith     } else xb = b;
202717ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
202817ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2029416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
2030ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
20312e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
203217ab2063SBarry Smith         sum = xb[i];
2033e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20345c99c7daSBarry Smith         if (xb == b) {
2035ed480e8bSBarry Smith           x[i] = sum * idiag[i];
20365c99c7daSBarry Smith         } else {
2037b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
203817ab2063SBarry Smith         }
20395c99c7daSBarry Smith       }
20409566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
204117ab2063SBarry Smith     }
204217ab2063SBarry Smith     its--;
204317ab2063SBarry Smith   }
204417ab2063SBarry Smith   while (its--) {
204517ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
204617ab2063SBarry Smith       for (i = 0; i < m; i++) {
2047b19a5dc2SMark Adams         /* lower */
2048b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
2049ed480e8bSBarry Smith         idx = a->j + a->i[i];
20502e5835c6SStefano Zampini         v   = aa + a->i[i];
205117ab2063SBarry Smith         sum = b[i];
2052e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2053b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
2054b19a5dc2SMark Adams         /* upper */
2055b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
2056b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
20572e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
2058b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2059b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
206017ab2063SBarry Smith       }
2061b19a5dc2SMark Adams       xb = t;
20629566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
2063b19a5dc2SMark Adams     } else xb = b;
206417ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
206517ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2066b19a5dc2SMark Adams         sum = xb[i];
2067b19a5dc2SMark Adams         if (xb == b) {
2068b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
2069416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
2070ed480e8bSBarry Smith           idx = a->j + a->i[i];
20712e5835c6SStefano Zampini           v   = aa + a->i[i];
2072e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2073ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2074b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2075b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2076b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20772e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2078b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2079b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
208017ab2063SBarry Smith         }
2081b19a5dc2SMark Adams       }
2082b19a5dc2SMark Adams       if (xb == b) {
20839566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2084b19a5dc2SMark Adams       } else {
20859566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2086b19a5dc2SMark Adams       }
208717ab2063SBarry Smith     }
208817ab2063SBarry Smith   }
20899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20909566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20919566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
20923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
209317ab2063SBarry Smith }
209417ab2063SBarry Smith 
2095d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2096d71ae5a4SJacob Faibussowitsch {
2097416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
20984e220ebcSLois Curfman McInnes 
20993a40ed3dSBarry Smith   PetscFunctionBegin;
21004e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
21013966268fSBarry Smith   info->nz_allocated = a->maxnz;
21023966268fSBarry Smith   info->nz_used      = a->nz;
21033966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
21043966268fSBarry Smith   info->assemblies   = A->num_ass;
21053966268fSBarry Smith   info->mallocs      = A->info.mallocs;
21064dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2107d5f3da31SBarry Smith   if (A->factortype) {
21084e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
21094e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
21104e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
21114e220ebcSLois Curfman McInnes   } else {
21124e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
21134e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
21144e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
21154e220ebcSLois Curfman McInnes   }
21163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
211717ab2063SBarry Smith }
211817ab2063SBarry Smith 
2119d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2120d71ae5a4SJacob Faibussowitsch {
2121416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2122c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
212397b48c8fSBarry Smith   const PetscScalar *xx;
21242e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2125c7da8527SEric Chamberland   PetscInt           d = 0;
212617ab2063SBarry Smith 
21273a40ed3dSBarry Smith   PetscFunctionBegin;
212897b48c8fSBarry Smith   if (x && b) {
21299566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21309566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
213197b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2132aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2133447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
213497b48c8fSBarry Smith       bb[rows[i]] = diag * xx[rows[i]];
213597b48c8fSBarry Smith     }
21369566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21379566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
213897b48c8fSBarry Smith   }
213997b48c8fSBarry Smith 
21409566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2141a9817697SBarry Smith   if (a->keepnonzeropattern) {
2142f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2143aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21449566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2145f1e2ffcdSBarry Smith     }
2146f4df32b1SMatthew Knepley     if (diag != 0.0) {
2147c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2148c7da8527SEric Chamberland         d = rows[i];
2149447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
215008401ef6SPierre Jolivet         PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
2151c7da8527SEric Chamberland       }
2152f1e2ffcdSBarry Smith       for (i = 0; i < N; i++) {
2153447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
21542e5835c6SStefano Zampini         aa[a->diag[rows[i]]] = diag;
2155f1e2ffcdSBarry Smith       }
2156f1e2ffcdSBarry Smith     }
2157f1e2ffcdSBarry Smith   } else {
2158f4df32b1SMatthew Knepley     if (diag != 0.0) {
215917ab2063SBarry Smith       for (i = 0; i < N; i++) {
2160aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21617ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2162447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2163447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2164447d62f5SStefano Zampini           } else {
2165416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
21662e5835c6SStefano Zampini             aa[a->i[rows[i]]]   = diag;
2167bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2168447d62f5SStefano Zampini           }
2169447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
21709566063dSJacob Faibussowitsch           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
217117ab2063SBarry Smith         }
217217ab2063SBarry Smith       }
21733a40ed3dSBarry Smith     } else {
217417ab2063SBarry Smith       for (i = 0; i < N; i++) {
2175aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2176416022c9SBarry Smith         a->ilen[rows[i]] = 0;
217717ab2063SBarry Smith       }
217817ab2063SBarry Smith     }
2179e56f5c9eSBarry Smith     A->nonzerostate++;
2180f1e2ffcdSBarry Smith   }
21819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2182dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21833ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
218417ab2063SBarry Smith }
218517ab2063SBarry Smith 
2186d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2187d71ae5a4SJacob Faibussowitsch {
21886e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21896e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
21902b40b63fSBarry Smith   PetscBool          missing, *zeroed, vecs = PETSC_FALSE;
21916e169961SBarry Smith   const PetscScalar *xx;
21922e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
21936e169961SBarry Smith 
21946e169961SBarry Smith   PetscFunctionBegin;
21953ba16761SJacob Faibussowitsch   if (!N) PetscFunctionReturn(PETSC_SUCCESS);
21969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
21976e169961SBarry Smith   if (x && b) {
21989566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21999566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
22002b40b63fSBarry Smith     vecs = PETSC_TRUE;
22016e169961SBarry Smith   }
22029566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
22036e169961SBarry Smith   for (i = 0; i < N; i++) {
2204aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
22059566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
22062205254eSKarl Rupp 
22076e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
22086e169961SBarry Smith   }
22096e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
22106e169961SBarry Smith     if (!zeroed[i]) {
22116e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
22124cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
22132e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
22142e5835c6SStefano Zampini           aa[j] = 0.0;
22156e169961SBarry Smith         }
22166e169961SBarry Smith       }
22174cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i];
22186e169961SBarry Smith   }
22196e169961SBarry Smith   if (x && b) {
22209566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
22219566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
22226e169961SBarry Smith   }
22239566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
22246e169961SBarry Smith   if (diag != 0.0) {
22259566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d));
22261d5a398dSstefano_zampini     if (missing) {
22271d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
22284cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2229aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
22309566063dSJacob Faibussowitsch         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
22311d5a398dSstefano_zampini       }
22321d5a398dSstefano_zampini     } else {
2233ad540459SPierre Jolivet       for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag;
22346e169961SBarry Smith     }
22351d5a398dSstefano_zampini   }
22369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2237dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
22383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22396e169961SBarry Smith }
22406e169961SBarry Smith 
2241d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2242d71ae5a4SJacob Faibussowitsch {
2243fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2244fff043a9SJunchao Zhang   const PetscScalar *aa;
2245fff043a9SJunchao Zhang   PetscInt          *itmp;
224617ab2063SBarry Smith 
22473a40ed3dSBarry Smith   PetscFunctionBegin;
22489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2249416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
22502e5835c6SStefano Zampini   if (v) *v = (PetscScalar *)(aa + a->i[row]);
225117ab2063SBarry Smith   if (idx) {
2252bfeeae90SHong Zhang     itmp = a->j + a->i[row];
225326fbe8dcSKarl Rupp     if (*nz) *idx = itmp;
2254f4259b30SLisandro Dalcin     else *idx = NULL;
225517ab2063SBarry Smith   }
22569566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
22573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225817ab2063SBarry Smith }
225917ab2063SBarry Smith 
2260d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2261d71ae5a4SJacob Faibussowitsch {
22623a40ed3dSBarry Smith   PetscFunctionBegin;
2263cb4a9cd9SHong Zhang   if (nz) *nz = 0;
22642e5835c6SStefano Zampini   if (idx) *idx = NULL;
22652e5835c6SStefano Zampini   if (v) *v = NULL;
22663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
226717ab2063SBarry Smith }
226817ab2063SBarry Smith 
2269d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2270d71ae5a4SJacob Faibussowitsch {
2271416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
22722e5835c6SStefano Zampini   const MatScalar *v;
227336db0b34SBarry Smith   PetscReal        sum = 0.0;
227497f1f81fSBarry Smith   PetscInt         i, j;
227517ab2063SBarry Smith 
22763a40ed3dSBarry Smith   PetscFunctionBegin;
22779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
227817ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2279570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2280570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2281792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2282570b7f6dSBarry Smith #else
2283416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22849371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22859371c9d4SSatish Balay       v++;
228617ab2063SBarry Smith     }
22878f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2288570b7f6dSBarry Smith #endif
22899566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22903a40ed3dSBarry Smith   } else if (type == NORM_1) {
229136db0b34SBarry Smith     PetscReal *tmp;
229297f1f81fSBarry Smith     PetscInt  *jj = a->j;
22939566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp));
2294064f8208SBarry Smith     *nrm = 0.0;
2295416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22969371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22979371c9d4SSatish Balay       v++;
229817ab2063SBarry Smith     }
2299d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2300064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
230117ab2063SBarry Smith     }
23029566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
23039566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
23043a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2305064f8208SBarry Smith     *nrm = 0.0;
2306d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
23072e5835c6SStefano Zampini       const PetscScalar *v2 = v + a->i[j];
230817ab2063SBarry Smith       sum                   = 0.0;
2309416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
23109371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
23119371c9d4SSatish Balay         v2++;
231217ab2063SBarry Smith       }
2313064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
231417ab2063SBarry Smith     }
23159566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
2316f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
23179566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
23183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
231917ab2063SBarry Smith }
232017ab2063SBarry Smith 
2321d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2322d71ae5a4SJacob Faibussowitsch {
23233d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
232454f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
23252e5835c6SStefano Zampini   const MatScalar *va, *vb;
232697f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2327cd0d46ebSvictorle 
2328cd0d46ebSvictorle   PetscFunctionBegin;
23299566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23309566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23315485867bSBarry Smith   if (ma != nb || na != mb) {
23325485867bSBarry Smith     *f = PETSC_FALSE;
23333ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23345485867bSBarry Smith   }
23359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
23369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
23379371c9d4SSatish Balay   aii = aij->i;
23389371c9d4SSatish Balay   bii = bij->i;
23399371c9d4SSatish Balay   adx = aij->j;
23409371c9d4SSatish Balay   bdx = bij->j;
23419566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23429566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2343cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2344cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2345cd0d46ebSvictorle 
2346cd0d46ebSvictorle   *f = PETSC_TRUE;
2347cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2348cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
234997f1f81fSBarry Smith       PetscInt    idc, idr;
23505485867bSBarry Smith       PetscScalar vc, vr;
2351cd0d46ebSvictorle       /* column/row index/value */
23525485867bSBarry Smith       idc = adx[aptr[i]];
23535485867bSBarry Smith       idr = bdx[bptr[idc]];
23545485867bSBarry Smith       vc  = va[aptr[i]];
23555485867bSBarry Smith       vr  = vb[bptr[idc]];
23565485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
23575485867bSBarry Smith         *f = PETSC_FALSE;
23585485867bSBarry Smith         goto done;
2359cd0d46ebSvictorle       } else {
23605485867bSBarry Smith         aptr[i]++;
23615485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2362cd0d46ebSvictorle       }
2363cd0d46ebSvictorle     }
2364cd0d46ebSvictorle   }
2365cd0d46ebSvictorle done:
23669566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23679566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
23699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
23703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2371cd0d46ebSvictorle }
2372cd0d46ebSvictorle 
2373d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2374d71ae5a4SJacob Faibussowitsch {
23753d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
237654f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
237754f21887SBarry Smith   MatScalar  *va, *vb;
23781cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23791cbb95d3SBarry Smith 
23801cbb95d3SBarry Smith   PetscFunctionBegin;
23819566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23829566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23831cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23841cbb95d3SBarry Smith     *f = PETSC_FALSE;
23853ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23861cbb95d3SBarry Smith   }
23879371c9d4SSatish Balay   aii = aij->i;
23889371c9d4SSatish Balay   bii = bij->i;
23899371c9d4SSatish Balay   adx = aij->j;
23909371c9d4SSatish Balay   bdx = bij->j;
23919371c9d4SSatish Balay   va  = aij->a;
23929371c9d4SSatish Balay   vb  = bij->a;
23939566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23949566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23951cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23961cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23971cbb95d3SBarry Smith 
23981cbb95d3SBarry Smith   *f = PETSC_TRUE;
23991cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
24001cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
24011cbb95d3SBarry Smith       PetscInt    idc, idr;
24021cbb95d3SBarry Smith       PetscScalar vc, vr;
24031cbb95d3SBarry Smith       /* column/row index/value */
24041cbb95d3SBarry Smith       idc = adx[aptr[i]];
24051cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
24061cbb95d3SBarry Smith       vc  = va[aptr[i]];
24071cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
24081cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
24091cbb95d3SBarry Smith         *f = PETSC_FALSE;
24101cbb95d3SBarry Smith         goto done;
24111cbb95d3SBarry Smith       } else {
24121cbb95d3SBarry Smith         aptr[i]++;
24131cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
24141cbb95d3SBarry Smith       }
24151cbb95d3SBarry Smith     }
24161cbb95d3SBarry Smith   }
24171cbb95d3SBarry Smith done:
24189566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
24199566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
24203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24211cbb95d3SBarry Smith }
24221cbb95d3SBarry Smith 
2423d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f)
2424d71ae5a4SJacob Faibussowitsch {
24259e29f15eSvictorle   PetscFunctionBegin;
24269566063dSJacob Faibussowitsch   PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f));
24273ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24289e29f15eSvictorle }
24299e29f15eSvictorle 
2430d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f)
2431d71ae5a4SJacob Faibussowitsch {
24321cbb95d3SBarry Smith   PetscFunctionBegin;
24339566063dSJacob Faibussowitsch   PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f));
24343ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24351cbb95d3SBarry Smith }
24361cbb95d3SBarry Smith 
2437d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2438d71ae5a4SJacob Faibussowitsch {
2439416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2440fff8e43fSBarry Smith   const PetscScalar *l, *r;
2441fff8e43fSBarry Smith   PetscScalar        x;
244254f21887SBarry Smith   MatScalar         *v;
2443fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2444fff8e43fSBarry Smith   const PetscInt    *jj;
244517ab2063SBarry Smith 
24463a40ed3dSBarry Smith   PetscFunctionBegin;
244717ab2063SBarry Smith   if (ll) {
24483ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
24493ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
24509566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
245108401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
24529566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
24539566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
245417ab2063SBarry Smith     for (i = 0; i < m; i++) {
245517ab2063SBarry Smith       x = l[i];
2456416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
24572205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
245817ab2063SBarry Smith     }
24599566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
24609566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
24619566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
246217ab2063SBarry Smith   }
246317ab2063SBarry Smith   if (rr) {
24649566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
246508401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
24669566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
24679566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
24682e5835c6SStefano Zampini     jj = a->j;
24692205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
24709566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
24719566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
24729566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
247317ab2063SBarry Smith   }
24749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
24753ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
247617ab2063SBarry Smith }
247717ab2063SBarry Smith 
2478d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2479d71ae5a4SJacob Faibussowitsch {
2480db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2481d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
248297f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
24835d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
24842e5835c6SStefano Zampini   const PetscScalar *aa;
24855d0c19d7SBarry Smith   PetscInt           nrows, ncols;
248697f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
2487fb3c7e2dSJunchao Zhang   MatScalar         *a_new, *mat_a, *c_a;
2488416022c9SBarry Smith   Mat                C;
2489cdc6f3adSToby Isaac   PetscBool          stride;
249017ab2063SBarry Smith 
24913a40ed3dSBarry Smith   PetscFunctionBegin;
24929566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24939566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24949566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
249517ab2063SBarry Smith 
24969566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2497ff718158SBarry Smith   if (stride) {
24989566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2499ff718158SBarry Smith   } else {
2500ff718158SBarry Smith     first = 0;
2501ff718158SBarry Smith     step  = 0;
2502ff718158SBarry Smith   }
2503fee21e36SBarry Smith   if (stride && step == 1) {
250402834360SBarry Smith     /* special case of contiguous rows */
25059566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
250602834360SBarry Smith     /* loop over new rows determining lens and starting points */
250702834360SBarry Smith     for (i = 0; i < nrows; i++) {
2508bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2509a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2510a91a9bebSLisandro Dalcin       starts[i] = kstart;
251102834360SBarry Smith       for (k = kstart; k < kend; k++) {
2512bfeeae90SHong Zhang         if (aj[k] >= first) {
251302834360SBarry Smith           starts[i] = k;
251402834360SBarry Smith           break;
251502834360SBarry Smith         }
251602834360SBarry Smith       }
2517a2744918SBarry Smith       sum = 0;
251802834360SBarry Smith       while (k < kend) {
2519bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2520a2744918SBarry Smith         sum++;
252102834360SBarry Smith       }
2522a2744918SBarry Smith       lens[i] = sum;
252302834360SBarry Smith     }
252402834360SBarry Smith     /* create submatrix */
2525cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
252697f1f81fSBarry Smith       PetscInt n_cols, n_rows;
25279566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2528aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
25299566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
253008480c60SBarry Smith       C = *B;
25313a40ed3dSBarry Smith     } else {
25323bef6203SJed Brown       PetscInt rbs, cbs;
25339566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25349566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25359566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25369566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25379566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25389566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25399566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
254008480c60SBarry Smith     }
2541db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2542db02288aSLois Curfman McInnes 
254302834360SBarry Smith     /* loop over rows inserting into submatrix */
2544fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C
2545db02288aSLois Curfman McInnes     j_new = c->j;
2546db02288aSLois Curfman McInnes     i_new = c->i;
25479566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
254802834360SBarry Smith     for (i = 0; i < nrows; i++) {
2549a2744918SBarry Smith       ii    = starts[i];
2550a2744918SBarry Smith       lensi = lens[i];
2551ad540459SPierre Jolivet       for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
25529566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2553a2744918SBarry Smith       a_new += lensi;
2554a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2555a2744918SBarry Smith       c->ilen[i]   = lensi;
255602834360SBarry Smith     }
2557fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly
25589566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
25599566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
25603a40ed3dSBarry Smith   } else {
25619566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
25629566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
25639566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
25644dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
25656bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
25664dcab191SBarry Smith       smap[icol[i]] = i + 1;
25674dcab191SBarry Smith     }
25684dcab191SBarry Smith 
256902834360SBarry Smith     /* determine lens of each row */
257002834360SBarry Smith     for (i = 0; i < nrows; i++) {
2571bfeeae90SHong Zhang       kstart  = ai[irow[i]];
257202834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
257302834360SBarry Smith       lens[i] = 0;
257402834360SBarry Smith       for (k = kstart; k < kend; k++) {
2575ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
257602834360SBarry Smith       }
257702834360SBarry Smith     }
257817ab2063SBarry Smith     /* Create and fill new matrix */
2579a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2580ace3abfcSBarry Smith       PetscBool equal;
25810f5bd95cSBarry Smith 
258299141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2583aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
25849566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
258528b400f6SJacob Faibussowitsch       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros");
25869566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
258708480c60SBarry Smith       C = *B;
25883a40ed3dSBarry Smith     } else {
25893bef6203SJed Brown       PetscInt rbs, cbs;
25909566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25919566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25929566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25939566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25949566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25959566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25969566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
259708480c60SBarry Smith     }
25989566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2599fb3c7e2dSJunchao Zhang 
260099141d43SSatish Balay     c = (Mat_SeqAIJ *)(C->data);
2601fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C
260217ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
260399141d43SSatish Balay       row      = irow[i];
2604bfeeae90SHong Zhang       kstart   = ai[row];
260599141d43SSatish Balay       kend     = kstart + a->ilen[row];
2606bfeeae90SHong Zhang       mat_i    = c->i[i];
260799141d43SSatish Balay       mat_j    = c->j + mat_i;
2608fb3c7e2dSJunchao Zhang       mat_a    = c_a + mat_i;
260999141d43SSatish Balay       mat_ilen = c->ilen + i;
261017ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2611bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2612ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
26132e5835c6SStefano Zampini           *mat_a++ = aa[k];
261499141d43SSatish Balay           (*mat_ilen)++;
261517ab2063SBarry Smith         }
261617ab2063SBarry Smith       }
261717ab2063SBarry Smith     }
26189566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
261902834360SBarry Smith     /* Free work space */
26209566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
26219566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
26229566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2623cdc6f3adSToby Isaac     /* sort */
2624cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2625cdc6f3adSToby Isaac       PetscInt ilen;
2626cdc6f3adSToby Isaac 
2627cdc6f3adSToby Isaac       mat_i = c->i[i];
2628cdc6f3adSToby Isaac       mat_j = c->j + mat_i;
2629fb3c7e2dSJunchao Zhang       mat_a = c_a + mat_i;
2630cdc6f3adSToby Isaac       ilen  = c->ilen[i];
26319566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2632cdc6f3adSToby Isaac     }
2633fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a));
263402834360SBarry Smith   }
26358c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
26369566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2637305c6ccfSStefano Zampini #endif
26389566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
26399566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
264017ab2063SBarry Smith 
26419566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2642416022c9SBarry Smith   *B = C;
26433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
264417ab2063SBarry Smith }
264517ab2063SBarry Smith 
2646d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2647d71ae5a4SJacob Faibussowitsch {
264882d44351SHong Zhang   Mat B;
264982d44351SHong Zhang 
265082d44351SHong Zhang   PetscFunctionBegin;
2651c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
26529566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
26539566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
26549566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
26559566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
26569566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
265782d44351SHong Zhang     *subMat = B;
2658c2d650bdSHong Zhang   } else {
26599566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2660c2d650bdSHong Zhang   }
26613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
266282d44351SHong Zhang }
266382d44351SHong Zhang 
2664d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2665d71ae5a4SJacob Faibussowitsch {
266663b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
266763b91edcSBarry Smith   Mat         outA;
2668ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
266963b91edcSBarry Smith 
26703a40ed3dSBarry Smith   PetscFunctionBegin;
267108401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
26721df811f5SHong Zhang 
26739566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
26749566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2675a871dcd8SBarry Smith 
267663b91edcSBarry Smith   outA             = inA;
2677d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26789566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
26799566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
26802205254eSKarl Rupp 
26819566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
26829566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
26832205254eSKarl Rupp 
2684c3122656SLisandro Dalcin   a->row = row;
26852205254eSKarl Rupp 
26869566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
26879566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
26882205254eSKarl Rupp 
2689c3122656SLisandro Dalcin   a->col = col;
269063b91edcSBarry Smith 
269136db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26929566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26939566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2694f0ec6fceSSatish Balay 
269594a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
26969566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work));
269794a9d846SBarry Smith   }
269863b91edcSBarry Smith 
26999566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(inA));
2700137fb511SHong Zhang   if (row_identity && col_identity) {
27019566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2702137fb511SHong Zhang   } else {
27039566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2704137fb511SHong Zhang   }
27053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2706a871dcd8SBarry Smith }
2707a871dcd8SBarry Smith 
2708d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2709d71ae5a4SJacob Faibussowitsch {
2710f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2711dfa0f9e5SStefano Zampini   PetscScalar *v;
2712c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
27133a40ed3dSBarry Smith 
27143a40ed3dSBarry Smith   PetscFunctionBegin;
27159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
27169566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2717792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
27189566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
27199566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
27209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(inA));
27213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2722f0b747eeSBarry Smith }
2723f0b747eeSBarry Smith 
2724d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2725d71ae5a4SJacob Faibussowitsch {
272616b64355SHong Zhang   PetscInt i;
272716b64355SHong Zhang 
272816b64355SHong Zhang   PetscFunctionBegin;
272916b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
27309566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
273116b64355SHong Zhang 
273248a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
27339566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
273416b64355SHong Zhang 
273516b64355SHong Zhang     if (submatj->rbuf1) {
27369566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
27379566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
273816b64355SHong Zhang     }
273916b64355SHong Zhang 
274048a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
27419566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
27429566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
274316b64355SHong Zhang   }
274416b64355SHong Zhang 
274516b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2746eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&submatj->rmap));
27479566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
27489566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
274916b64355SHong Zhang #else
27509566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
275116b64355SHong Zhang #endif
275216b64355SHong Zhang 
275316b64355SHong Zhang   if (!submatj->allcolumns) {
275416b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2755eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap));
275616b64355SHong Zhang #else
27579566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
275816b64355SHong Zhang #endif
275916b64355SHong Zhang   }
27609566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
276116b64355SHong Zhang 
27629566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
27633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
276416b64355SHong Zhang }
276516b64355SHong Zhang 
2766d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2767d71ae5a4SJacob Faibussowitsch {
276816b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
27695c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
277016b64355SHong Zhang 
277116b64355SHong Zhang   PetscFunctionBegin;
27729566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
27739566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
27743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
277516b64355SHong Zhang }
277616b64355SHong Zhang 
277789a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
2778d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2779d71ae5a4SJacob Faibussowitsch {
27802d033e1fSHong Zhang   PetscInt     i;
27810fb991dcSHong Zhang   Mat          C;
27820fb991dcSHong Zhang   Mat_SeqAIJ  *c;
27830fb991dcSHong Zhang   Mat_SubSppt *submatj;
27842d033e1fSHong Zhang 
27852d033e1fSHong Zhang   PetscFunctionBegin;
27862d033e1fSHong Zhang   for (i = 0; i < n; i++) {
27870fb991dcSHong Zhang     C       = (*mat)[i];
27880fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
27890fb991dcSHong Zhang     submatj = c->submatis1;
27902d033e1fSHong Zhang     if (submatj) {
2791682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
279226cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27939566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27949566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27959566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27963faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27979566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27989566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27999566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2800682e4c99SStefano Zampini       }
28012d033e1fSHong Zhang     } else {
28029566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
28032d033e1fSHong Zhang     }
28042d033e1fSHong Zhang   }
280586e85357SHong Zhang 
280663a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
28079566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
280863a75b2aSHong Zhang 
28099566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
28103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28112d033e1fSHong Zhang }
28122d033e1fSHong Zhang 
2813d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2814d71ae5a4SJacob Faibussowitsch {
281597f1f81fSBarry Smith   PetscInt i;
2816cddf8d76SBarry Smith 
28173a40ed3dSBarry Smith   PetscFunctionBegin;
281848a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2819cddf8d76SBarry Smith 
282048a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
28213ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2822cddf8d76SBarry Smith }
2823cddf8d76SBarry Smith 
2824d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2825d71ae5a4SJacob Faibussowitsch {
2826e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28279a88ca10SBarry Smith   PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
28285d0c19d7SBarry Smith   const PetscInt *idx;
28299a88ca10SBarry Smith   PetscInt        start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1;
2830f1af5d2fSBarry Smith   PetscBT         table;
2831bbd702dbSSatish Balay 
28323a40ed3dSBarry Smith   PetscFunctionBegin;
28339a88ca10SBarry Smith   m  = A->rmap->n / bs;
2834e4d965acSSatish Balay   ai = a->i;
2835bfeeae90SHong Zhang   aj = a->j;
28368a047759SSatish Balay 
283708401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
283806763907SSatish Balay 
28399566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
28409566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
284106763907SSatish Balay 
2842e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2843b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2844e4d965acSSatish Balay     isz = 0;
28459566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2846e4d965acSSatish Balay 
2847e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28489566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
28499566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2850e4d965acSSatish Balay 
28519a88ca10SBarry Smith     if (bs > 1) {
28529a88ca10SBarry Smith       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
28539a88ca10SBarry Smith       for (j = 0; j < n; ++j) {
28549a88ca10SBarry Smith         if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
28559a88ca10SBarry Smith       }
28569a88ca10SBarry Smith       PetscCall(ISRestoreIndices(is[i], &idx));
28579a88ca10SBarry Smith       PetscCall(ISDestroy(&is[i]));
28589a88ca10SBarry Smith 
28599a88ca10SBarry Smith       k = 0;
28609a88ca10SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
28619a88ca10SBarry Smith         n = isz;
28629a88ca10SBarry Smith         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
28639a88ca10SBarry Smith           for (ll = 0; ll < bs; ll++) {
28649a88ca10SBarry Smith             row   = bs * nidx[k] + ll;
28659a88ca10SBarry Smith             start = ai[row];
28669a88ca10SBarry Smith             end   = ai[row + 1];
28679a88ca10SBarry Smith             for (l = start; l < end; l++) {
28689a88ca10SBarry Smith               val = aj[l] / bs;
28699a88ca10SBarry Smith               if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
28709a88ca10SBarry Smith             }
28719a88ca10SBarry Smith           }
28729a88ca10SBarry Smith         }
28739a88ca10SBarry Smith       }
28749a88ca10SBarry Smith       PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, (is + i)));
28759a88ca10SBarry Smith     } else {
2876dd097bc3SLois Curfman McInnes       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2877e4d965acSSatish Balay       for (j = 0; j < n; ++j) {
28782205254eSKarl Rupp         if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
28794dcbc457SBarry Smith       }
28809566063dSJacob Faibussowitsch       PetscCall(ISRestoreIndices(is[i], &idx));
28819566063dSJacob Faibussowitsch       PetscCall(ISDestroy(&is[i]));
2882e4d965acSSatish Balay 
288304a348a9SBarry Smith       k = 0;
288404a348a9SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
288504a348a9SBarry Smith         n = isz;
288606763907SSatish Balay         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2887e4d965acSSatish Balay           row   = nidx[k];
2888e4d965acSSatish Balay           start = ai[row];
2889e4d965acSSatish Balay           end   = ai[row + 1];
289004a348a9SBarry Smith           for (l = start; l < end; l++) {
2891efb16452SHong Zhang             val = aj[l];
28922205254eSKarl Rupp             if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2893e4d965acSSatish Balay           }
2894e4d965acSSatish Balay         }
2895e4d965acSSatish Balay       }
28969566063dSJacob Faibussowitsch       PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i)));
2897e4d965acSSatish Balay     }
28989a88ca10SBarry Smith   }
28999566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
29009566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
29013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29024dcbc457SBarry Smith }
290317ab2063SBarry Smith 
2904d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2905d71ae5a4SJacob Faibussowitsch {
29060513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
29073b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
29085d0c19d7SBarry Smith   const PetscInt *row, *col;
29095d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
291056cd22aeSBarry Smith   IS              icolp, irowp;
29110298fd71SBarry Smith   PetscInt       *cwork = NULL;
29120298fd71SBarry Smith   PetscScalar    *vwork = NULL;
29130513a670SBarry Smith 
29143a40ed3dSBarry Smith   PetscFunctionBegin;
29159566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
29169566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
29179566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
29189566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
29190513a670SBarry Smith 
29200513a670SBarry Smith   /* determine lengths of permuted rows */
29219566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
29222205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
29239566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
29249566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
29259566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
29269566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
29279566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
29289566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
29290513a670SBarry Smith 
29309566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
29310513a670SBarry Smith   for (i = 0; i < m; i++) {
29329566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29332205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
29349566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
29359566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29360513a670SBarry Smith   }
29379566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
29382205254eSKarl Rupp 
29393c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
29402205254eSKarl Rupp 
29418c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
29429566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
29439fe5e383SStefano Zampini #endif
29449566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
29459566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
29469566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
29479566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
29489566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
29499566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
295048a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
29513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29520513a670SBarry Smith }
29530513a670SBarry Smith 
2954d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2955d71ae5a4SJacob Faibussowitsch {
2956cb5b572fSBarry Smith   PetscFunctionBegin;
295733f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
295833f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2959be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2960be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
29612e5835c6SStefano Zampini     const PetscScalar *aa;
2962be6bf707SBarry Smith 
29639566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
296408401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
29659566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n]));
29669566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
29679566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
2968cb5b572fSBarry Smith   } else {
29699566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2970cb5b572fSBarry Smith   }
29713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2972cb5b572fSBarry Smith }
2973cb5b572fSBarry Smith 
2974d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2975d71ae5a4SJacob Faibussowitsch {
29766c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
29776e111a19SKarl Rupp 
29786c0721eeSBarry Smith   PetscFunctionBegin;
29796c0721eeSBarry Smith   *array = a->a;
29803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29816c0721eeSBarry Smith }
29826c0721eeSBarry Smith 
2983d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2984d71ae5a4SJacob Faibussowitsch {
29856c0721eeSBarry Smith   PetscFunctionBegin;
2986f38c1e66SStefano Zampini   *array = NULL;
29873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29886c0721eeSBarry Smith }
2989273d9f13SBarry Smith 
29908229c054SShri Abhyankar /*
29918229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29928229c054SShri Abhyankar    have different nonzero structure.
29938229c054SShri Abhyankar */
2994d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2995d71ae5a4SJacob Faibussowitsch {
2996b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2997ec7775f6SShri Abhyankar 
2998ec7775f6SShri Abhyankar   PetscFunctionBegin;
2999ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
3000ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
3001b264fe52SHong Zhang     const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i];
3002b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
3003b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
30048af7cee1SJed Brown     nnz[i] = 0;
30058af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
3006b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
3007b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
30088af7cee1SJed Brown       nnz[i]++;
30098af7cee1SJed Brown     }
30108af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
3011ec7775f6SShri Abhyankar   }
30123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3013ec7775f6SShri Abhyankar }
3014ec7775f6SShri Abhyankar 
3015d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
3016d71ae5a4SJacob Faibussowitsch {
3017b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
3018b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
3019b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
3020b264fe52SHong Zhang 
3021b264fe52SHong Zhang   PetscFunctionBegin;
3022b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
30239566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
30243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3025b264fe52SHong Zhang }
3026b264fe52SHong Zhang 
3027d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
3028d71ae5a4SJacob Faibussowitsch {
3029ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
3030ac90fabeSBarry Smith 
3031ac90fabeSBarry Smith   PetscFunctionBegin;
3032134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
3033134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
3034134adf20SPierre Jolivet     if (e) {
30359566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
303681fa06acSBarry Smith       if (e) {
30379566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
3038134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
303981fa06acSBarry Smith       }
304081fa06acSBarry Smith     }
304154c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
304281fa06acSBarry Smith   }
3043ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
30442e5835c6SStefano Zampini     const PetscScalar *xa;
30452e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
304681fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
304781fa06acSBarry Smith 
30489566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
30499566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
30509566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
3051792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
30529566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
30539566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
30549566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
30559566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
30569566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
3057ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
30589566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
3059ac90fabeSBarry Smith   } else {
30608229c054SShri Abhyankar     Mat       B;
30618229c054SShri Abhyankar     PetscInt *nnz;
30629566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
30639566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
30649566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
30659566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
30669566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
30679566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
30689566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
30699566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
30709566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
30719bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
30729566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
3073ac90fabeSBarry Smith   }
30743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3075ac90fabeSBarry Smith }
3076ac90fabeSBarry Smith 
3077d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
3078d71ae5a4SJacob Faibussowitsch {
3079354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3080354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
3081354c94deSBarry Smith   PetscInt     i, nz;
3082354c94deSBarry Smith   PetscScalar *a;
3083354c94deSBarry Smith 
3084354c94deSBarry Smith   PetscFunctionBegin;
3085354c94deSBarry Smith   nz = aij->nz;
30869566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
30872205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
30889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
3089354c94deSBarry Smith #else
3090354c94deSBarry Smith   PetscFunctionBegin;
3091354c94deSBarry Smith #endif
30923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3093354c94deSBarry Smith }
3094354c94deSBarry Smith 
3095d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3096d71ae5a4SJacob Faibussowitsch {
3097e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3098d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3099e34fafa9SBarry Smith   PetscReal        atmp;
3100985db425SBarry Smith   PetscScalar     *x;
3101ce496241SStefano Zampini   const MatScalar *aa, *av;
3102e34fafa9SBarry Smith 
3103e34fafa9SBarry Smith   PetscFunctionBegin;
310428b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3106ce496241SStefano Zampini   aa = av;
3107e34fafa9SBarry Smith   ai = a->i;
3108e34fafa9SBarry Smith   aj = a->j;
3109e34fafa9SBarry Smith 
31109566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31119566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31129566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
311308401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3114e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
31159371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31169371c9d4SSatish Balay     ai++;
3117e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3118985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
31199371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
31209371c9d4SSatish Balay         x[i] = atmp;
31219371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31229371c9d4SSatish Balay       }
31239371c9d4SSatish Balay       aa++;
31249371c9d4SSatish Balay       aj++;
3125985db425SBarry Smith     }
3126985db425SBarry Smith   }
31279566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31289566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3130985db425SBarry Smith }
3131985db425SBarry Smith 
3132d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3133d71ae5a4SJacob Faibussowitsch {
3134985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3135d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3136985db425SBarry Smith   PetscScalar     *x;
3137ce496241SStefano Zampini   const MatScalar *aa, *av;
3138985db425SBarry Smith 
3139985db425SBarry Smith   PetscFunctionBegin;
314028b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3142ce496241SStefano Zampini   aa = av;
3143985db425SBarry Smith   ai = a->i;
3144985db425SBarry Smith   aj = a->j;
3145985db425SBarry Smith 
31469566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31479566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31489566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
314908401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3150985db425SBarry Smith   for (i = 0; i < m; i++) {
31519371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31529371c9d4SSatish Balay     ai++;
3153d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31549371c9d4SSatish Balay       x[i] = *aa;
31559371c9d4SSatish Balay       if (idx) idx[i] = 0;
3156985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3157985db425SBarry Smith       x[i] = 0.0;
3158985db425SBarry Smith       if (idx) {
3159985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3160985db425SBarry Smith           if (aj[j] > j) {
3161985db425SBarry Smith             idx[i] = j;
3162985db425SBarry Smith             break;
3163985db425SBarry Smith           }
3164985db425SBarry Smith         }
31651a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31661a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3167985db425SBarry Smith       }
3168985db425SBarry Smith     }
3169985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31709371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31719371c9d4SSatish Balay         x[i] = *aa;
31729371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31739371c9d4SSatish Balay       }
31749371c9d4SSatish Balay       aa++;
31759371c9d4SSatish Balay       aj++;
3176985db425SBarry Smith     }
3177985db425SBarry Smith   }
31789566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3181985db425SBarry Smith }
3182985db425SBarry Smith 
3183d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3184d71ae5a4SJacob Faibussowitsch {
3185c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3186c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3187ce496241SStefano Zampini   PetscScalar     *x;
3188ce496241SStefano Zampini   const MatScalar *aa, *av;
3189c87e5d42SMatthew Knepley 
3190c87e5d42SMatthew Knepley   PetscFunctionBegin;
31919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3192ce496241SStefano Zampini   aa = av;
3193c87e5d42SMatthew Knepley   ai = a->i;
3194c87e5d42SMatthew Knepley   aj = a->j;
3195c87e5d42SMatthew Knepley 
31969566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31979566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31989566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
319908401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3200c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
32019371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32029371c9d4SSatish Balay     ai++;
3203f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
32049371c9d4SSatish Balay       x[i] = *aa;
32059371c9d4SSatish Balay       if (idx) idx[i] = 0;
3206f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3207f07e67edSHong Zhang       x[i] = 0.0;
3208f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3209289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3210f07e67edSHong Zhang           if (aj[j] > j) {
3211f07e67edSHong Zhang             idx[i] = j;
32122205254eSKarl Rupp             break;
32132205254eSKarl Rupp           }
3214289a08f5SMatthew Knepley         }
3215f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3216f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3217f07e67edSHong Zhang       }
3218289a08f5SMatthew Knepley     }
3219c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
32209371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
32219371c9d4SSatish Balay         x[i] = *aa;
32229371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32239371c9d4SSatish Balay       }
32249371c9d4SSatish Balay       aa++;
32259371c9d4SSatish Balay       aj++;
3226c87e5d42SMatthew Knepley     }
3227c87e5d42SMatthew Knepley   }
32289566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32303ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3231c87e5d42SMatthew Knepley }
3232c87e5d42SMatthew Knepley 
3233d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3234d71ae5a4SJacob Faibussowitsch {
3235985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3236d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3237d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3238985db425SBarry Smith   PetscScalar     *x;
3239ce496241SStefano Zampini   const MatScalar *aa, *av;
3240985db425SBarry Smith 
3241985db425SBarry Smith   PetscFunctionBegin;
324228b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
32439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3244ce496241SStefano Zampini   aa = av;
3245985db425SBarry Smith   ai = a->i;
3246985db425SBarry Smith   aj = a->j;
3247985db425SBarry Smith 
32489566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
32499566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32509566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
325108401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3252985db425SBarry Smith   for (i = 0; i < m; i++) {
32539371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32549371c9d4SSatish Balay     ai++;
3255d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
32569371c9d4SSatish Balay       x[i] = *aa;
32579371c9d4SSatish Balay       if (idx) idx[i] = 0;
3258985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3259985db425SBarry Smith       x[i] = 0.0;
3260985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3261985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3262985db425SBarry Smith           if (aj[j] > j) {
3263985db425SBarry Smith             idx[i] = j;
3264985db425SBarry Smith             break;
3265985db425SBarry Smith           }
3266985db425SBarry Smith         }
3267fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3268fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3269985db425SBarry Smith       }
3270985db425SBarry Smith     }
3271985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32729371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32739371c9d4SSatish Balay         x[i] = *aa;
32749371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32759371c9d4SSatish Balay       }
32769371c9d4SSatish Balay       aa++;
32779371c9d4SSatish Balay       aj++;
3278e34fafa9SBarry Smith     }
3279e34fafa9SBarry Smith   }
32809566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3283e34fafa9SBarry Smith }
3284bbead8a2SBarry Smith 
3285d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3286d71ae5a4SJacob Faibussowitsch {
3287bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
328833d57670SJed Brown   PetscInt        i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3289bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
32900da83c2eSBarry Smith   const PetscReal shift = 0.0;
32911a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3292bbead8a2SBarry Smith 
3293bbead8a2SBarry Smith   PetscFunctionBegin;
3294a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
32954a0d0026SBarry Smith   if (a->ibdiagvalid) {
32964a0d0026SBarry Smith     if (values) *values = a->ibdiag;
32973ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
32984a0d0026SBarry Smith   }
32999566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
33004dfa11a4SJacob Faibussowitsch   if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); }
3301bbead8a2SBarry Smith   diag = a->ibdiag;
3302bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3303bbead8a2SBarry Smith   /* factor and invert each block */
3304bbead8a2SBarry Smith   switch (bs) {
3305bbead8a2SBarry Smith   case 1:
3306bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33079566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3308ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3309ec1892c8SHong Zhang         if (allowzeropivot) {
33107b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33117b6c816cSBarry Smith           A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
33127b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
33139566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
331498921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
3315ec1892c8SHong Zhang       }
3316bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3317bbead8a2SBarry Smith     }
3318bbead8a2SBarry Smith     break;
3319bbead8a2SBarry Smith   case 2:
3320bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33219371c9d4SSatish Balay       ij[0] = 2 * i;
33229371c9d4SSatish Balay       ij[1] = 2 * i + 1;
33239566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
33249566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
33257b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33269566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3327bbead8a2SBarry Smith       diag += 4;
3328bbead8a2SBarry Smith     }
3329bbead8a2SBarry Smith     break;
3330bbead8a2SBarry Smith   case 3:
3331bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33329371c9d4SSatish Balay       ij[0] = 3 * i;
33339371c9d4SSatish Balay       ij[1] = 3 * i + 1;
33349371c9d4SSatish Balay       ij[2] = 3 * i + 2;
33359566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
33369566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
33377b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33389566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3339bbead8a2SBarry Smith       diag += 9;
3340bbead8a2SBarry Smith     }
3341bbead8a2SBarry Smith     break;
3342bbead8a2SBarry Smith   case 4:
3343bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33449371c9d4SSatish Balay       ij[0] = 4 * i;
33459371c9d4SSatish Balay       ij[1] = 4 * i + 1;
33469371c9d4SSatish Balay       ij[2] = 4 * i + 2;
33479371c9d4SSatish Balay       ij[3] = 4 * i + 3;
33489566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
33499566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
33507b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33519566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3352bbead8a2SBarry Smith       diag += 16;
3353bbead8a2SBarry Smith     }
3354bbead8a2SBarry Smith     break;
3355bbead8a2SBarry Smith   case 5:
3356bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33579371c9d4SSatish Balay       ij[0] = 5 * i;
33589371c9d4SSatish Balay       ij[1] = 5 * i + 1;
33599371c9d4SSatish Balay       ij[2] = 5 * i + 2;
33609371c9d4SSatish Balay       ij[3] = 5 * i + 3;
33619371c9d4SSatish Balay       ij[4] = 5 * i + 4;
33629566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
33639566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
33647b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33659566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3366bbead8a2SBarry Smith       diag += 25;
3367bbead8a2SBarry Smith     }
3368bbead8a2SBarry Smith     break;
3369bbead8a2SBarry Smith   case 6:
3370bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33719371c9d4SSatish Balay       ij[0] = 6 * i;
33729371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33739371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33749371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33759371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33769371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33779566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33789566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33797b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33809566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3381bbead8a2SBarry Smith       diag += 36;
3382bbead8a2SBarry Smith     }
3383bbead8a2SBarry Smith     break;
3384bbead8a2SBarry Smith   case 7:
3385bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33869371c9d4SSatish Balay       ij[0] = 7 * i;
33879371c9d4SSatish Balay       ij[1] = 7 * i + 1;
33889371c9d4SSatish Balay       ij[2] = 7 * i + 2;
33899371c9d4SSatish Balay       ij[3] = 7 * i + 3;
33909371c9d4SSatish Balay       ij[4] = 7 * i + 4;
33919371c9d4SSatish Balay       ij[5] = 7 * i + 5;
3392cdd8bf47SJunchao Zhang       ij[6] = 7 * i + 6;
33939566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
33949566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
33957b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33969566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3397bbead8a2SBarry Smith       diag += 49;
3398bbead8a2SBarry Smith     }
3399bbead8a2SBarry Smith     break;
3400bbead8a2SBarry Smith   default:
34019566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3402bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3403ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
34049566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
34059566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
34067b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34079566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3408bbead8a2SBarry Smith       diag += bs2;
3409bbead8a2SBarry Smith     }
34109566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3411bbead8a2SBarry Smith   }
3412bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
34133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3414bbead8a2SBarry Smith }
3415bbead8a2SBarry Smith 
3416d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3417d71ae5a4SJacob Faibussowitsch {
341873a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3419fff043a9SJunchao Zhang   PetscScalar a, *aa;
342073a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
342173a71a0fSBarry Smith 
342273a71a0fSBarry Smith   PetscFunctionBegin;
342373a71a0fSBarry Smith   if (!x->assembled) {
34249566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
342573a71a0fSBarry Smith     for (i = 0; i < m; i++) {
342673a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
34279566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
342873a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
34299566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
343073a71a0fSBarry Smith       }
343173a71a0fSBarry Smith     }
3432e2ce353bSJunchao Zhang   } else {
34339566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
34349566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
34359566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3436e2ce353bSJunchao Zhang   }
34379566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34389566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
344073a71a0fSBarry Smith }
344173a71a0fSBarry Smith 
3442679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3443d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3444d71ae5a4SJacob Faibussowitsch {
3445679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3446679944adSJunchao Zhang   PetscScalar a;
3447679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3448679944adSJunchao Zhang 
3449679944adSJunchao Zhang   PetscFunctionBegin;
3450679944adSJunchao Zhang   nskip = high - low;
34519566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3452679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3453679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3454679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
34559566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3456679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3457679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
34589566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3459679944adSJunchao Zhang     }
3460e2ce353bSJunchao Zhang   }
34619566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34629566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3464679944adSJunchao Zhang }
3465679944adSJunchao Zhang 
34660a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3467cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3468cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3469cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
347097304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34717c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34727c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3473f4259b30SLisandro Dalcin                                        NULL,
3474f4259b30SLisandro Dalcin                                        NULL,
3475f4259b30SLisandro Dalcin                                        NULL,
3476f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3477cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3478f4259b30SLisandro Dalcin                                        NULL,
347941f059aeSBarry Smith                                        MatSOR_SeqAIJ,
348091e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
348197304618SKris Buschelman                                        /*1 5*/ MatGetInfo_SeqAIJ,
3482cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3483cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3484cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3485cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3486f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3487cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3488cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3489cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3490d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3491f4259b30SLisandro Dalcin                                        NULL,
3492f4259b30SLisandro Dalcin                                        NULL,
3493f4259b30SLisandro Dalcin                                        NULL,
3494f4259b30SLisandro Dalcin                                        NULL,
349526cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
3496f4259b30SLisandro Dalcin                                        NULL,
3497f4259b30SLisandro Dalcin                                        NULL,
3498f4259b30SLisandro Dalcin                                        NULL,
3499f4259b30SLisandro Dalcin                                        NULL,
3500d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3501f4259b30SLisandro Dalcin                                        NULL,
3502f4259b30SLisandro Dalcin                                        NULL,
3503cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3504f4259b30SLisandro Dalcin                                        NULL,
3505d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
35067dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3507cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3508cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3509cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3510d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3511cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
35127d68702bSBarry Smith                                        MatShift_SeqAIJ,
351379299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
35146e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
351573a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
35163b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
35173b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
35183b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3519a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
352093dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3521f4259b30SLisandro Dalcin                                        NULL,
3522f4259b30SLisandro Dalcin                                        NULL,
3523cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3524f4259b30SLisandro Dalcin                                        NULL,
3525f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3526b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3527b9b97703SBarry Smith                                        MatView_SeqAIJ,
3528f4259b30SLisandro Dalcin                                        NULL,
3529f4259b30SLisandro Dalcin                                        NULL,
3530f4259b30SLisandro Dalcin                                        /* 64*/ NULL,
3531321b30b9SSatish Balay                                        MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3532f4259b30SLisandro Dalcin                                        NULL,
3533f4259b30SLisandro Dalcin                                        NULL,
3534f4259b30SLisandro Dalcin                                        NULL,
3535d519adbfSMatthew Knepley                                        /* 69*/ MatGetRowMaxAbs_SeqAIJ,
3536c87e5d42SMatthew Knepley                                        MatGetRowMinAbs_SeqAIJ,
3537f4259b30SLisandro Dalcin                                        NULL,
3538f4259b30SLisandro Dalcin                                        NULL,
3539f4259b30SLisandro Dalcin                                        NULL,
3540f4259b30SLisandro Dalcin                                        /* 74*/ NULL,
35413acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3542f4259b30SLisandro Dalcin                                        NULL,
3543f4259b30SLisandro Dalcin                                        NULL,
3544f4259b30SLisandro Dalcin                                        NULL,
35456ce1633cSBarry Smith                                        /* 79*/ MatFindZeroDiagonals_SeqAIJ,
3546f4259b30SLisandro Dalcin                                        NULL,
3547f4259b30SLisandro Dalcin                                        NULL,
3548f4259b30SLisandro Dalcin                                        NULL,
3549bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
3550d519adbfSMatthew Knepley                                        /* 84*/ MatIsSymmetric_SeqAIJ,
35511cbb95d3SBarry Smith                                        MatIsHermitian_SeqAIJ,
3552f4259b30SLisandro Dalcin                                        NULL,
3553f4259b30SLisandro Dalcin                                        NULL,
3554f4259b30SLisandro Dalcin                                        NULL,
3555f4259b30SLisandro Dalcin                                        /* 89*/ NULL,
3556f4259b30SLisandro Dalcin                                        NULL,
355726be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
3558f4259b30SLisandro Dalcin                                        NULL,
3559f4259b30SLisandro Dalcin                                        NULL,
35608fa4b5a6SHong Zhang                                        /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3561f4259b30SLisandro Dalcin                                        NULL,
3562f4259b30SLisandro Dalcin                                        NULL,
35636fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
3564f4259b30SLisandro Dalcin                                        NULL,
35654222ddf1SHong Zhang                                        /* 99*/ MatProductSetFromOptions_SeqAIJ,
3566f4259b30SLisandro Dalcin                                        NULL,
3567f4259b30SLisandro Dalcin                                        NULL,
356887d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
3569f4259b30SLisandro Dalcin                                        NULL,
3570d519adbfSMatthew Knepley                                        /*104*/ MatSetValuesRow_SeqAIJ,
357199cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3572f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3573f4259b30SLisandro Dalcin                                        NULL,
3574f4259b30SLisandro Dalcin                                        NULL,
3575cbd44569SHong Zhang                                        /*109*/ MatMatSolve_SeqAIJ,
3576f4259b30SLisandro Dalcin                                        NULL,
35772af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3578f4259b30SLisandro Dalcin                                        NULL,
3579599ef60dSHong Zhang                                        MatMissingDiagonal_SeqAIJ,
3580f4259b30SLisandro Dalcin                                        /*114*/ NULL,
3581f4259b30SLisandro Dalcin                                        NULL,
3582f4259b30SLisandro Dalcin                                        NULL,
3583f4259b30SLisandro Dalcin                                        NULL,
3584f4259b30SLisandro Dalcin                                        NULL,
3585f4259b30SLisandro Dalcin                                        /*119*/ NULL,
3586f4259b30SLisandro Dalcin                                        NULL,
3587f4259b30SLisandro Dalcin                                        NULL,
3588f4259b30SLisandro Dalcin                                        NULL,
3589b3a44c85SBarry Smith                                        MatGetMultiProcBlock_SeqAIJ,
35900716a85fSBarry Smith                                        /*124*/ MatFindNonzeroRows_SeqAIJ,
3591a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
359237868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
35930da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
3594f4259b30SLisandro Dalcin                                        NULL,
3595f4259b30SLisandro Dalcin                                        /*129*/ NULL,
3596f4259b30SLisandro Dalcin                                        NULL,
3597f4259b30SLisandro Dalcin                                        NULL,
359875648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3599b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
3600b9af6bddSHong Zhang                                        /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
36012b8ad9a3SHong Zhang                                        MatTransColoringApplyDenToSp_SeqAIJ,
3602f4259b30SLisandro Dalcin                                        NULL,
3603f4259b30SLisandro Dalcin                                        NULL,
36043964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
3605f4259b30SLisandro Dalcin                                        /*139*/ NULL,
3606f4259b30SLisandro Dalcin                                        NULL,
3607f4259b30SLisandro Dalcin                                        NULL,
36083a062f41SBarry Smith                                        MatFDColoringSetUp_SeqXAIJ,
36099c8f2541SHong Zhang                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
36104222ddf1SHong Zhang                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
36114222ddf1SHong Zhang                                        /*145*/ MatDestroySubMatrices_SeqAIJ,
3612f4259b30SLisandro Dalcin                                        NULL,
361372833a62Smarkadams4                                        NULL,
361472833a62Smarkadams4                                        MatCreateGraph_Simple_AIJ,
36152d776b49SBarry Smith                                        NULL,
3616dec0b466SHong Zhang                                        /*150*/ MatTransposeSymbolic_SeqAIJ,
3617dec0b466SHong Zhang                                        MatEliminateZeros_SeqAIJ};
361817ab2063SBarry Smith 
3619d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3620d71ae5a4SJacob Faibussowitsch {
3621bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
362297f1f81fSBarry Smith   PetscInt    i, nz, n;
3623bef8e0ddSBarry Smith 
3624bef8e0ddSBarry Smith   PetscFunctionBegin;
3625bef8e0ddSBarry Smith   nz = aij->maxnz;
3626d0f46423SBarry Smith   n  = mat->rmap->n;
3627ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3628bef8e0ddSBarry Smith   aij->nz = nz;
3629ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
36303ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3631bef8e0ddSBarry Smith }
3632bef8e0ddSBarry Smith 
3633a3bb6f32SFande Kong /*
3634ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3635ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3636ddea5d60SJunchao Zhang  */
3637d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3638d71ae5a4SJacob Faibussowitsch {
3639a3bb6f32SFande Kong   Mat_SeqAIJ   *aij = (Mat_SeqAIJ *)mat->data;
3640eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1;
3641eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
364225b670f0SStefano Zampini   PetscInt      gid, lid, i, ec, nz = aij->nz;
364325b670f0SStefano Zampini   PetscInt     *garray, *jj = aij->j;
3644a3bb6f32SFande Kong 
3645a3bb6f32SFande Kong   PetscFunctionBegin;
3646a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
3647a3bb6f32SFande Kong   PetscValidPointer(mapping, 2);
3648a3bb6f32SFande Kong   /* use a table */
3649eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1));
3650a3bb6f32SFande Kong   ec = 0;
365125b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
365225b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
3653eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
3654a3bb6f32SFande Kong     if (!data) {
3655a3bb6f32SFande Kong       /* one based table */
3656c76ffc5fSJacob Faibussowitsch       PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec));
3657a3bb6f32SFande Kong     }
3658a3bb6f32SFande Kong   }
3659a3bb6f32SFande Kong   /* form array of columns we need */
36609566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
3661eec179cfSJacob Faibussowitsch   PetscHashIterBegin(gid1_lid1, tpos);
3662eec179cfSJacob Faibussowitsch   while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
3663eec179cfSJacob Faibussowitsch     PetscHashIterGetKey(gid1_lid1, tpos, gid);
3664eec179cfSJacob Faibussowitsch     PetscHashIterGetVal(gid1_lid1, tpos, lid);
3665eec179cfSJacob Faibussowitsch     PetscHashIterNext(gid1_lid1, tpos);
3666a3bb6f32SFande Kong     gid--;
3667a3bb6f32SFande Kong     lid--;
3668a3bb6f32SFande Kong     garray[lid] = gid;
3669a3bb6f32SFande Kong   }
36709566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
3671eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIClear(gid1_lid1));
3672c76ffc5fSJacob Faibussowitsch   for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1));
3673a3bb6f32SFande Kong   /* compact out the extra columns in B */
367425b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
367525b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
3676eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
3677a3bb6f32SFande Kong     lid--;
367825b670f0SStefano Zampini     jj[i] = lid;
3679a3bb6f32SFande Kong   }
36809566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
3681eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&gid1_lid1));
36829566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
36839566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
36849566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
36853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3686a3bb6f32SFande Kong }
3687a3bb6f32SFande Kong 
3688bef8e0ddSBarry Smith /*@
3689bef8e0ddSBarry Smith     MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3690bef8e0ddSBarry Smith        in the matrix.
3691bef8e0ddSBarry Smith 
3692bef8e0ddSBarry Smith   Input Parameters:
369311a5261eSBarry Smith +  mat - the `MATSEQAIJ` matrix
3694bef8e0ddSBarry Smith -  indices - the column indices
3695bef8e0ddSBarry Smith 
369615091d37SBarry Smith   Level: advanced
369715091d37SBarry Smith 
3698bef8e0ddSBarry Smith   Notes:
3699bef8e0ddSBarry Smith     This can be called if you have precomputed the nonzero structure of the
3700bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
370111a5261eSBarry Smith   of the `MatSetValues()` operation.
3702bef8e0ddSBarry Smith 
3703bef8e0ddSBarry Smith     You MUST have set the correct numbers of nonzeros per row in the call to
370411a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the columns indices MUST be sorted.
3705bef8e0ddSBarry Smith 
370611a5261eSBarry Smith     MUST be called before any calls to `MatSetValues()`
3707bef8e0ddSBarry Smith 
3708b9617806SBarry Smith     The indices should start with zero, not one.
3709b9617806SBarry Smith 
37101cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
3711bef8e0ddSBarry Smith @*/
3712d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3713d71ae5a4SJacob Faibussowitsch {
3714bef8e0ddSBarry Smith   PetscFunctionBegin;
37150700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
3716dadcf809SJacob Faibussowitsch   PetscValidIntPointer(indices, 2);
3717cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
37183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3719bef8e0ddSBarry Smith }
3720bef8e0ddSBarry Smith 
3721d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3722d71ae5a4SJacob Faibussowitsch {
3723be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3724d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3725be6bf707SBarry Smith 
3726be6bf707SBarry Smith   PetscFunctionBegin;
372728b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3728be6bf707SBarry Smith 
3729be6bf707SBarry Smith   /* allocate space for values if not already there */
37304dfa11a4SJacob Faibussowitsch   if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }
3731be6bf707SBarry Smith 
3732be6bf707SBarry Smith   /* copy values over */
37339566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
37343ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3735be6bf707SBarry Smith }
3736be6bf707SBarry Smith 
3737be6bf707SBarry Smith /*@
373820f4b53cSBarry Smith     MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
3739be6bf707SBarry Smith     nonlinear portion.
3740be6bf707SBarry Smith 
   Logically Collective
3742be6bf707SBarry Smith 
374327430b45SBarry Smith   Input Parameter:
374411a5261eSBarry Smith .  mat - the matrix (currently only `MATAIJ` matrices support this option)
3745be6bf707SBarry Smith 
374615091d37SBarry Smith   Level: advanced
374715091d37SBarry Smith 
374827430b45SBarry Smith   Usage:
374927430b45SBarry Smith .vb
37502ef1f0ffSBarry Smith     Using SNES
375127430b45SBarry Smith     Create Jacobian matrix
375227430b45SBarry Smith     Set linear terms into matrix
375327430b45SBarry Smith     Apply boundary conditions to matrix, at this time matrix must have
375427430b45SBarry Smith       final nonzero structure (i.e. setting the nonlinear terms and applying
      boundary conditions again will not change the nonzero structure)
375627430b45SBarry Smith     MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
375727430b45SBarry Smith     MatStoreValues(mat);
375827430b45SBarry Smith     Call SNESSetJacobian() with matrix
375927430b45SBarry Smith     In your Jacobian routine
376027430b45SBarry Smith       MatRetrieveValues(mat);
376127430b45SBarry Smith       Set nonlinear terms in matrix
3762be6bf707SBarry Smith 
376327430b45SBarry Smith     Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
376427430b45SBarry Smith     // build linear portion of Jacobian
376527430b45SBarry Smith     MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
376627430b45SBarry Smith     MatStoreValues(mat);
376727430b45SBarry Smith     loop over nonlinear iterations
376827430b45SBarry Smith        MatRetrieveValues(mat);
       // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
377027430b45SBarry Smith        // call MatAssemblyBegin/End() on matrix
377127430b45SBarry Smith        Solve linear system with Jacobian
377227430b45SBarry Smith     endloop
377327430b45SBarry Smith .ve
3774be6bf707SBarry Smith 
3775be6bf707SBarry Smith   Notes:
3776da81f932SPierre Jolivet     Matrix must already be assembled before calling this routine
377711a5261eSBarry Smith     Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3778be6bf707SBarry Smith     calling this routine.
3779be6bf707SBarry Smith 
    When this is called multiple times it overwrites the previous set of stored values
    and does not allocate additional space.
37820c468ba9SBarry Smith 
.seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
3784be6bf707SBarry Smith @*/
3785d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3786d71ae5a4SJacob Faibussowitsch {
3787be6bf707SBarry Smith   PetscFunctionBegin;
37880700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
378928b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
379028b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3791cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
37923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3793be6bf707SBarry Smith }
3794be6bf707SBarry Smith 
3795d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3796d71ae5a4SJacob Faibussowitsch {
3797be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3798d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3799be6bf707SBarry Smith 
3800be6bf707SBarry Smith   PetscFunctionBegin;
380128b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
380228b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3803be6bf707SBarry Smith   /* copy values over */
38049566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
38053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3806be6bf707SBarry Smith }
3807be6bf707SBarry Smith 
3808be6bf707SBarry Smith /*@
380920f4b53cSBarry Smith     MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`
3810be6bf707SBarry Smith 
   Logically Collective
3812be6bf707SBarry Smith 
38132fe279fdSBarry Smith   Input Parameter:
381411a5261eSBarry Smith .  mat - the matrix (currently only `MATAIJ` matrices support this option)
3815be6bf707SBarry Smith 
381615091d37SBarry Smith   Level: advanced
381715091d37SBarry Smith 
38181cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
3819be6bf707SBarry Smith @*/
3820d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3821d71ae5a4SJacob Faibussowitsch {
3822be6bf707SBarry Smith   PetscFunctionBegin;
38230700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
382428b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
382528b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3826cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
38273ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3828be6bf707SBarry Smith }
3829be6bf707SBarry Smith 
383017ab2063SBarry Smith /*@C
383111a5261eSBarry Smith    MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
   (the default sequential PETSc format).  For good matrix assembly performance
383320f4b53cSBarry Smith    the user should preallocate the matrix storage by setting the parameter `nz`
383420f4b53cSBarry Smith    (or the array `nnz`).
383517ab2063SBarry Smith 
3836d083f849SBarry Smith    Collective
3837db81eaa0SLois Curfman McInnes 
383817ab2063SBarry Smith    Input Parameters:
383911a5261eSBarry Smith +  comm - MPI communicator, set to `PETSC_COMM_SELF`
384017ab2063SBarry Smith .  m - number of rows
384117ab2063SBarry Smith .  n - number of columns
384217ab2063SBarry Smith .  nz - number of nonzeros per row (same for all rows)
384351c19458SBarry Smith -  nnz - array containing the number of nonzeros in the various rows
38440298fd71SBarry Smith          (possibly different for each row) or NULL
384517ab2063SBarry Smith 
384617ab2063SBarry Smith    Output Parameter:
3847416022c9SBarry Smith .  A - the matrix
384817ab2063SBarry Smith 
38492ef1f0ffSBarry Smith    Options Database Keys:
38502ef1f0ffSBarry Smith +  -mat_no_inode  - Do not use inodes
38512ef1f0ffSBarry Smith -  -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38522ef1f0ffSBarry Smith 
38532ef1f0ffSBarry Smith    Level: intermediate
3854175b88e8SBarry Smith 
3855b259b22eSLois Curfman McInnes    Notes:
38562ef1f0ffSBarry Smith    If `nnz` is given then `nz` is ignored
385749a6f317SBarry Smith 
38582ef1f0ffSBarry Smith    The `MATSEQAIJ` format, also called
38592ef1f0ffSBarry Smith    compressed row storage, is fully compatible with standard Fortran
38600002213bSLois Curfman McInnes    storage.  That is, the stored row and column indices can begin at
38612ef1f0ffSBarry Smith    either one (as in Fortran) or zero.
386217ab2063SBarry Smith 
386320f4b53cSBarry Smith    Specify the preallocated storage with either `nz` or `nnz` (not both).
38642ef1f0ffSBarry Smith    Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
386520f4b53cSBarry Smith    allocation.
386617ab2063SBarry Smith 
3867682d7d0cSBarry Smith    By default, this format uses inodes (identical nodes) when possible, to
38684fca80b9SLois Curfman McInnes    improve numerical efficiency of matrix-vector products and solves. We
3869682d7d0cSBarry Smith    search for consecutive rows with the same nonzero structure, thereby
38706c7ebb05SLois Curfman McInnes    reusing matrix information to achieve increased efficiency.
38716c7ebb05SLois Curfman McInnes 
38721cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
387317ab2063SBarry Smith @*/
3874d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3875d71ae5a4SJacob Faibussowitsch {
38763a40ed3dSBarry Smith   PetscFunctionBegin;
38779566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
38789566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
38799566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
38809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
38813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3882273d9f13SBarry Smith }
3883273d9f13SBarry Smith 
3884273d9f13SBarry Smith /*@C
3885273d9f13SBarry Smith    MatSeqAIJSetPreallocation - For good matrix assembly performance
3886273d9f13SBarry Smith    the user should preallocate the matrix storage by setting the parameter nz
3887273d9f13SBarry Smith    (or the array nnz).  By setting these parameters accurately, performance
3888273d9f13SBarry Smith    during matrix assembly can be increased by more than a factor of 50.
3889273d9f13SBarry Smith 
3890d083f849SBarry Smith    Collective
3891273d9f13SBarry Smith 
3892273d9f13SBarry Smith    Input Parameters:
38931c4f3114SJed Brown +  B - The matrix
3894273d9f13SBarry Smith .  nz - number of nonzeros per row (same for all rows)
3895273d9f13SBarry Smith -  nnz - array containing the number of nonzeros in the various rows
38960298fd71SBarry Smith          (possibly different for each row) or NULL
3897273d9f13SBarry Smith 
38982ef1f0ffSBarry Smith    Options Database Keys:
38992ef1f0ffSBarry Smith +  -mat_no_inode  - Do not use inodes
39002ef1f0ffSBarry Smith -  -mat_inode_limit <limit> - Sets inode limit (max limit=5)
39012ef1f0ffSBarry Smith 
39022ef1f0ffSBarry Smith    Level: intermediate
39032ef1f0ffSBarry Smith 
3904273d9f13SBarry Smith    Notes:
39052ef1f0ffSBarry Smith      If `nnz` is given then `nz` is ignored
390649a6f317SBarry Smith 
390711a5261eSBarry Smith     The `MATSEQAIJ` format also called
39082ef1f0ffSBarry Smith    compressed row storage, is fully compatible with standard Fortran
3909273d9f13SBarry Smith    storage.  That is, the stored row and column indices can begin at
3910273d9f13SBarry Smith    either one (as in Fortran) or zero.  See the users' manual for details.
3911273d9f13SBarry Smith 
39122ef1f0ffSBarry Smith    Specify the preallocated storage with either `nz` or `nnz` (not both).
39132ef1f0ffSBarry Smith    Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
39142ef1f0ffSBarry Smith    allocation.
3915273d9f13SBarry Smith 
391611a5261eSBarry Smith    You can call `MatGetInfo()` to get information on how effective the preallocation was;
3917aa95bbe8SBarry Smith    for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3918aa95bbe8SBarry Smith    You can also run with the option -info and look for messages with the string
3919aa95bbe8SBarry Smith    malloc in them to see if additional memory allocation was needed.
3920aa95bbe8SBarry Smith 
392111a5261eSBarry Smith    Developer Notes:
392211a5261eSBarry Smith    Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3923a96a251dSBarry Smith    entries or columns indices
3924a96a251dSBarry Smith 
3925273d9f13SBarry Smith    By default, this format uses inodes (identical nodes) when possible, to
3926273d9f13SBarry Smith    improve numerical efficiency of matrix-vector products and solves. We
3927273d9f13SBarry Smith    search for consecutive rows with the same nonzero structure, thereby
3928273d9f13SBarry Smith    reusing matrix information to achieve increased efficiency.
3929273d9f13SBarry Smith 
39301cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3931db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3932273d9f13SBarry Smith @*/
3933d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3934d71ae5a4SJacob Faibussowitsch {
3935a23d5eceSKris Buschelman   PetscFunctionBegin;
39366ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
39376ba663aaSJed Brown   PetscValidType(B, 1);
3938cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
39393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3940a23d5eceSKris Buschelman }
3941a23d5eceSKris Buschelman 
3942d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3943d71ae5a4SJacob Faibussowitsch {
3944ad79cf63SBarry Smith   Mat_SeqAIJ *b              = (Mat_SeqAIJ *)B->data;
39452576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
394697f1f81fSBarry Smith   PetscInt    i;
3947273d9f13SBarry Smith 
3948273d9f13SBarry Smith   PetscFunctionBegin;
3949ad79cf63SBarry Smith   if (B->hash_active) {
3950aea10558SJacob Faibussowitsch     B->ops[0] = b->cops;
3951ad79cf63SBarry Smith     PetscCall(PetscHMapIJVDestroy(&b->ht));
3952ad79cf63SBarry Smith     PetscCall(PetscFree(b->dnz));
3953ad79cf63SBarry Smith     B->hash_active = PETSC_FALSE;
3954ad79cf63SBarry Smith   }
39552576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3956a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3957c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3958c461c341SBarry Smith     nz             = 0;
3959c461c341SBarry Smith   }
39609566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
39619566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3962899cda47SBarry Smith 
3963435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
396408401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
3965cf9c20a2SJed Brown   if (PetscUnlikelyDebug(nnz)) {
3966d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
396708401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
396808401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3969b73539f3SBarry Smith     }
3970b73539f3SBarry Smith   }
3971b73539f3SBarry Smith 
3972273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
3973ab93d7beSBarry Smith   if (!skipallocation) {
39744dfa11a4SJacob Faibussowitsch     if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); }
3975071fcb05SBarry Smith     if (!b->ilen) {
3976071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
39779566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
3978071fcb05SBarry Smith     } else {
39799566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
39802ee49352SLisandro Dalcin     }
3981aa624791SPierre Jolivet     if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre));
3982273d9f13SBarry Smith     if (!nnz) {
3983435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
3984c62bd62aSJed Brown       else if (nz < 0) nz = 1;
39855d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
3986d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
3987d0f46423SBarry Smith       nz = nz * B->rmap->n;
3988273d9f13SBarry Smith     } else {
3989c73702f5SBarry Smith       PetscInt64 nz64 = 0;
39909371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
39919371c9d4SSatish Balay         b->imax[i] = nnz[i];
39929371c9d4SSatish Balay         nz64 += nnz[i];
39939371c9d4SSatish Balay       }
39949566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
3995273d9f13SBarry Smith     }
3996ab93d7beSBarry Smith 
3997273d9f13SBarry Smith     /* allocate the matrix space */
399853dd7562SDmitry Karpeev     /* FIXME: should B's old memory be unlogged? */
39999566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
4000396832f4SHong Zhang     if (B->structure_only) {
40019566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz, &b->j));
40029566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i));
4003396832f4SHong Zhang     } else {
40049566063dSJacob Faibussowitsch       PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i));
4005396832f4SHong Zhang     }
4006bfeeae90SHong Zhang     b->i[0] = 0;
4007ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
4008396832f4SHong Zhang     if (B->structure_only) {
4009396832f4SHong Zhang       b->singlemalloc = PETSC_FALSE;
4010396832f4SHong Zhang       b->free_a       = PETSC_FALSE;
4011396832f4SHong Zhang     } else {
4012273d9f13SBarry Smith       b->singlemalloc = PETSC_TRUE;
4013e6b907acSBarry Smith       b->free_a       = PETSC_TRUE;
4014396832f4SHong Zhang     }
4015e6b907acSBarry Smith     b->free_ij = PETSC_TRUE;
4016c461c341SBarry Smith   } else {
4017e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
4018e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
4019c461c341SBarry Smith   }
4020273d9f13SBarry Smith 
4021846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
4022846b4da1SFande Kong     /* reserve user-requested sparsity */
40239566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
4024846b4da1SFande Kong   }
4025846b4da1SFande Kong 
4026273d9f13SBarry Smith   b->nz               = 0;
4027273d9f13SBarry Smith   b->maxnz            = nz;
4028273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
40291baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
4030cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
4031cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
40325519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
40335519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
40345519a089SJose E. Roman   */
40355519a089SJose E. Roman   B->nonzerostate++;
40363ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4037273d9f13SBarry Smith }
4038273d9f13SBarry Smith 
4039d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
4040d71ae5a4SJacob Faibussowitsch {
4041846b4da1SFande Kong   Mat_SeqAIJ *a;
4042a5bbaf83SFande Kong   PetscInt    i;
40431f14be2bSBarry Smith   PetscBool   skipreset;
4044846b4da1SFande Kong 
4045846b4da1SFande Kong   PetscFunctionBegin;
4046846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
404714d0e64fSAlex Lindsay 
404814d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
40493ba16761SJacob Faibussowitsch   if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS);
405014d0e64fSAlex Lindsay 
4051846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
40522c814fdeSFande Kong   /* if no saved info, we error out */
405328b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
40542c814fdeSFande Kong 
40551f14be2bSBarry Smith   PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation ");
40562c814fdeSFande Kong 
40571f14be2bSBarry Smith   PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset));
40581f14be2bSBarry Smith   if (!skipreset) {
40599566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
40609566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
4061846b4da1SFande Kong     a->i[0] = 0;
4062ad540459SPierre Jolivet     for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
4063846b4da1SFande Kong     A->preallocated     = PETSC_TRUE;
4064846b4da1SFande Kong     a->nz               = 0;
4065846b4da1SFande Kong     a->maxnz            = a->i[A->rmap->n];
4066846b4da1SFande Kong     A->info.nz_unneeded = (double)a->maxnz;
4067846b4da1SFande Kong     A->was_assembled    = PETSC_FALSE;
4068846b4da1SFande Kong     A->assembled        = PETSC_FALSE;
40691f14be2bSBarry Smith   }
40703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4071846b4da1SFande Kong }
4072846b4da1SFande Kong 
407358d36128SBarry Smith /*@
407411a5261eSBarry Smith    MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4075a1661176SMatthew Knepley 
4076a1661176SMatthew Knepley    Input Parameters:
4077a1661176SMatthew Knepley +  B - the matrix
4078a1661176SMatthew Knepley .  i - the indices into j for the start of each row (starts with zero)
4079a1661176SMatthew Knepley .  j - the column indices for each row (starts with zero) these must be sorted for each row
4080a1661176SMatthew Knepley -  v - optional values in the matrix
4081a1661176SMatthew Knepley 
4082a1661176SMatthew Knepley    Level: developer
4083a1661176SMatthew Knepley 
40846a9b8d82SBarry Smith    Notes:
40852ef1f0ffSBarry Smith       The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
408658d36128SBarry Smith 
40876a9b8d82SBarry Smith       This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
40886a9b8d82SBarry Smith       structure will be the union of all the previous nonzero structures.
40896a9b8d82SBarry Smith 
40906a9b8d82SBarry Smith     Developer Notes:
40912ef1f0ffSBarry Smith       An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and
40922ef1f0ffSBarry Smith       then just copies the `v` values directly with `PetscMemcpy()`.
40936a9b8d82SBarry Smith 
409411a5261eSBarry Smith       This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
40956a9b8d82SBarry Smith 
40961cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MatResetPreallocation()`
4097a1661176SMatthew Knepley @*/
4098d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4099d71ae5a4SJacob Faibussowitsch {
4100a1661176SMatthew Knepley   PetscFunctionBegin;
41010700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
41026ba663aaSJed Brown   PetscValidType(B, 1);
4103cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
41043ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4105a1661176SMatthew Knepley }
4106a1661176SMatthew Knepley 
4107d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4108d71ae5a4SJacob Faibussowitsch {
4109a1661176SMatthew Knepley   PetscInt  i;
4110a1661176SMatthew Knepley   PetscInt  m, n;
4111a1661176SMatthew Knepley   PetscInt  nz;
41126a9b8d82SBarry Smith   PetscInt *nnz;
4113a1661176SMatthew Knepley 
4114a1661176SMatthew Knepley   PetscFunctionBegin;
4115aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4116779a8d59SSatish Balay 
41179566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
41189566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4119779a8d59SSatish Balay 
41209566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
41219566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4122a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4123b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
412408401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4125a1661176SMatthew Knepley     nnz[i] = nz;
4126a1661176SMatthew Knepley   }
41279566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
41289566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4129a1661176SMatthew Knepley 
413048a46eb9SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES));
4131a1661176SMatthew Knepley 
41329566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
41339566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4134a1661176SMatthew Knepley 
41359566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
41363ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4137a1661176SMatthew Knepley }
4138a1661176SMatthew Knepley 
4139ad7e164aSPierre Jolivet /*@
41402ef1f0ffSBarry Smith    MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`.
4141ad7e164aSPierre Jolivet 
4142ad7e164aSPierre Jolivet    Input Parameters:
4143ad7e164aSPierre Jolivet +  A - left-hand side matrix
4144ad7e164aSPierre Jolivet .  B - right-hand side matrix
414511a5261eSBarry Smith -  reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4146ad7e164aSPierre Jolivet 
4147ad7e164aSPierre Jolivet    Output Parameter:
41482ef1f0ffSBarry Smith .  C - Kronecker product of `A` and `B`
4149ad7e164aSPierre Jolivet 
4150ad7e164aSPierre Jolivet    Level: intermediate
4151ad7e164aSPierre Jolivet 
415211a5261eSBarry Smith    Note:
415311a5261eSBarry Smith       `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`.
4154ad7e164aSPierre Jolivet 
41551cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4156ad7e164aSPierre Jolivet @*/
4157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4158d71ae5a4SJacob Faibussowitsch {
4159ad7e164aSPierre Jolivet   PetscFunctionBegin;
4160ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4161ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4162ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4163ad7e164aSPierre Jolivet   PetscValidType(B, 2);
4164ad7e164aSPierre Jolivet   PetscValidPointer(C, 4);
4165ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4166ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4167ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4168ad7e164aSPierre Jolivet   }
4169cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
41703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4171ad7e164aSPierre Jolivet }
4172ad7e164aSPierre Jolivet 
4173d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4174d71ae5a4SJacob Faibussowitsch {
4175ad7e164aSPierre Jolivet   Mat                newmat;
4176ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4177ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4178ad7e164aSPierre Jolivet   PetscScalar       *v;
4179fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4180ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4181ad7e164aSPierre Jolivet   PetscBool          flg;
4182ad7e164aSPierre Jolivet 
4183ad7e164aSPierre Jolivet   PetscFunctionBegin;
418428b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
418528b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
418628b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
418728b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
41889566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
418928b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4190aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4191ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
41929566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
41939566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
41949566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
41959566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4196ad7e164aSPierre Jolivet     i[0] = 0;
4197ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4198ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4199ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4200ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4201ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4202ad7e164aSPierre Jolivet         }
4203ad7e164aSPierre Jolivet       }
4204ad7e164aSPierre Jolivet     }
42059566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4206ad7e164aSPierre Jolivet     *C = newmat;
42079566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4208ad7e164aSPierre Jolivet     nnz = 0;
4209ad7e164aSPierre Jolivet   }
42109566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
42119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
42129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4213ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4214ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4215ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4216ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4217ad7e164aSPierre Jolivet       }
4218ad7e164aSPierre Jolivet     }
4219ad7e164aSPierre Jolivet   }
42209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
42219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
42229566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
42233ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4224ad7e164aSPierre Jolivet }
4225ad7e164aSPierre Jolivet 
4226c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4227af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4228170fe5c8SBarry Smith 
4229170fe5c8SBarry Smith /*
4230170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4231170fe5c8SBarry Smith 
4232170fe5c8SBarry Smith                n                       p                          p
42332da392ccSBarry Smith         [             ]       [             ]         [                 ]
42342da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
42352da392ccSBarry Smith         [             ]       [             ]         [                 ]
4236170fe5c8SBarry Smith 
4237170fe5c8SBarry Smith */
4238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4239d71ae5a4SJacob Faibussowitsch {
4240170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4241170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4242170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
424386214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4244170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4245170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4246170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
424786214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
424886214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4249170fe5c8SBarry Smith 
4250170fe5c8SBarry Smith   PetscFunctionBegin;
4251d0f46423SBarry Smith   m = A->rmap->n;
4252d0f46423SBarry Smith   n = A->cmap->n;
4253d0f46423SBarry Smith   p = B->cmap->n;
4254170fe5c8SBarry Smith   a = sub_a->v;
4255170fe5c8SBarry Smith   b = sub_b->a;
4256170fe5c8SBarry Smith   c = sub_c->v;
425786214ceeSStefano Zampini   if (clda == m) {
42589566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
425986214ceeSStefano Zampini   } else {
426086214ceeSStefano Zampini     for (j = 0; j < p; j++)
42619371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
426286214ceeSStefano Zampini   }
4263170fe5c8SBarry Smith   ii  = sub_b->i;
4264170fe5c8SBarry Smith   idx = sub_b->j;
4265170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4266170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4267170fe5c8SBarry Smith     while (q-- > 0) {
426886214ceeSStefano Zampini       c_q = c + clda * (*idx);
426986214ceeSStefano Zampini       a_q = a + alda * i;
4270854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4271170fe5c8SBarry Smith       idx++;
4272170fe5c8SBarry Smith       b++;
4273170fe5c8SBarry Smith     }
4274170fe5c8SBarry Smith   }
42753ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4276170fe5c8SBarry Smith }
4277170fe5c8SBarry Smith 
4278d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4279d71ae5a4SJacob Faibussowitsch {
4280d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
428186214ceeSStefano Zampini   PetscBool cisdense;
4282170fe5c8SBarry Smith 
4283170fe5c8SBarry Smith   PetscFunctionBegin;
428408401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
42859566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
42869566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
4287d5e393b6SSuyash Tandon   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, ""));
428848a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
42899566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4290d73949e8SHong Zhang 
42914222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
42923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4293170fe5c8SBarry Smith }
4294170fe5c8SBarry Smith 
42950bad9183SKris Buschelman /*MC
4296fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
42970bad9183SKris Buschelman    based on compressed sparse row format.
42980bad9183SKris Buschelman 
42992ef1f0ffSBarry Smith    Options Database Key:
43000bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
43010bad9183SKris Buschelman 
43020bad9183SKris Buschelman    Level: beginner
43030bad9183SKris Buschelman 
43040cd7f59aSBarry Smith    Notes:
43052ef1f0ffSBarry Smith     `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values,
43060cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
43070cd7f59aSBarry Smith     in the matrix
43080cd7f59aSBarry Smith 
430911a5261eSBarry Smith     `MatSetOption`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this case no
431011a5261eSBarry Smith     space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored
43110cd7f59aSBarry Smith 
431211a5261eSBarry Smith   Developer Note:
43132ef1f0ffSBarry Smith     It would be nice if all matrix formats supported passing `NULL` in for the numerical values
43140cd7f59aSBarry Smith 
43151cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
43160bad9183SKris Buschelman M*/
43170bad9183SKris Buschelman 
4318ccd284c7SBarry Smith /*MC
4319ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4320ccd284c7SBarry Smith 
432111a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
432211a5261eSBarry Smith    and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
432311a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4324ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4325ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4326ccd284c7SBarry Smith 
43272ef1f0ffSBarry Smith    Options Database Key:
432811a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`
4329ccd284c7SBarry Smith 
43302ef1f0ffSBarry Smith   Level: beginner
43312ef1f0ffSBarry Smith 
433211a5261eSBarry Smith    Note:
433311a5261eSBarry Smith    Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`. This type also automatically switches over to use inodes when
4334ccd284c7SBarry Smith    enough exist.
4335ccd284c7SBarry Smith 
43361cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
4337ccd284c7SBarry Smith M*/
4338ccd284c7SBarry Smith 
4339ccd284c7SBarry Smith /*MC
4340ccd284c7SBarry Smith    MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.
4341ccd284c7SBarry Smith 
43422ef1f0ffSBarry Smith    Options Database Key:
43432ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`
43442ef1f0ffSBarry Smith 
43452ef1f0ffSBarry Smith   Level: beginner
43462ef1f0ffSBarry Smith 
43472ef1f0ffSBarry Smith    Note:
434811a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
434911a5261eSBarry Smith    and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
435011a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4351ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4352ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4353ccd284c7SBarry Smith 
43541cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
4355ccd284c7SBarry Smith M*/
4356ccd284c7SBarry Smith 
43577906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
43587906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
43597906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
43607906f579SHong Zhang #endif
4361d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
4362d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4363d24d4204SJose E. Roman #endif
43647906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
43657906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
43667906f579SHong Zhang #endif
43677906f579SHong Zhang 
4368d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4369c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
43704222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
43717906f579SHong Zhang 
43728c778c55SBarry Smith /*@C
437311a5261eSBarry Smith    MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
43748c778c55SBarry Smith 
43758c778c55SBarry Smith    Not Collective
43768c778c55SBarry Smith 
43778c778c55SBarry Smith    Input Parameter:
437811a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
43798c778c55SBarry Smith 
43808c778c55SBarry Smith    Output Parameter:
43818c778c55SBarry Smith .   array - pointer to the data
43828c778c55SBarry Smith 
43838c778c55SBarry Smith    Level: intermediate
43848c778c55SBarry Smith 
43850ab4885dSBarry Smith    Fortran Note:
43860ab4885dSBarry Smith    `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()`
43870ab4885dSBarry Smith 
43881cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
43898c778c55SBarry Smith @*/
4390d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array)
4391d71ae5a4SJacob Faibussowitsch {
4392d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
43938c778c55SBarry Smith 
43948c778c55SBarry Smith   PetscFunctionBegin;
4395d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
43969566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4397d67d9f35SJunchao Zhang   } else {
4398d67d9f35SJunchao Zhang     *array = aij->a;
4399d67d9f35SJunchao Zhang   }
44003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4401d67d9f35SJunchao Zhang }
4402d67d9f35SJunchao Zhang 
4403d67d9f35SJunchao Zhang /*@C
440411a5261eSBarry Smith    MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4405d67d9f35SJunchao Zhang 
4406d67d9f35SJunchao Zhang    Not Collective
4407d67d9f35SJunchao Zhang 
4408d67d9f35SJunchao Zhang    Input Parameters:
440911a5261eSBarry Smith +  mat - a `MATSEQAIJ` matrix
4410d67d9f35SJunchao Zhang -  array - pointer to the data
4411d67d9f35SJunchao Zhang 
4412d67d9f35SJunchao Zhang    Level: intermediate
4413d67d9f35SJunchao Zhang 
44140ab4885dSBarry Smith    Fortran Note:
44150ab4885dSBarry Smith    `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()`
44160ab4885dSBarry Smith 
44171cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()`
4418d67d9f35SJunchao Zhang @*/
4419d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array)
4420d71ae5a4SJacob Faibussowitsch {
4421d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4422d67d9f35SJunchao Zhang 
4423d67d9f35SJunchao Zhang   PetscFunctionBegin;
4424d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
44259566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4426d67d9f35SJunchao Zhang   } else {
4427d67d9f35SJunchao Zhang     *array = NULL;
4428d67d9f35SJunchao Zhang   }
44299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
44309566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
44313ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44328c778c55SBarry Smith }
44338c778c55SBarry Smith 
443421e72a00SBarry Smith /*@C
443511a5261eSBarry Smith    MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
44368f1ea47aSStefano Zampini 
44370ab4885dSBarry Smith    Not Collective; No Fortran Support
44388f1ea47aSStefano Zampini 
44398f1ea47aSStefano Zampini    Input Parameter:
444011a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
44418f1ea47aSStefano Zampini 
44428f1ea47aSStefano Zampini    Output Parameter:
44438f1ea47aSStefano Zampini .   array - pointer to the data
44448f1ea47aSStefano Zampini 
44458f1ea47aSStefano Zampini    Level: intermediate
44468f1ea47aSStefano Zampini 
44471cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
44488f1ea47aSStefano Zampini @*/
4449d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array)
4450d71ae5a4SJacob Faibussowitsch {
4451d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44528f1ea47aSStefano Zampini 
44538f1ea47aSStefano Zampini   PetscFunctionBegin;
4454d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
44559566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4456d67d9f35SJunchao Zhang   } else {
4457d67d9f35SJunchao Zhang     *array = aij->a;
4458d67d9f35SJunchao Zhang   }
44593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44608f1ea47aSStefano Zampini }
44618f1ea47aSStefano Zampini 
44628f1ea47aSStefano Zampini /*@C
446311a5261eSBarry Smith    MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
44648f1ea47aSStefano Zampini 
44650ab4885dSBarry Smith    Not Collective; No Fortran Support
44668f1ea47aSStefano Zampini 
44678f1ea47aSStefano Zampini    Input Parameter:
446811a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
44698f1ea47aSStefano Zampini 
44708f1ea47aSStefano Zampini    Output Parameter:
44718f1ea47aSStefano Zampini .   array - pointer to the data
44728f1ea47aSStefano Zampini 
44738f1ea47aSStefano Zampini    Level: intermediate
44748f1ea47aSStefano Zampini 
44751cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
44768f1ea47aSStefano Zampini @*/
4477d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array)
4478d71ae5a4SJacob Faibussowitsch {
4479d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44808f1ea47aSStefano Zampini 
44818f1ea47aSStefano Zampini   PetscFunctionBegin;
4482d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
44839566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4484d67d9f35SJunchao Zhang   } else {
4485d67d9f35SJunchao Zhang     *array = NULL;
4486d67d9f35SJunchao Zhang   }
44873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4488d67d9f35SJunchao Zhang }
4489d67d9f35SJunchao Zhang 
4490d67d9f35SJunchao Zhang /*@C
449111a5261eSBarry Smith    MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4492d67d9f35SJunchao Zhang 
44930ab4885dSBarry Smith    Not Collective; No Fortran Support
4494d67d9f35SJunchao Zhang 
4495d67d9f35SJunchao Zhang    Input Parameter:
449611a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
4497d67d9f35SJunchao Zhang 
4498d67d9f35SJunchao Zhang    Output Parameter:
4499d67d9f35SJunchao Zhang .   array - pointer to the data
4500d67d9f35SJunchao Zhang 
4501d67d9f35SJunchao Zhang    Level: intermediate
4502d67d9f35SJunchao Zhang 
45031cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
4504d67d9f35SJunchao Zhang @*/
4505d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array)
4506d71ae5a4SJacob Faibussowitsch {
4507d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4508d67d9f35SJunchao Zhang 
4509d67d9f35SJunchao Zhang   PetscFunctionBegin;
4510d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
45119566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4512d67d9f35SJunchao Zhang   } else {
4513d67d9f35SJunchao Zhang     *array = aij->a;
4514d67d9f35SJunchao Zhang   }
45159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
45169566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
45173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4518d67d9f35SJunchao Zhang }
4519d67d9f35SJunchao Zhang 
4520d67d9f35SJunchao Zhang /*@C
4521d67d9f35SJunchao Zhang    MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead
4522d67d9f35SJunchao Zhang 
45230ab4885dSBarry Smith    Not Collective; No Fortran Support
4524d67d9f35SJunchao Zhang 
4525d67d9f35SJunchao Zhang    Input Parameter:
4526d67d9f35SJunchao Zhang .  mat - a MATSEQAIJ matrix
4527d67d9f35SJunchao Zhang 
4528d67d9f35SJunchao Zhang    Output Parameter:
4529d67d9f35SJunchao Zhang .   array - pointer to the data
4530d67d9f35SJunchao Zhang 
4531d67d9f35SJunchao Zhang    Level: intermediate
4532d67d9f35SJunchao Zhang 
45331cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
4534d67d9f35SJunchao Zhang @*/
4535d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array)
4536d71ae5a4SJacob Faibussowitsch {
4537d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4538d67d9f35SJunchao Zhang 
4539d67d9f35SJunchao Zhang   PetscFunctionBegin;
4540d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
45419566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4542d67d9f35SJunchao Zhang   } else {
4543d67d9f35SJunchao Zhang     *array = NULL;
4544d67d9f35SJunchao Zhang   }
45453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45468f1ea47aSStefano Zampini }
45478f1ea47aSStefano Zampini 
45488f1ea47aSStefano Zampini /*@C
454911a5261eSBarry Smith    MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
45507ee59b9bSJunchao Zhang 
45510ab4885dSBarry Smith    Not Collective; No Fortran Support
45527ee59b9bSJunchao Zhang 
45537ee59b9bSJunchao Zhang    Input Parameter:
455411a5261eSBarry Smith .  mat - a matrix of type `MATSEQAIJ` or its subclasses
45557ee59b9bSJunchao Zhang 
45567ee59b9bSJunchao Zhang    Output Parameters:
45577ee59b9bSJunchao Zhang +  i - row map array of the matrix
45587ee59b9bSJunchao Zhang .  j - column index array of the matrix
45597ee59b9bSJunchao Zhang .  a - data array of the matrix
45607ee59b9bSJunchao Zhang -  memtype - memory type of the arrays
45617ee59b9bSJunchao Zhang 
45622ef1f0ffSBarry Smith    Level: Developer
45632ef1f0ffSBarry Smith 
45647ee59b9bSJunchao Zhang   Notes:
45652ef1f0ffSBarry Smith    Any of the output parameters can be `NULL`, in which case the corresponding value is not returned.
45667ee59b9bSJunchao Zhang    If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
45677ee59b9bSJunchao Zhang 
45687ee59b9bSJunchao Zhang    One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
45692ef1f0ffSBarry Smith    If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix.
45707ee59b9bSJunchao Zhang 
45711cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45727ee59b9bSJunchao Zhang @*/
4573d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype)
4574d71ae5a4SJacob Faibussowitsch {
45757ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
45767ee59b9bSJunchao Zhang 
45777ee59b9bSJunchao Zhang   PetscFunctionBegin;
45787ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
45797ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
45807ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
45817ee59b9bSJunchao Zhang   } else {
45827ee59b9bSJunchao Zhang     if (i) *i = aij->i;
45837ee59b9bSJunchao Zhang     if (j) *j = aij->j;
45847ee59b9bSJunchao Zhang     if (a) *a = aij->a;
45857ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
45867ee59b9bSJunchao Zhang   }
45873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45887ee59b9bSJunchao Zhang }
45897ee59b9bSJunchao Zhang 
45907ee59b9bSJunchao Zhang /*@C
459121e72a00SBarry Smith    MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
459221e72a00SBarry Smith 
459321e72a00SBarry Smith    Not Collective
459421e72a00SBarry Smith 
459521e72a00SBarry Smith    Input Parameter:
459611a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
459721e72a00SBarry Smith 
459821e72a00SBarry Smith    Output Parameter:
459921e72a00SBarry Smith .   nz - the maximum number of nonzeros in any row
460021e72a00SBarry Smith 
460121e72a00SBarry Smith    Level: intermediate
460221e72a00SBarry Smith 
46031cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
460421e72a00SBarry Smith @*/
4605d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4606d71ae5a4SJacob Faibussowitsch {
460721e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
460821e72a00SBarry Smith 
460921e72a00SBarry Smith   PetscFunctionBegin;
461021e72a00SBarry Smith   *nz = aij->rmax;
46113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
461221e72a00SBarry Smith }
461321e72a00SBarry Smith 
46142c4ab24aSJunchao Zhang static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void *data)
46152c4ab24aSJunchao Zhang {
46162c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)data;
46172c4ab24aSJunchao Zhang   PetscFunctionBegin;
46182c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->perm));
46192c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->jmap));
46202c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo));
46212c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
46222c4ab24aSJunchao Zhang }
46232c4ab24aSJunchao Zhang 
4624d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4625d71ae5a4SJacob Faibussowitsch {
4626394ed5ebSJunchao Zhang   MPI_Comm             comm;
4627394ed5ebSJunchao Zhang   PetscInt            *i, *j;
4628394ed5ebSJunchao Zhang   PetscInt             M, N, row;
4629394ed5ebSJunchao Zhang   PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4630394ed5ebSJunchao Zhang   PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
4631394ed5ebSJunchao Zhang   PetscInt            *Aj;
4632394ed5ebSJunchao Zhang   PetscScalar         *Aa;
4633cbc6b225SStefano Zampini   Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)(mat->data);
4634cbc6b225SStefano Zampini   MatType              rtype;
4635394ed5ebSJunchao Zhang   PetscCount          *perm, *jmap;
46362c4ab24aSJunchao Zhang   PetscContainer       container;
46372c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4638394ed5ebSJunchao Zhang 
4639394ed5ebSJunchao Zhang   PetscFunctionBegin;
46409566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
46419566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4642e8729f6fSJunchao Zhang   i = coo_i;
4643e8729f6fSJunchao Zhang   j = coo_j;
46449566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
4645394ed5ebSJunchao Zhang   for (k = 0; k < coo_n; k++) { /* Ignore entries with negative row or col indices */
4646394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
4647394ed5ebSJunchao Zhang     perm[k] = k;
4648394ed5ebSJunchao Zhang   }
4649394ed5ebSJunchao Zhang 
4650394ed5ebSJunchao Zhang   /* Sort by row */
46519566063dSJacob Faibussowitsch   PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
4652651b1cf9SStefano Zampini 
4653651b1cf9SStefano Zampini   /* Advance k to the first row with a non-negative index */
4654651b1cf9SStefano Zampini   for (k = 0; k < coo_n; k++)
46559371c9d4SSatish Balay     if (i[k] >= 0) break;
4656394ed5ebSJunchao Zhang   nneg = k;
46579566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4658394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
465935cb6cd3SPierre Jolivet   jmap++;                                           /* Inc jmap by 1 for convenience */
4660394ed5ebSJunchao Zhang 
46619566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(M + 1, &Ai));        /* CSR of A */
46629566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */
4663394ed5ebSJunchao Zhang 
4664651b1cf9SStefano Zampini   /* Support for HYPRE */
4665651b1cf9SStefano Zampini   PetscBool   hypre;
4666651b1cf9SStefano Zampini   const char *name;
4667651b1cf9SStefano Zampini   PetscCall(PetscObjectGetName((PetscObject)mat, &name));
4668651b1cf9SStefano Zampini   PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre));
4669651b1cf9SStefano Zampini 
4670394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
467135cb6cd3SPierre Jolivet   Ai++;  /* Inc by 1 for convenience */
4672394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4673394ed5ebSJunchao Zhang   while (k < coo_n) {
4674394ed5ebSJunchao Zhang     row   = i[k];
4675394ed5ebSJunchao Zhang     start = k; /* [start,end) indices for this row */
4676394ed5ebSJunchao Zhang     while (k < coo_n && i[k] == row) k++;
4677394ed5ebSJunchao Zhang     end = k;
4678651b1cf9SStefano Zampini     /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
4679651b1cf9SStefano Zampini     if (hypre) {
4680651b1cf9SStefano Zampini       PetscInt  minj    = PETSC_MAX_INT;
4681651b1cf9SStefano Zampini       PetscBool hasdiag = PETSC_FALSE;
4682651b1cf9SStefano Zampini       for (p = start; p < end; p++) {
4683651b1cf9SStefano Zampini         hasdiag = (PetscBool)(hasdiag || (j[p] == row));
4684651b1cf9SStefano Zampini         minj    = PetscMin(minj, j[p]);
4685651b1cf9SStefano Zampini       }
4686651b1cf9SStefano Zampini       if (hasdiag) {
4687651b1cf9SStefano Zampini         for (p = start; p < end; p++) {
4688651b1cf9SStefano Zampini           if (j[p] == minj) j[p] = row;
4689651b1cf9SStefano Zampini           else if (j[p] == row) j[p] = minj;
4690651b1cf9SStefano Zampini         }
4691651b1cf9SStefano Zampini       }
4692651b1cf9SStefano Zampini     }
46939566063dSJacob Faibussowitsch     PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
4694651b1cf9SStefano Zampini 
4695394ed5ebSJunchao Zhang     /* Find number of unique col entries in this row */
4696394ed5ebSJunchao Zhang     Aj[q]   = j[start]; /* Log the first nonzero in this row */
4697651b1cf9SStefano Zampini     jmap[q] = 1;        /* Number of repeats of this nonzero entry */
4698394ed5ebSJunchao Zhang     Ai[row] = 1;
4699394ed5ebSJunchao Zhang     nnz++;
4700394ed5ebSJunchao Zhang 
4701394ed5ebSJunchao Zhang     for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4702394ed5ebSJunchao Zhang       if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4703394ed5ebSJunchao Zhang         q++;
4704394ed5ebSJunchao Zhang         jmap[q] = 1;
4705394ed5ebSJunchao Zhang         Aj[q]   = j[p];
4706394ed5ebSJunchao Zhang         Ai[row]++;
4707394ed5ebSJunchao Zhang         nnz++;
4708394ed5ebSJunchao Zhang       } else {
4709394ed5ebSJunchao Zhang         jmap[q]++;
4710394ed5ebSJunchao Zhang       }
4711394ed5ebSJunchao Zhang     }
4712394ed5ebSJunchao Zhang     q++; /* Move to next row and thus next unique nonzero */
4713394ed5ebSJunchao Zhang   }
4714394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4715394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
4716394ed5ebSJunchao Zhang   jmap--; /* Back to the beginning of jmap[] */
4717394ed5ebSJunchao Zhang   jmap[0] = 0;
4718394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
4719394ed5ebSJunchao Zhang   if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */
4720394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4721394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4722394ed5ebSJunchao Zhang 
47239566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
47249566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
47259566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4726394ed5ebSJunchao Zhang     jmap = jmap_new;
4727394ed5ebSJunchao Zhang 
47289566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz, &Aj_new));
47299566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
47309566063dSJacob Faibussowitsch     PetscCall(PetscFree(Aj));
4731394ed5ebSJunchao Zhang     Aj = Aj_new;
4732394ed5ebSJunchao Zhang   }
4733394ed5ebSJunchao Zhang 
4734394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4735394ed5ebSJunchao Zhang     PetscCount *perm_new;
4736cbc6b225SStefano Zampini 
47379566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
47389566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
47399566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4740394ed5ebSJunchao Zhang     perm = perm_new;
4741394ed5ebSJunchao Zhang   }
4742394ed5ebSJunchao Zhang 
47439566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
47449566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */
47459566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4746394ed5ebSJunchao Zhang 
4747394ed5ebSJunchao Zhang   seqaij->singlemalloc = PETSC_FALSE;            /* Ai, Aj and Aa are not allocated in one big malloc */
4748394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
47492c4ab24aSJunchao Zhang 
47502c4ab24aSJunchao Zhang   // Put the COO struct in a container and then attach that to the matrix
47512c4ab24aSJunchao Zhang   PetscCall(PetscMalloc1(1, &coo));
47522c4ab24aSJunchao Zhang   coo->nz   = nnz;
47532c4ab24aSJunchao Zhang   coo->n    = coo_n;
47542c4ab24aSJunchao Zhang   coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
47552c4ab24aSJunchao Zhang   coo->jmap = jmap;         // of length nnz+1
47562c4ab24aSJunchao Zhang   coo->perm = perm;
47572c4ab24aSJunchao Zhang   PetscCall(PetscContainerCreate(PETSC_COMM_SELF, &container));
47582c4ab24aSJunchao Zhang   PetscCall(PetscContainerSetPointer(container, coo));
47592c4ab24aSJunchao Zhang   PetscCall(PetscContainerSetUserDestroy(container, MatCOOStructDestroy_SeqAIJ));
47602c4ab24aSJunchao Zhang   PetscCall(PetscObjectCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", (PetscObject)container));
47612c4ab24aSJunchao Zhang   PetscCall(PetscContainerDestroy(&container));
47623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4763394ed5ebSJunchao Zhang }
4764394ed5ebSJunchao Zhang 
4765d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4766d71ae5a4SJacob Faibussowitsch {
4767394ed5ebSJunchao Zhang   Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
4768394ed5ebSJunchao Zhang   PetscCount           i, j, Annz = aseq->nz;
47692c4ab24aSJunchao Zhang   PetscCount          *perm, *jmap;
4770394ed5ebSJunchao Zhang   PetscScalar         *Aa;
47712c4ab24aSJunchao Zhang   PetscContainer       container;
47722c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4773394ed5ebSJunchao Zhang 
4774394ed5ebSJunchao Zhang   PetscFunctionBegin;
47752c4ab24aSJunchao Zhang   PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
47762c4ab24aSJunchao Zhang   PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
47772c4ab24aSJunchao Zhang   PetscCall(PetscContainerGetPointer(container, (void **)&coo));
47782c4ab24aSJunchao Zhang   perm = coo->perm;
47792c4ab24aSJunchao Zhang   jmap = coo->jmap;
47809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4781394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4782b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4783b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4784b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4785394ed5ebSJunchao Zhang   }
47869566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
47873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4788394ed5ebSJunchao Zhang }
4789394ed5ebSJunchao Zhang 
/*
   Prototypes of the conversion routines registered in MatCreate_SeqAIJ(); each one is declared only when the
   corresponding PETSC_HAVE_* macro is defined
*/
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat A, MatType type, MatReuse reuse, Mat *newmat);
#endif
#if defined(PETSC_HAVE_HIP)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat A, MatType type, MatReuse reuse, Mat *newmat);
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat A, MatType type, MatReuse reuse, Mat *newmat);
#endif
479902fe1965SBarry Smith 
4800d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4801d71ae5a4SJacob Faibussowitsch {
4802273d9f13SBarry Smith   Mat_SeqAIJ *b;
480338baddfdSBarry Smith   PetscMPIInt size;
4804273d9f13SBarry Smith 
4805273d9f13SBarry Smith   PetscFunctionBegin;
48069566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
480708401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4808273d9f13SBarry Smith 
48094dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
48102205254eSKarl Rupp 
4811b0a32e0cSBarry Smith   B->data   = (void *)b;
4812aea10558SJacob Faibussowitsch   B->ops[0] = MatOps_Values;
4813071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
48142205254eSKarl Rupp 
4815f4259b30SLisandro Dalcin   b->row                = NULL;
4816f4259b30SLisandro Dalcin   b->col                = NULL;
4817f4259b30SLisandro Dalcin   b->icol               = NULL;
4818b810aeb4SBarry Smith   b->reallocs           = 0;
481936db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4820f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4821416022c9SBarry Smith   b->nonew              = 0;
4822f4259b30SLisandro Dalcin   b->diag               = NULL;
4823f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4824f4259b30SLisandro Dalcin   B->spptr              = NULL;
4825f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4826f4259b30SLisandro Dalcin   b->idiag              = NULL;
4827f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4828f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
482971f1c65dSBarry Smith   b->omega              = 1.0;
483071f1c65dSBarry Smith   b->fshift             = 0.0;
483171f1c65dSBarry Smith   b->idiagvalid         = PETSC_FALSE;
4832bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4833a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
483417ab2063SBarry Smith 
48359566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4836d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
48379566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
48389566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4839b3866ffcSBarry Smith #endif
48409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
48419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
48429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
48439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
48449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
48459566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
48469566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
48479779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
48489566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4849191b95cbSRichard Tran Mills #endif
485034b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
48519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
48529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
48539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
485402fe1965SBarry Smith #endif
4855d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4856d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
4857d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
4858d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
4859d5e393b6SSuyash Tandon #endif
48603d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
48619566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
48623d0639e7SStefano Zampini #endif
48639566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4864af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
48659566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4866af8000cdSHong Zhang #endif
4867d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
48689566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4869d24d4204SJose E. Roman #endif
487063c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
48719566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
48729566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
487363c07aadSStefano Zampini #endif
48749566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
48759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
48769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
48779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
48789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ));
48799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
48809566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
48819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
48829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
48839566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
48849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
48859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
48869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
48879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
48889566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
48899566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
48909566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
48919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
48923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
489317ab2063SBarry Smith }
489417ab2063SBarry Smith 
4895b24902e0SBarry Smith /*
48963893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4897b24902e0SBarry Smith */
4898d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4899d71ae5a4SJacob Faibussowitsch {
49002a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4901071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
490217ab2063SBarry Smith 
49033a40ed3dSBarry Smith   PetscFunctionBegin;
4904aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4905273d9f13SBarry Smith 
4906d5f3da31SBarry Smith   C->factortype = A->factortype;
4907f4259b30SLisandro Dalcin   c->row        = NULL;
4908f4259b30SLisandro Dalcin   c->col        = NULL;
4909f4259b30SLisandro Dalcin   c->icol       = NULL;
49106ad4291fSHong Zhang   c->reallocs   = 0;
491117ab2063SBarry Smith 
491269272f91SPierre Jolivet   C->assembled = A->assembled;
491317ab2063SBarry Smith 
491469272f91SPierre Jolivet   if (A->preallocated) {
49159566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
49169566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4917eec197d1SBarry Smith 
491831fe6a7dSBarry Smith     if (!A->hash_active) {
49199566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->imax));
49209566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
49219566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->ilen));
49229566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));
492317ab2063SBarry Smith 
492417ab2063SBarry Smith       /* allocate the matrix space */
4925f77e22a1SHong Zhang       if (mallocmatspace) {
49269566063dSJacob Faibussowitsch         PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i));
49272205254eSKarl Rupp 
4928f1e2ffcdSBarry Smith         c->singlemalloc = PETSC_TRUE;
49292205254eSKarl Rupp 
49309566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->i, a->i, m + 1));
493117ab2063SBarry Smith         if (m > 0) {
49329566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
4933be6bf707SBarry Smith           if (cpvalues == MAT_COPY_VALUES) {
49342e5835c6SStefano Zampini             const PetscScalar *aa;
49352e5835c6SStefano Zampini 
49369566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
49379566063dSJacob Faibussowitsch             PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
49389566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
4939be6bf707SBarry Smith           } else {
49409566063dSJacob Faibussowitsch             PetscCall(PetscArrayzero(c->a, a->i[m]));
494117ab2063SBarry Smith           }
494208480c60SBarry Smith         }
4943f77e22a1SHong Zhang       }
494431fe6a7dSBarry Smith       C->preallocated = PETSC_TRUE;
494531fe6a7dSBarry Smith     } else {
494631fe6a7dSBarry Smith       PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix");
494731fe6a7dSBarry Smith       PetscCall(MatSetUp(C));
494831fe6a7dSBarry Smith     }
494917ab2063SBarry Smith 
49506ad4291fSHong Zhang     c->ignorezeroentries = a->ignorezeroentries;
4951416022c9SBarry Smith     c->roworiented       = a->roworiented;
4952416022c9SBarry Smith     c->nonew             = a->nonew;
4953416022c9SBarry Smith     if (a->diag) {
49549566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &c->diag));
49559566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt)));
4956071fcb05SBarry Smith     } else c->diag = NULL;
49572205254eSKarl Rupp 
4958f4259b30SLisandro Dalcin     c->solve_work         = NULL;
4959f4259b30SLisandro Dalcin     c->saved_values       = NULL;
4960f4259b30SLisandro Dalcin     c->idiag              = NULL;
4961f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
4962a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
4963e6b907acSBarry Smith     c->free_a             = PETSC_TRUE;
4964e6b907acSBarry Smith     c->free_ij            = PETSC_TRUE;
49656ad4291fSHong Zhang 
4966893ad86cSHong Zhang     c->rmax  = a->rmax;
4967416022c9SBarry Smith     c->nz    = a->nz;
49688ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
4969754ec7b1SSatish Balay 
49706ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
49716ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
4972cd6b891eSBarry Smith     if (a->compressedrow.use) {
49736ad4291fSHong Zhang       i = a->compressedrow.nrows;
49749566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
49759566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
49769566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
497727ea64f8SHong Zhang     } else {
497827ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
49790298fd71SBarry Smith       c->compressedrow.i      = NULL;
49800298fd71SBarry Smith       c->compressedrow.rindex = NULL;
49816ad4291fSHong Zhang     }
4982ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
4983e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
49844846f1f5SKris Buschelman 
49859566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
498669272f91SPierre Jolivet   }
49879566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
49883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
498917ab2063SBarry Smith }
499017ab2063SBarry Smith 
4991d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
4992d71ae5a4SJacob Faibussowitsch {
4993b24902e0SBarry Smith   PetscFunctionBegin;
49949566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
49959566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
499648a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
49979566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
49989566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
49993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5000b24902e0SBarry Smith }
5001b24902e0SBarry Smith 
5002d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
5003d71ae5a4SJacob Faibussowitsch {
500452f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
500552f91c60SVaclav Hapla 
500652f91c60SVaclav Hapla   PetscFunctionBegin;
500752f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
500852f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
5009c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
50109566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
50119566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
50129566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
501352f91c60SVaclav Hapla   if (isbinary) {
50149566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
501552f91c60SVaclav Hapla   } else if (ishdf5) {
501652f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
50179566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
501852f91c60SVaclav Hapla #else
501952f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
502052f91c60SVaclav Hapla #endif
502152f91c60SVaclav Hapla   } else {
502298921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
502352f91c60SVaclav Hapla   }
50243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
502552f91c60SVaclav Hapla }
502652f91c60SVaclav Hapla 
5027d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
5028d71ae5a4SJacob Faibussowitsch {
50293ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
50303ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
5031fbdbba38SShri Abhyankar 
5032fbdbba38SShri Abhyankar   PetscFunctionBegin;
50339566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
5034bbead8a2SBarry Smith 
50353ea6fe3dSLisandro Dalcin   /* read in matrix header */
50369566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
503708401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
50389371c9d4SSatish Balay   M  = header[1];
50399371c9d4SSatish Balay   N  = header[2];
50409371c9d4SSatish Balay   nz = header[3];
504108401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
504208401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
504308401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
5044fbdbba38SShri Abhyankar 
50453ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
50469566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
50473ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
50483ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
50493ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
50503ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
50513ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
50529566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
50539566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
50543ea6fe3dSLisandro Dalcin 
50553ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
50569566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5057aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
50583ea6fe3dSLisandro Dalcin 
5059fbdbba38SShri Abhyankar   /* read in row lengths */
50609566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
50619566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
50623ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
50639371c9d4SSatish Balay   sum = 0;
50649371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
506508401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
50663ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
50679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
50689566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5069aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
50703ea6fe3dSLisandro Dalcin   /* store row lengths */
50719566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
50729566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
5073fbdbba38SShri Abhyankar 
50743ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
50759371c9d4SSatish Balay   a->i[0] = 0;
50769371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
50773ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
50789566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
50793ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
50809566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
5081fbdbba38SShri Abhyankar 
50829566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
50839566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
50843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5085fbdbba38SShri Abhyankar }
5086fbdbba38SShri Abhyankar 
5087d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
5088d71ae5a4SJacob Faibussowitsch {
50897264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
5090fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
5091eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5092eeffb40dSHong Zhang   PetscInt k;
5093eeffb40dSHong Zhang #endif
50947264ac53SSatish Balay 
50953a40ed3dSBarry Smith   PetscFunctionBegin;
5096bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
5097d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
5098ca44d042SBarry Smith     *flg = PETSC_FALSE;
50993ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
5100bcd2baecSBarry Smith   }
51017264ac53SSatish Balay 
51027264ac53SSatish Balay   /* if the a->i are the same */
51039566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
51043ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
51057264ac53SSatish Balay 
51067264ac53SSatish Balay   /* if a->j are the same */
51079566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
51083ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
5109bcd2baecSBarry Smith 
51109566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
51119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5112bcd2baecSBarry Smith   /* if a->a are the same */
5113eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5114eeffb40dSHong Zhang   for (k = 0; k < a->nz; k++) {
5115fff043a9SJunchao Zhang     if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) {
5116eeffb40dSHong Zhang       *flg = PETSC_FALSE;
51173ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
5118eeffb40dSHong Zhang     }
5119eeffb40dSHong Zhang   }
5120eeffb40dSHong Zhang #else
51219566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
5122eeffb40dSHong Zhang #endif
51239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
51249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
51253ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51267264ac53SSatish Balay }
512736db0b34SBarry Smith 
512805869f15SSatish Balay /*@
512911a5261eSBarry Smith      MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
513036db0b34SBarry Smith               provided by the user.
513136db0b34SBarry Smith 
5132d083f849SBarry Smith       Collective
513336db0b34SBarry Smith 
513436db0b34SBarry Smith    Input Parameters:
513536db0b34SBarry Smith +   comm - must be an MPI communicator of size 1
513636db0b34SBarry Smith .   m - number of rows
513736db0b34SBarry Smith .   n - number of columns
5138483a2f95SBarry Smith .   i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
513936db0b34SBarry Smith .   j - column indices
514036db0b34SBarry Smith -   a - matrix values
514136db0b34SBarry Smith 
514236db0b34SBarry Smith    Output Parameter:
514336db0b34SBarry Smith .   mat - the matrix
514436db0b34SBarry Smith 
514536db0b34SBarry Smith    Level: intermediate
514636db0b34SBarry Smith 
514736db0b34SBarry Smith    Notes:
51482ef1f0ffSBarry Smith        The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
5149292fb18eSBarry Smith     once the matrix is destroyed and not before
515036db0b34SBarry Smith 
515136db0b34SBarry Smith        You cannot set new nonzero locations into this matrix, that will generate an error.
515236db0b34SBarry Smith 
51532ef1f0ffSBarry Smith        The `i` and `j` indices are 0 based
515436db0b34SBarry Smith 
5155a4552177SSatish Balay        The format which is used for the sparse matrix input, is equivalent to a
5156a4552177SSatish Balay     row-major ordering.. i.e for the following matrix, the input data expected is
51578eef79e4SBarry Smith     as shown
51582ef1f0ffSBarry Smith .vb
51592ef1f0ffSBarry Smith         1 0 0
51602ef1f0ffSBarry Smith         2 0 3
51612ef1f0ffSBarry Smith         4 5 6
5162a4552177SSatish Balay 
51632ef1f0ffSBarry Smith         i =  {0,1,3,6}  [size = nrow+1  = 3+1]
51642ef1f0ffSBarry Smith         j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
51652ef1f0ffSBarry Smith         v =  {1,2,3,4,5,6}  [size = 6]
51662ef1f0ffSBarry Smith .ve
5167a4552177SSatish Balay 
51681cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
516936db0b34SBarry Smith @*/
5170d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5171d71ae5a4SJacob Faibussowitsch {
5172cbcfb4deSHong Zhang   PetscInt    ii;
517336db0b34SBarry Smith   Mat_SeqAIJ *aij;
5174cbcfb4deSHong Zhang   PetscInt    jj;
517536db0b34SBarry Smith 
517636db0b34SBarry Smith   PetscFunctionBegin;
5177aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
51789566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
51799566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
51809566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
51819566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
51829566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5183ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
51849566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
51859566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5186ab93d7beSBarry Smith 
518736db0b34SBarry Smith   aij->i            = i;
518836db0b34SBarry Smith   aij->j            = j;
518936db0b34SBarry Smith   aij->a            = a;
519036db0b34SBarry Smith   aij->singlemalloc = PETSC_FALSE;
519136db0b34SBarry Smith   aij->nonew        = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5192e6b907acSBarry Smith   aij->free_a       = PETSC_FALSE;
5193e6b907acSBarry Smith   aij->free_ij      = PETSC_FALSE;
519436db0b34SBarry Smith 
5195cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
519636db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
519776bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5198aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
51999985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
520008401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
520108401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
52029985e31cSBarry Smith       }
520336db0b34SBarry Smith     }
520476bd3646SJed Brown   }
520576bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
520636db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
520708401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5208aed4548fSBarry Smith       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
520936db0b34SBarry Smith     }
521076bd3646SJed Brown   }
521136db0b34SBarry Smith 
52129566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52139566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52143ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
521536db0b34SBarry Smith }
5216cbc6b225SStefano Zampini 
5217f62e3866SBarry Smith /*@
521811a5261eSBarry Smith      MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
52198a0b0e6bSVictor Minden               provided by the user.
52208a0b0e6bSVictor Minden 
5221d083f849SBarry Smith       Collective
52228a0b0e6bSVictor Minden 
52238a0b0e6bSVictor Minden    Input Parameters:
52248a0b0e6bSVictor Minden +   comm - must be an MPI communicator of size 1
52258a0b0e6bSVictor Minden .   m   - number of rows
52268a0b0e6bSVictor Minden .   n   - number of columns
52278a0b0e6bSVictor Minden .   i   - row indices
52288a0b0e6bSVictor Minden .   j   - column indices
52291230e6d1SVictor Minden .   a   - matrix values
52301230e6d1SVictor Minden .   nz  - number of nonzeros
52312ef1f0ffSBarry Smith -   idx - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
52328a0b0e6bSVictor Minden 
52338a0b0e6bSVictor Minden    Output Parameter:
52348a0b0e6bSVictor Minden .   mat - the matrix
52358a0b0e6bSVictor Minden 
52368a0b0e6bSVictor Minden    Level: intermediate
52378a0b0e6bSVictor Minden 
5238f62e3866SBarry Smith    Example:
5239f62e3866SBarry Smith        For the following matrix, the input data expected is as shown (using 0 based indexing)
52409e99939fSJunchao Zhang .vb
52418a0b0e6bSVictor Minden         1 0 0
52428a0b0e6bSVictor Minden         2 0 3
52438a0b0e6bSVictor Minden         4 5 6
52448a0b0e6bSVictor Minden 
52458a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
52468a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
52478a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
52489e99939fSJunchao Zhang .ve
52492ef1f0ffSBarry Smith   Note:
5250d7547e51SJunchao Zhang     Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5251d7547e51SJunchao Zhang     and are particularly useful in iterative applications.
52528a0b0e6bSVictor Minden 
52531cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
52548a0b0e6bSVictor Minden @*/
5255d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx)
5256d71ae5a4SJacob Faibussowitsch {
5257d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
52588a0b0e6bSVictor Minden 
52598a0b0e6bSVictor Minden   PetscFunctionBegin;
52609566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5261ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
52629566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52639566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52649566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
52661230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
52671230e6d1SVictor Minden     if (idx) {
52681230e6d1SVictor Minden       row = i[ii] - 1;
52691230e6d1SVictor Minden       col = j[ii] - 1;
52701230e6d1SVictor Minden     } else {
52711230e6d1SVictor Minden       row = i[ii];
52721230e6d1SVictor Minden       col = j[ii];
52738a0b0e6bSVictor Minden     }
52749566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
52758a0b0e6bSVictor Minden   }
52769566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52779566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52789566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
52793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
52808a0b0e6bSVictor Minden }
528136db0b34SBarry Smith 
5282d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A)
5283d71ae5a4SJacob Faibussowitsch {
5284acf2f550SJed Brown   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
5285acf2f550SJed Brown 
5286acf2f550SJed Brown   PetscFunctionBegin;
5287acf2f550SJed Brown   a->idiagvalid  = PETSC_FALSE;
5288acf2f550SJed Brown   a->ibdiagvalid = PETSC_FALSE;
52892205254eSKarl Rupp 
52909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A));
52913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5292acf2f550SJed Brown }
5293acf2f550SJed Brown 
5294d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
5295d71ae5a4SJacob Faibussowitsch {
52969c8f2541SHong Zhang   PetscFunctionBegin;
52979566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
52983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
52999c8f2541SHong Zhang }
53009c8f2541SHong Zhang 
530181824310SBarry Smith /*
530253dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
530353dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
530453dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
530553dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
530653dd7562SDmitry Karpeev  */
5307d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5308d71ae5a4SJacob Faibussowitsch {
530953dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
531053dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
531153dd7562SDmitry Karpeev   PetscBool       seqaij;
531253dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
531353dd7562SDmitry Karpeev   PetscScalar     v;
531453dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
531553dd7562SDmitry Karpeev 
531653dd7562SDmitry Karpeev   PetscFunctionBegin;
53173ba16761SJacob Faibussowitsch   if (!B) PetscFunctionReturn(PETSC_SUCCESS);
531853dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
53199566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
532028b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
532153dd7562SDmitry Karpeev   if (rowemb) {
53229566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
532308401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
532453dd7562SDmitry Karpeev   } else {
532508401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
532653dd7562SDmitry Karpeev   }
532753dd7562SDmitry Karpeev   if (colemb) {
53289566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
532908401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
533053dd7562SDmitry Karpeev   } else {
533108401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
533253dd7562SDmitry Karpeev   }
533353dd7562SDmitry Karpeev 
533453dd7562SDmitry Karpeev   Baij = (Mat_SeqAIJ *)(B->data);
533553dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
53369566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5337ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
53389566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
53399566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
534053dd7562SDmitry Karpeev   }
534148a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
534253dd7562SDmitry Karpeev   count      = 0;
534353dd7562SDmitry Karpeev   rowindices = NULL;
534453dd7562SDmitry Karpeev   colindices = NULL;
534548a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
534648a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
534753dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
534853dd7562SDmitry Karpeev     PetscInt row;
534953dd7562SDmitry Karpeev     row = i;
535053dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
535153dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
535253dd7562SDmitry Karpeev       PetscInt col;
535353dd7562SDmitry Karpeev       col = Baij->j[count];
535453dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
535553dd7562SDmitry Karpeev       v = Baij->a[count];
53569566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
535753dd7562SDmitry Karpeev       ++count;
535853dd7562SDmitry Karpeev     }
535953dd7562SDmitry Karpeev   }
536053dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
536153dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
536253dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
536353dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
536453dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
53653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
536653dd7562SDmitry Karpeev }
536753dd7562SDmitry Karpeev 
5368dec0b466SHong Zhang PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A)
5369dec0b466SHong Zhang {
5370dec0b466SHong Zhang   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
5371dec0b466SHong Zhang   MatScalar  *aa = a->a;
5372dec0b466SHong Zhang   PetscInt    m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k;
5373dec0b466SHong Zhang   PetscInt   *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0;
5374dec0b466SHong Zhang 
5375dec0b466SHong Zhang   PetscFunctionBegin;
5376dec0b466SHong Zhang   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix");
5377dec0b466SHong Zhang   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
5378dec0b466SHong Zhang   for (i = 1; i <= m; i++) {
5379dec0b466SHong Zhang     /* move each nonzero entry back by the amount of zero slots (fshift) before it*/
5380dec0b466SHong Zhang     for (k = ai[i - 1]; k < ai[i]; k++) {
5381dec0b466SHong Zhang       if (aa[k] == 0 && aj[k] != i - 1) fshift++;
5382dec0b466SHong Zhang       else {
5383dec0b466SHong Zhang         if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1));
5384dec0b466SHong Zhang         aa[k - fshift] = aa[k];
5385dec0b466SHong Zhang         aj[k - fshift] = aj[k];
5386dec0b466SHong Zhang       }
5387dec0b466SHong Zhang     }
5388dec0b466SHong Zhang     ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration
5389dec0b466SHong Zhang     fshift_prev = fshift;
5390dec0b466SHong Zhang     /* reset ilen and imax for each row */
5391dec0b466SHong Zhang     ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1];
5392dec0b466SHong Zhang     a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0);
5393dec0b466SHong Zhang     rmax = PetscMax(rmax, ailen[i - 1]);
5394dec0b466SHong Zhang   }
5395dec0b466SHong Zhang   if (m) {
5396dec0b466SHong Zhang     ai[m] -= fshift;
5397dec0b466SHong Zhang     a->nz = ai[m];
5398dec0b466SHong Zhang   }
5399dec0b466SHong Zhang   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz));
5400dec0b466SHong Zhang   A->nonzerostate -= fshift;
5401dec0b466SHong Zhang   A->info.nz_unneeded += (PetscReal)fshift;
5402dec0b466SHong Zhang   a->rmax = rmax;
5403dec0b466SHong Zhang   if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A));
5404dec0b466SHong Zhang   PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
5405dec0b466SHong Zhang   PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
54063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5407dec0b466SHong Zhang }
5408dec0b466SHong Zhang 
/* List of registered SeqAIJ subtype conversion routines: MatSeqAIJRegister() adds entries to it and
   MatSeqAIJSetType() looks entries up by type name. It starts out empty (NULL). */
54094099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
54104099cc6bSBarry Smith 
54114099cc6bSBarry Smith /*@C
541211a5261eSBarry Smith    MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
54134099cc6bSBarry Smith 
5414c3339decSBarry Smith    Collective
54154099cc6bSBarry Smith 
54164099cc6bSBarry Smith    Input Parameters:
54174099cc6bSBarry Smith +  mat      - the matrix object
54184099cc6bSBarry Smith -  matype   - matrix type
54194099cc6bSBarry Smith 
54204099cc6bSBarry Smith    Options Database Key:
54214e187271SRichard Tran Mills .  -mat_seqaij_type  <method> - for example seqaijcrl
54224099cc6bSBarry Smith 
54234099cc6bSBarry Smith   Level: intermediate
54244099cc6bSBarry Smith 
54251cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat`
54264099cc6bSBarry Smith @*/
5427d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5428d71ae5a4SJacob Faibussowitsch {
54294099cc6bSBarry Smith   PetscBool sametype;
54305f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
54314099cc6bSBarry Smith 
54324099cc6bSBarry Smith   PetscFunctionBegin;
54334099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
54349566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
54353ba16761SJacob Faibussowitsch   if (sametype) PetscFunctionReturn(PETSC_SUCCESS);
54364099cc6bSBarry Smith 
54379566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
54386adde796SStefano Zampini   PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
54399566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
54403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
54414099cc6bSBarry Smith }
54424099cc6bSBarry Smith 
/*@C
  MatSeqAIJRegister - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices

   Not Collective

   Input Parameters:
+  sname - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
-  function - routine to convert to subtype

   Level: advanced

   Notes:
   `MatSeqAIJRegister()` may be called multiple times to add several user-defined matrix subtypes.

   Then, your matrix subtype can be chosen with the procedural interface via `MatSeqAIJSetType()` or at runtime via the option
$     -mat_seqaij_type my_mat

.seealso: [](ch_matrices), `Mat`, `MatSeqAIJSetType()`, `MatSeqAIJRegisterAll()`
@*/
PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
{
  PetscFunctionBegin;
  /* make sure the Mat package is initialized before adding to its subtype list */
  PetscCall(MatInitializePackage());
  PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
  PetscFunctionReturn(PETSC_SUCCESS);
}
54694099cc6bSBarry Smith 
/* Set to PETSC_TRUE by MatSeqAIJRegisterAll() so that the built-in subtypes are registered only once */
PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
54714099cc6bSBarry Smith 
54724099cc6bSBarry Smith /*@C
547311a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
54744099cc6bSBarry Smith 
54754099cc6bSBarry Smith   Not Collective
54764099cc6bSBarry Smith 
54774099cc6bSBarry Smith   Level: advanced
54784099cc6bSBarry Smith 
54792ef1f0ffSBarry Smith   Note:
54802ef1f0ffSBarry Smith   This registers the versions of `MATSEQAIJ` for GPUs
54812ef1f0ffSBarry Smith 
54821cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()`
54834099cc6bSBarry Smith @*/
5484d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5485d71ae5a4SJacob Faibussowitsch {
54864099cc6bSBarry Smith   PetscFunctionBegin;
54873ba16761SJacob Faibussowitsch   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS);
54884099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
54894099cc6bSBarry Smith 
54909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
54919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
54929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
54939779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
54949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5495485f9817SRichard Tran Mills #endif
54965063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
54979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
54985063d097SStefano Zampini #endif
5499d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
5500d5e393b6SSuyash Tandon   PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
5501d5e393b6SSuyash Tandon #endif
55025063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
55039566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
55045063d097SStefano Zampini #endif
55054099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
55069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
55074099cc6bSBarry Smith #endif
55083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55094099cc6bSBarry Smith }
551053dd7562SDmitry Karpeev 
/*
    Special version for direct calls from Fortran
*/
#include <petsc/private/fortranimpl.h>
/* Rename the C entry point to follow the Fortran compiler's symbol convention: upper case, or lower case
   without a trailing underscore. Otherwise the name matsetvaluesseqaij_ is kept as written. */
#if defined(PETSC_HAVE_FORTRAN_CAPS)
  #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
#elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
  #define matsetvaluesseqaij_ matsetvaluesseqaij
#endif
552081824310SBarry Smith 
/* Change these macros so can be used in void function */
/* Identical to PetscCallVoid, except it assigns to *_ierr */
#undef PetscCall
#define PetscCall(...) \
  do { \
    PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \
    if (PetscUnlikely(ierr_msv_mpiaij)) { \
      *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \
      return; \
    } \
  } while (0)

/* Stores the error code generated by PetscError() in *_ierr and returns from the (void) function,
   instead of returning the error code */
#undef SETERRQ
#define SETERRQ(comm, ierr, ...) \
  do { \
    *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
    return; \
  } while (0)
554181824310SBarry Smith 
5542d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5543d71ae5a4SJacob Faibussowitsch {
554481824310SBarry Smith   Mat         A = *AA;
554581824310SBarry Smith   PetscInt    m = *mm, n = *nn;
554681824310SBarry Smith   InsertMode  is = *isis;
554781824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
554881824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
554981824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
555081824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
555154f21887SBarry Smith   MatScalar  *ap, value, *aa;
5552ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5553ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
555481824310SBarry Smith 
555581824310SBarry Smith   PetscFunctionBegin;
55564994cf47SJed Brown   MatCheckPreallocated(A, 1);
555781824310SBarry Smith   imax  = a->imax;
555881824310SBarry Smith   ai    = a->i;
555981824310SBarry Smith   ailen = a->ilen;
556081824310SBarry Smith   aj    = a->j;
556181824310SBarry Smith   aa    = a->a;
556281824310SBarry Smith 
556381824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
556481824310SBarry Smith     row = im[k];
556581824310SBarry Smith     if (row < 0) continue;
55665f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
55679371c9d4SSatish Balay     rp   = aj + ai[row];
55689371c9d4SSatish Balay     ap   = aa + ai[row];
55699371c9d4SSatish Balay     rmax = imax[row];
55709371c9d4SSatish Balay     nrow = ailen[row];
557181824310SBarry Smith     low  = 0;
557281824310SBarry Smith     high = nrow;
557381824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
557481824310SBarry Smith       if (in[l] < 0) continue;
55755f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
557681824310SBarry Smith       col = in[l];
55772205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
55782205254eSKarl Rupp       else value = v[k + l * m];
55792205254eSKarl Rupp 
558081824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
558181824310SBarry Smith 
55822205254eSKarl Rupp       if (col <= lastcol) low = 0;
55832205254eSKarl Rupp       else high = nrow;
558481824310SBarry Smith       lastcol = col;
558581824310SBarry Smith       while (high - low > 5) {
558681824310SBarry Smith         t = (low + high) / 2;
558781824310SBarry Smith         if (rp[t] > col) high = t;
558881824310SBarry Smith         else low = t;
558981824310SBarry Smith       }
559081824310SBarry Smith       for (i = low; i < high; i++) {
559181824310SBarry Smith         if (rp[i] > col) break;
559281824310SBarry Smith         if (rp[i] == col) {
559381824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
559481824310SBarry Smith           else ap[i] = value;
559581824310SBarry Smith           goto noinsert;
559681824310SBarry Smith         }
559781824310SBarry Smith       }
559881824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
559981824310SBarry Smith       if (nonew == 1) goto noinsert;
56005f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5601fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
56029371c9d4SSatish Balay       N = nrow++ - 1;
56039371c9d4SSatish Balay       a->nz++;
56049371c9d4SSatish Balay       high++;
560581824310SBarry Smith       /* shift up all the later entries in this row */
560681824310SBarry Smith       for (ii = N; ii >= i; ii--) {
560781824310SBarry Smith         rp[ii + 1] = rp[ii];
560881824310SBarry Smith         ap[ii + 1] = ap[ii];
560981824310SBarry Smith       }
561081824310SBarry Smith       rp[i] = col;
561181824310SBarry Smith       ap[i] = value;
5612e56f5c9eSBarry Smith       A->nonzerostate++;
561381824310SBarry Smith     noinsert:;
561481824310SBarry Smith       low = i + 1;
561581824310SBarry Smith     }
561681824310SBarry Smith     ailen[row] = nrow;
561781824310SBarry Smith   }
561881824310SBarry Smith   PetscFunctionReturnVoid();
561981824310SBarry Smith }
/* Undefine the void-function versions of PetscCall() and SETERRQ() defined above. Their original
 * definitions cannot be recovered, so no other PETSc functions should be defined past this
 * point in the file */
#undef PetscCall
#undef SETERRQ
5625