xref: /petsc/src/mat/impls/aij/seq/aij.c (revision 49abdd8a111d9c2ef7fc48ade253ef64e07f9b37)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
1226cec326SBarry Smith #define TYPE AIJ
1326cec326SBarry Smith #define TYPE_BS
1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
1626cec326SBarry Smith #undef TYPE
1726cec326SBarry Smith #undef TYPE_BS
1826cec326SBarry Smith 
19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
20d71ae5a4SJacob Faibussowitsch {
214099cc6bSBarry Smith   PetscBool flg;
224099cc6bSBarry Smith   char      type[256];
234099cc6bSBarry Smith 
244099cc6bSBarry Smith   PetscFunctionBegin;
25d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
269566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
279566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
28d0609cedSBarry Smith   PetscOptionsEnd();
293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
304099cc6bSBarry Smith }
314099cc6bSBarry Smith 
32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
33d71ae5a4SJacob Faibussowitsch {
340716a85fSBarry Smith   PetscInt    i, m, n;
350716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
360716a85fSBarry Smith 
370716a85fSBarry Smith   PetscFunctionBegin;
389566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
399566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
400716a85fSBarry Smith   if (type == NORM_2) {
41ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
420716a85fSBarry Smith   } else if (type == NORM_1) {
43ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
440716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
45ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
46857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
47ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
48857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
49ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
506adde796SStefano Zampini   } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type");
510716a85fSBarry Smith 
520716a85fSBarry Smith   if (type == NORM_2) {
53a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
54857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
55a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
560716a85fSBarry Smith   }
573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
580716a85fSBarry Smith }
590716a85fSBarry Smith 
60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
61d71ae5a4SJacob Faibussowitsch {
623a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
633a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
643a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
653a062f41SBarry Smith   PetscInt       *rows;
663a062f41SBarry Smith 
673a062f41SBarry Smith   PetscFunctionBegin;
683a062f41SBarry Smith   for (i = 0; i < m; i++) {
69ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
703a062f41SBarry Smith   }
719566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
723a062f41SBarry Smith   cnt = 0;
733a062f41SBarry Smith   for (i = 0; i < m; i++) {
743a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
753a062f41SBarry Smith       rows[cnt] = i;
763a062f41SBarry Smith       cnt++;
773a062f41SBarry Smith     }
783a062f41SBarry Smith   }
799566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
813a062f41SBarry Smith }
823a062f41SBarry Smith 
83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
84d71ae5a4SJacob Faibussowitsch {
856ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
86fff043a9SJunchao Zhang   const MatScalar *aa;
876ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
88b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
896ce1633cSBarry Smith   PetscInt        *rows;
906ce1633cSBarry Smith 
916ce1633cSBarry Smith   PetscFunctionBegin;
929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
939566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
946ce1633cSBarry Smith   diag = a->diag;
956ce1633cSBarry Smith   for (i = 0; i < m; i++) {
96ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
976ce1633cSBarry Smith   }
989566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
996ce1633cSBarry Smith   cnt = 0;
1006ce1633cSBarry Smith   for (i = 0; i < m; i++) {
101ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
1026ce1633cSBarry Smith   }
103f1f41ecbSJed Brown   *nrows = cnt;
104f1f41ecbSJed Brown   *zrows = rows;
1059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
107f1f41ecbSJed Brown }
108f1f41ecbSJed Brown 
109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
110d71ae5a4SJacob Faibussowitsch {
111f1f41ecbSJed Brown   PetscInt nrows, *rows;
112f1f41ecbSJed Brown 
113f1f41ecbSJed Brown   PetscFunctionBegin;
1140298fd71SBarry Smith   *zrows = NULL;
1159566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1169566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1186ce1633cSBarry Smith }
1196ce1633cSBarry Smith 
120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
121d71ae5a4SJacob Faibussowitsch {
122b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
123b3a44c85SBarry Smith   const MatScalar *aa;
124b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
125b3a44c85SBarry Smith   const PetscInt  *ii;
126b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
127b3a44c85SBarry Smith 
128b3a44c85SBarry Smith   PetscFunctionBegin;
1299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
130f4259b30SLisandro Dalcin   *keptrows = NULL;
131b3a44c85SBarry Smith   ii        = a->i;
132b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
133b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
134b3a44c85SBarry Smith     if (!n) {
135b3a44c85SBarry Smith       cnt++;
136b3a44c85SBarry Smith       goto ok1;
137b3a44c85SBarry Smith     }
1382e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
139b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
140b3a44c85SBarry Smith     }
141b3a44c85SBarry Smith     cnt++;
142b3a44c85SBarry Smith   ok1:;
143b3a44c85SBarry Smith   }
1442e5835c6SStefano Zampini   if (!cnt) {
1459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1463ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1472e5835c6SStefano Zampini   }
1489566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
149b3a44c85SBarry Smith   cnt = 0;
150b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
151b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
152b3a44c85SBarry Smith     if (!n) continue;
1532e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
154b3a44c85SBarry Smith       if (aa[j] != 0.0) {
155b3a44c85SBarry Smith         rows[cnt++] = i;
156b3a44c85SBarry Smith         break;
157b3a44c85SBarry Smith       }
158b3a44c85SBarry Smith     }
159b3a44c85SBarry Smith   }
1609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1619566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
1623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
163b3a44c85SBarry Smith }
164b3a44c85SBarry Smith 
165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
166d71ae5a4SJacob Faibussowitsch {
16779299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)Y->data;
16899e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16999e65526SBarry Smith   const PetscInt    *diag;
1702e5835c6SStefano Zampini   MatScalar         *aa;
17199e65526SBarry Smith   const PetscScalar *v;
172ace3abfcSBarry Smith   PetscBool          missing;
17379299369SBarry Smith 
17479299369SBarry Smith   PetscFunctionBegin;
17509f38230SBarry Smith   if (Y->assembled) {
1769566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL));
17709f38230SBarry Smith     if (!missing) {
17879299369SBarry Smith       diag = aij->diag;
1799566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1809566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
18179299369SBarry Smith       if (is == INSERT_VALUES) {
182ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
18379299369SBarry Smith       } else {
184ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
18579299369SBarry Smith       }
1869566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1879566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
1883ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
18979299369SBarry Smith     }
1909566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
19109f38230SBarry Smith   }
1929566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
1933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
19409f38230SBarry Smith }
19579299369SBarry Smith 
196d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
197d71ae5a4SJacob Faibussowitsch {
198416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19997f1f81fSBarry Smith   PetscInt    i, ishift;
20017ab2063SBarry Smith 
2013a40ed3dSBarry Smith   PetscFunctionBegin;
202f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
2033ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
204bfeeae90SHong Zhang   ishift = 0;
205b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
2069566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
207bfeeae90SHong Zhang   } else if (oshift == 1) {
2081a83f524SJed Brown     PetscInt *tia;
209d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2103b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2119566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2121a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2131a83f524SJed Brown     *ia = tia;
214ecc77c7aSBarry Smith     if (ja) {
2151a83f524SJed Brown       PetscInt *tja;
2169566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2171a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2181a83f524SJed Brown       *ja = tja;
219ecc77c7aSBarry Smith     }
2206945ee14SBarry Smith   } else {
221ecc77c7aSBarry Smith     *ia = a->i;
222ecc77c7aSBarry Smith     if (ja) *ja = a->j;
223a2ce50c7SBarry Smith   }
2243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225a2744918SBarry Smith }
226a2744918SBarry Smith 
227d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
228d71ae5a4SJacob Faibussowitsch {
2293a40ed3dSBarry Smith   PetscFunctionBegin;
2303ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
231b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2329566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2339566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
234bcd2baecSBarry Smith   }
2353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23617ab2063SBarry Smith }
23717ab2063SBarry Smith 
238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
239d71ae5a4SJacob Faibussowitsch {
2403b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
241d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
24297f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2433b2fbd54SBarry Smith 
2443a40ed3dSBarry Smith   PetscFunctionBegin;
245899cda47SBarry Smith   *nn = n;
2463ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2473b2fbd54SBarry Smith   if (symmetric) {
2489566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2493b2fbd54SBarry Smith   } else {
2509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2529566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2533b2fbd54SBarry Smith     jj = a->j;
254ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2553b2fbd54SBarry Smith     cia[0] = oshift;
256ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2579566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2583b2fbd54SBarry Smith     jj = a->j;
259a93ec695SBarry Smith     for (row = 0; row < m; row++) {
260a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
261a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
262bfeeae90SHong Zhang         col = *jj++;
2632205254eSKarl Rupp 
2643b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2653b2fbd54SBarry Smith       }
2663b2fbd54SBarry Smith     }
2679566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2689371c9d4SSatish Balay     *ia = cia;
2699371c9d4SSatish Balay     *ja = cja;
2703b2fbd54SBarry Smith   }
2713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2723b2fbd54SBarry Smith }
2733b2fbd54SBarry Smith 
274d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
275d71ae5a4SJacob Faibussowitsch {
2763a40ed3dSBarry Smith   PetscFunctionBegin;
2773ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2783b2fbd54SBarry Smith 
2799566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2809566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2813ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2823b2fbd54SBarry Smith }
2833b2fbd54SBarry Smith 
2847cee066cSHong Zhang /*
2857cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2867cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
287040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2887cee066cSHong Zhang */
289d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
290d71ae5a4SJacob Faibussowitsch {
2917cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2927cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
293071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2947cee066cSHong Zhang   PetscInt       *cspidx;
295071fcb05SBarry Smith   const PetscInt *jj;
2967cee066cSHong Zhang 
2977cee066cSHong Zhang   PetscFunctionBegin;
2987cee066cSHong Zhang   *nn = n;
2993ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
300625f6d37SHong Zhang 
3019566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
3029566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
3039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
3049566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
3057cee066cSHong Zhang   jj = a->j;
306ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
3077cee066cSHong Zhang   cia[0] = oshift;
308ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3099566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3107cee066cSHong Zhang   jj = a->j;
3117cee066cSHong Zhang   for (row = 0; row < m; row++) {
3127cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3137cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3147cee066cSHong Zhang       col         = *jj++;
315071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
316071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
317071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3187cee066cSHong Zhang     }
3197cee066cSHong Zhang   }
3209566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
321071fcb05SBarry Smith   *ia    = cia;
322071fcb05SBarry Smith   *ja    = cja;
3237cee066cSHong Zhang   *spidx = cspidx;
3243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3257cee066cSHong Zhang }
3267cee066cSHong Zhang 
327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
328d71ae5a4SJacob Faibussowitsch {
3297cee066cSHong Zhang   PetscFunctionBegin;
3309566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3319566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3337cee066cSHong Zhang }
3347cee066cSHong Zhang 
335ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
336d71ae5a4SJacob Faibussowitsch {
33787d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33887d4246cSBarry Smith   PetscInt    *ai = a->i;
339fff043a9SJunchao Zhang   PetscScalar *aa;
34087d4246cSBarry Smith 
34187d4246cSBarry Smith   PetscFunctionBegin;
3429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3439566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34687d4246cSBarry Smith }
34787d4246cSBarry Smith 
348bd04181cSBarry Smith /*
349bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
350bd04181cSBarry Smith 
351bd04181cSBarry Smith       -   a single row of values is set with each call
352bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
353bd04181cSBarry Smith       -   the values are always added to the matrix, not set
354bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
355bd04181cSBarry Smith 
3561f763a69SBarry Smith      This does NOT assume the global column indices are sorted
357bd04181cSBarry Smith 
3581f763a69SBarry Smith */
359bd04181cSBarry Smith 
360af0996ceSBarry Smith #include <petsc/private/isimpl.h>
361d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
362d71ae5a4SJacob Faibussowitsch {
363189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3641f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3651f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3661f763a69SBarry Smith   PetscInt        lastcol = -1;
367fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
368189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
369189e4007SBarry Smith 
370fff043a9SJunchao Zhang   PetscFunctionBegin;
3719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
372f38dd0b8SBarry Smith   row  = ridx[im[0]];
3731f763a69SBarry Smith   rp   = aj + ai[row];
3741f763a69SBarry Smith   ap   = aa + ai[row];
3751f763a69SBarry Smith   nrow = ailen[row];
376189e4007SBarry Smith   low  = 0;
377189e4007SBarry Smith   high = nrow;
378189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
379189e4007SBarry Smith     col   = cidx[in[l]];
380f38dd0b8SBarry Smith     value = v[l];
381189e4007SBarry Smith 
382189e4007SBarry Smith     if (col <= lastcol) low = 0;
383189e4007SBarry Smith     else high = nrow;
384189e4007SBarry Smith     lastcol = col;
385189e4007SBarry Smith     while (high - low > 5) {
386189e4007SBarry Smith       t = (low + high) / 2;
387189e4007SBarry Smith       if (rp[t] > col) high = t;
388189e4007SBarry Smith       else low = t;
389189e4007SBarry Smith     }
390189e4007SBarry Smith     for (i = low; i < high; i++) {
391189e4007SBarry Smith       if (rp[i] == col) {
3921f763a69SBarry Smith         ap[i] += value;
393189e4007SBarry Smith         low = i + 1;
3941f763a69SBarry Smith         break;
395189e4007SBarry Smith       }
396189e4007SBarry Smith     }
397189e4007SBarry Smith   }
3989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3993ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
400189e4007SBarry Smith }
401189e4007SBarry Smith 
402d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
403d71ae5a4SJacob Faibussowitsch {
404416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
405e2ee6c50SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
40697f1f81fSBarry Smith   PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
407e2ee6c50SBarry Smith   PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1;
408ce496241SStefano Zampini   MatScalar  *ap = NULL, value = 0.0, *aa;
409ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
410ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
41117ab2063SBarry Smith 
4123a40ed3dSBarry Smith   PetscFunctionBegin;
4139566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
41417ab2063SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
415416022c9SBarry Smith     row = im[k];
4165ef9f2a5SBarry Smith     if (row < 0) continue;
4176bdcaf15SBarry Smith     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
4188e3a54c0SPierre Jolivet     rp = PetscSafePointerPlusOffset(aj, ai[row]);
4198e3a54c0SPierre Jolivet     if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]);
4209371c9d4SSatish Balay     rmax = imax[row];
4219371c9d4SSatish Balay     nrow = ailen[row];
422416022c9SBarry Smith     low  = 0;
423c71e6ed7SBarry Smith     high = nrow;
42417ab2063SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
4255ef9f2a5SBarry Smith       if (in[l] < 0) continue;
4266bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
427bfeeae90SHong Zhang       col = in[l];
428071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
429071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
43036db0b34SBarry Smith 
4312205254eSKarl Rupp       if (col <= lastcol) low = 0;
4322205254eSKarl Rupp       else high = nrow;
433e2ee6c50SBarry Smith       lastcol = col;
434416022c9SBarry Smith       while (high - low > 5) {
435416022c9SBarry Smith         t = (low + high) / 2;
436416022c9SBarry Smith         if (rp[t] > col) high = t;
437416022c9SBarry Smith         else low = t;
43817ab2063SBarry Smith       }
439416022c9SBarry Smith       for (i = low; i < high; i++) {
44017ab2063SBarry Smith         if (rp[i] > col) break;
44117ab2063SBarry Smith         if (rp[i] == col) {
442876c6284SHong Zhang           if (!A->structure_only) {
4430c0d7e18SFande Kong             if (is == ADD_VALUES) {
4440c0d7e18SFande Kong               ap[i] += value;
4450c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4469371c9d4SSatish Balay             } else ap[i] = value;
447720833daSHong Zhang           }
448e44c0bd4SBarry Smith           low = i + 1;
44917ab2063SBarry Smith           goto noinsert;
45017ab2063SBarry Smith         }
45117ab2063SBarry Smith       }
452dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
453c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
45408401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
455720833daSHong Zhang       if (A->structure_only) {
456876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
457720833daSHong Zhang       } else {
458fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
459720833daSHong Zhang       }
4609371c9d4SSatish Balay       N = nrow++ - 1;
4619371c9d4SSatish Balay       a->nz++;
4629371c9d4SSatish Balay       high++;
463416022c9SBarry Smith       /* shift up all the later entries in this row */
4649566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
46517ab2063SBarry Smith       rp[i] = col;
466580bdb30SBarry Smith       if (!A->structure_only) {
4679566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
468580bdb30SBarry Smith         ap[i] = value;
469580bdb30SBarry Smith       }
470416022c9SBarry Smith       low = i + 1;
471e44c0bd4SBarry Smith     noinsert:;
47217ab2063SBarry Smith     }
47317ab2063SBarry Smith     ailen[row] = nrow;
47417ab2063SBarry Smith   }
4759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
4763ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
47717ab2063SBarry Smith }
47817ab2063SBarry Smith 
479ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
480d71ae5a4SJacob Faibussowitsch {
48119b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
48219b08ed1SBarry Smith   PetscInt   *rp, k, row;
48319b08ed1SBarry Smith   PetscInt   *ai = a->i;
48419b08ed1SBarry Smith   PetscInt   *aj = a->j;
485fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
48619b08ed1SBarry Smith 
48719b08ed1SBarry Smith   PetscFunctionBegin;
48828b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
48908401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
490fff043a9SJunchao Zhang 
4919566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
49219b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
49319b08ed1SBarry Smith     row = im[k];
49419b08ed1SBarry Smith     rp  = aj + ai[row];
4958e3a54c0SPierre Jolivet     ap  = PetscSafePointerPlusOffset(aa, ai[row]);
49619b08ed1SBarry Smith 
4979566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
49819b08ed1SBarry Smith     if (!A->structure_only) {
49919b08ed1SBarry Smith       if (v) {
5009566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
50119b08ed1SBarry Smith         v += n;
50219b08ed1SBarry Smith       } else {
5039566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
50419b08ed1SBarry Smith       }
50519b08ed1SBarry Smith     }
50619b08ed1SBarry Smith     a->ilen[row]  = n;
50719b08ed1SBarry Smith     a->imax[row]  = n;
50819b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
50919b08ed1SBarry Smith     a->nz += n;
51019b08ed1SBarry Smith   }
5119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51319b08ed1SBarry Smith }
51419b08ed1SBarry Smith 
51519b08ed1SBarry Smith /*@
51619b08ed1SBarry Smith   MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51719b08ed1SBarry Smith 
51819b08ed1SBarry Smith   Input Parameters:
51911a5261eSBarry Smith + A       - the `MATSEQAIJ` matrix
52019b08ed1SBarry Smith - nztotal - bound on the number of nonzeros
52119b08ed1SBarry Smith 
52219b08ed1SBarry Smith   Level: advanced
52319b08ed1SBarry Smith 
52419b08ed1SBarry Smith   Notes:
52519b08ed1SBarry Smith   This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
52611a5261eSBarry Smith   Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52719b08ed1SBarry Smith   as always with multiple matrix assemblies.
52819b08ed1SBarry Smith 
5291cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
53019b08ed1SBarry Smith @*/
531d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
532d71ae5a4SJacob Faibussowitsch {
53319b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
53419b08ed1SBarry Smith 
53519b08ed1SBarry Smith   PetscFunctionBegin;
5369566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5379566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
53819b08ed1SBarry Smith   a->maxnz = nztotal;
5394dfa11a4SJacob Faibussowitsch   if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); }
54019b08ed1SBarry Smith   if (!a->ilen) {
5419566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
54219b08ed1SBarry Smith   } else {
5439566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
54419b08ed1SBarry Smith   }
54519b08ed1SBarry Smith 
54619b08ed1SBarry Smith   /* allocate the matrix space */
5479f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i));
5489f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j));
5499f0612e4SBarry Smith   a->free_ij = PETSC_TRUE;
55019b08ed1SBarry Smith   if (A->structure_only) {
55119b08ed1SBarry Smith     a->free_a = PETSC_FALSE;
55219b08ed1SBarry Smith   } else {
5539f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a));
55419b08ed1SBarry Smith     a->free_a = PETSC_TRUE;
55519b08ed1SBarry Smith   }
5569f0612e4SBarry Smith   a->i[0]           = 0;
55719b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
55819b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
5593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
56019b08ed1SBarry Smith }
56119b08ed1SBarry Smith 
562ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
563d71ae5a4SJacob Faibussowitsch {
564071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
565071fcb05SBarry Smith   PetscInt   *rp, k, row;
566071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
567071fcb05SBarry Smith   PetscInt   *aj = a->j;
568fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
569071fcb05SBarry Smith 
570071fcb05SBarry Smith   PetscFunctionBegin;
5719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
572071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
573071fcb05SBarry Smith     row = im[k];
5746bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
575071fcb05SBarry Smith     rp = aj + ai[row];
576071fcb05SBarry Smith     ap = aa + ai[row];
57748a46eb9SPierre Jolivet     if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
578071fcb05SBarry Smith     if (!A->structure_only) {
579071fcb05SBarry Smith       if (v) {
5809566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
581071fcb05SBarry Smith         v += n;
582071fcb05SBarry Smith       } else {
5839566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
584071fcb05SBarry Smith       }
585071fcb05SBarry Smith     }
586071fcb05SBarry Smith     ailen[row] = n;
587071fcb05SBarry Smith     a->nz += n;
588071fcb05SBarry Smith   }
5899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
591071fcb05SBarry Smith }
592071fcb05SBarry Smith 
593ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
594d71ae5a4SJacob Faibussowitsch {
5957eb43aa7SLois Curfman McInnes   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
59697f1f81fSBarry Smith   PetscInt        *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
59797f1f81fSBarry Smith   PetscInt        *ai = a->i, *ailen = a->ilen;
5984e208921SJed Brown   const MatScalar *ap, *aa;
5997eb43aa7SLois Curfman McInnes 
6003a40ed3dSBarry Smith   PetscFunctionBegin;
6014e208921SJed Brown   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
6027eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6037eb43aa7SLois Curfman McInnes     row = im[k];
6049371c9d4SSatish Balay     if (row < 0) {
6059371c9d4SSatish Balay       v += n;
6069371c9d4SSatish Balay       continue;
6079371c9d4SSatish Balay     } /* negative row */
60854c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6098e3a54c0SPierre Jolivet     rp   = PetscSafePointerPlusOffset(aj, ai[row]);
6108e3a54c0SPierre Jolivet     ap   = PetscSafePointerPlusOffset(aa, ai[row]);
6117eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6127eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6139371c9d4SSatish Balay       if (in[l] < 0) {
6149371c9d4SSatish Balay         v++;
6159371c9d4SSatish Balay         continue;
6169371c9d4SSatish Balay       } /* negative column */
61754c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
618bfeeae90SHong Zhang       col  = in[l];
6199371c9d4SSatish Balay       high = nrow;
6209371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6217eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6227eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6237eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6247eb43aa7SLois Curfman McInnes         else low = t;
6257eb43aa7SLois Curfman McInnes       }
6267eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6277eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6287eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
629b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6307eb43aa7SLois Curfman McInnes           goto finished;
6317eb43aa7SLois Curfman McInnes         }
6327eb43aa7SLois Curfman McInnes       }
63397e567efSBarry Smith       *v++ = 0.0;
6347eb43aa7SLois Curfman McInnes     finished:;
6357eb43aa7SLois Curfman McInnes     }
6367eb43aa7SLois Curfman McInnes   }
6374e208921SJed Brown   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
6383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6397eb43aa7SLois Curfman McInnes }
6407eb43aa7SLois Curfman McInnes 
641ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
642d71ae5a4SJacob Faibussowitsch {
6433ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
644c898d852SStefano Zampini   const PetscScalar *av;
6453ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6463ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
64717ab2063SBarry Smith 
6483a40ed3dSBarry Smith   PetscFunctionBegin;
6499566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6502205254eSKarl Rupp 
6513ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6523ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6533ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6543ea6fe3dSLisandro Dalcin   nz = A->nz;
655416022c9SBarry Smith 
6563ea6fe3dSLisandro Dalcin   /* write matrix header */
6573ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6589371c9d4SSatish Balay   header[1] = M;
6599371c9d4SSatish Balay   header[2] = N;
6609371c9d4SSatish Balay   header[3] = nz;
6619566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
662416022c9SBarry Smith 
6633ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6649566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6653ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
6669566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6679566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6683ea6fe3dSLisandro Dalcin   /* store column indices */
6699566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
670416022c9SBarry Smith   /* store nonzero values */
6719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6729566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6739566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
674b37d52dbSMark F. Adams 
6753ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6769566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
67817ab2063SBarry Smith }
679416022c9SBarry Smith 
680d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
681d71ae5a4SJacob Faibussowitsch {
6827dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6837dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6847dc0baabSHong Zhang 
6857dc0baabSHong Zhang   PetscFunctionBegin;
6869566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6877dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6889566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
68948a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6909566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6917dc0baabSHong Zhang   }
6929566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
6933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6947dc0baabSHong Zhang }
6957dc0baabSHong Zhang 
69609573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer);
697cd155464SBarry Smith 
698ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
699d71ae5a4SJacob Faibussowitsch {
700416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
701c898d852SStefano Zampini   const PetscScalar *av;
70260e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
703e060cb09SBarry Smith   const char        *name;
704f3ef73ceSBarry Smith   PetscViewerFormat  format;
70517ab2063SBarry Smith 
7063a40ed3dSBarry Smith   PetscFunctionBegin;
7077dc0baabSHong Zhang   if (A->structure_only) {
7089566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7093ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
7107dc0baabSHong Zhang   }
71143e49210SHong Zhang 
7129566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
713bd6a2ce3SJunchao Zhang   // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries
7143ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
7152e5835c6SStefano Zampini 
716c898d852SStefano Zampini   /* trigger copy to CPU if needed */
7179566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7189566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
71971c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
72097f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
72160e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
722c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
723d00d2cf4SBarry Smith       nofinalvalue = 1;
724d00d2cf4SBarry Smith     }
7259566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7269566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7279566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
728fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7299566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
730fbfe6fa7SJed Brown #else
7319566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
732fbfe6fa7SJed Brown #endif
7339566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
73417ab2063SBarry Smith 
73517ab2063SBarry Smith     for (i = 0; i < m; i++) {
73660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
737aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7389566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
73917ab2063SBarry Smith #else
7409566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
74117ab2063SBarry Smith #endif
74217ab2063SBarry Smith       }
74317ab2063SBarry Smith     }
744d00d2cf4SBarry Smith     if (nofinalvalue) {
745c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7469566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
747c337ccceSJed Brown #else
7489566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
749c337ccceSJed Brown #endif
750d00d2cf4SBarry Smith     }
7519566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7529566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7539566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
754fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
7559566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
75644cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7579566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
75860e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
759aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
76036db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7619566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76236db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7639566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
76436db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7659566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7666831982aSBarry Smith         }
76744cd7ae7SLois Curfman McInnes #else
7689566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
76944cd7ae7SLois Curfman McInnes #endif
77044cd7ae7SLois Curfman McInnes       }
7719566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77244cd7ae7SLois Curfman McInnes     }
7739566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
774fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
77597f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7769566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7779566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
778496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
779496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
78060e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
781496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
782aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78336db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
784496be53dSLois Curfman McInnes #else
785496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
786496be53dSLois Curfman McInnes #endif
787496be53dSLois Curfman McInnes         }
788496be53dSLois Curfman McInnes       }
789496be53dSLois Curfman McInnes     }
7902e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7919566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
7922e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7932205254eSKarl Rupp       if (i + 4 < m) {
7949566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
7952205254eSKarl Rupp       } else if (i + 3 < m) {
7969566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
7972205254eSKarl Rupp       } else if (i + 2 < m) {
7989566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
7992205254eSKarl Rupp       } else if (i + 1 < m) {
8009566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
8012205254eSKarl Rupp       } else if (i < m) {
8029566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8032205254eSKarl Rupp       } else {
8049566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8052205254eSKarl Rupp       }
806496be53dSLois Curfman McInnes     }
8079566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8089566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
809496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81060e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8119566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
812496be53dSLois Curfman McInnes       }
8139566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
814496be53dSLois Curfman McInnes     }
8159566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
816496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81760e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
818496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
819aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
82048a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
821496be53dSLois Curfman McInnes #else
8229566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
823496be53dSLois Curfman McInnes #endif
824496be53dSLois Curfman McInnes         }
825496be53dSLois Curfman McInnes       }
8269566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
827496be53dSLois Curfman McInnes     }
8289566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
829fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
83097f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
83187828ca2SBarry Smith     PetscScalar value;
83268f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83368f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
83468f1ed48SBarry Smith 
83568f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
83668f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
83768f1ed48SBarry Smith         realonly = PETSC_FALSE;
83868f1ed48SBarry Smith         break;
83968f1ed48SBarry Smith       }
84068f1ed48SBarry Smith     }
84168f1ed48SBarry Smith #endif
84202594712SBarry Smith 
8439566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
84402594712SBarry Smith     for (i = 0; i < m; i++) {
84502594712SBarry Smith       jcnt = 0;
846d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
847e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
84802594712SBarry Smith           value = a->a[cnt++];
849e24b481bSBarry Smith           jcnt++;
85002594712SBarry Smith         } else {
85102594712SBarry Smith           value = 0.0;
85202594712SBarry Smith         }
853aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
85468f1ed48SBarry Smith         if (realonly) {
8559566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
85668f1ed48SBarry Smith         } else {
8579566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
85868f1ed48SBarry Smith         }
85902594712SBarry Smith #else
8609566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
86102594712SBarry Smith #endif
86202594712SBarry Smith       }
8639566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
86402594712SBarry Smith     }
8659566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8663c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
867150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8689566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8693c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8709566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8713c215bfdSMatthew Knepley #else
8729566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8733c215bfdSMatthew Knepley #endif
8749566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8753c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
87660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8773c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8789566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8793c215bfdSMatthew Knepley #else
8809566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8813c215bfdSMatthew Knepley #endif
8823c215bfdSMatthew Knepley       }
8833c215bfdSMatthew Knepley     }
8849566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8853a40ed3dSBarry Smith   } else {
8869566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
887d5f3da31SBarry Smith     if (A->factortype) {
88816cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8899566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
89016cd7e1dSShri Abhyankar         /* L part */
89160e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
89316cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
8949566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
89516cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
8969566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
89716cd7e1dSShri Abhyankar           } else {
8989566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
89916cd7e1dSShri Abhyankar           }
90016cd7e1dSShri Abhyankar #else
9019566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90216cd7e1dSShri Abhyankar #endif
90316cd7e1dSShri Abhyankar         }
90416cd7e1dSShri Abhyankar         /* diagonal */
90516cd7e1dSShri Abhyankar         j = a->diag[i];
90616cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
90716cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
9089566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j])));
90916cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9109566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j]))));
91116cd7e1dSShri Abhyankar         } else {
9129566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j])));
91316cd7e1dSShri Abhyankar         }
91416cd7e1dSShri Abhyankar #else
9159566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j])));
91616cd7e1dSShri Abhyankar #endif
91716cd7e1dSShri Abhyankar 
91816cd7e1dSShri Abhyankar         /* U part */
91960e0710aSBarry Smith         for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
92016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
92116cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9229566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
92316cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9249566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
92516cd7e1dSShri Abhyankar           } else {
9269566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
92716cd7e1dSShri Abhyankar           }
92816cd7e1dSShri Abhyankar #else
9299566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
93016cd7e1dSShri Abhyankar #endif
93116cd7e1dSShri Abhyankar         }
9329566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
93316cd7e1dSShri Abhyankar       }
93416cd7e1dSShri Abhyankar     } else {
93517ab2063SBarry Smith       for (i = 0; i < m; i++) {
9369566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
93760e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
938aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
93936db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9409566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
94136db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9429566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9433a40ed3dSBarry Smith           } else {
9449566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
94517ab2063SBarry Smith           }
94617ab2063SBarry Smith #else
9479566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
94817ab2063SBarry Smith #endif
94917ab2063SBarry Smith         }
9509566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
95117ab2063SBarry Smith       }
95216cd7e1dSShri Abhyankar     }
9539566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
95417ab2063SBarry Smith   }
9559566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
957416022c9SBarry Smith }
958416022c9SBarry Smith 
9599804daf3SBarry Smith #include <petscdraw.h>
960ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
961d71ae5a4SJacob Faibussowitsch {
962480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
963416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
964383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
965383922c3SLisandro Dalcin   int                color;
966b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
967b0a32e0cSBarry Smith   PetscViewer        viewer;
968f3ef73ceSBarry Smith   PetscViewerFormat  format;
969fff043a9SJunchao Zhang   const PetscScalar *aa;
970cddf8d76SBarry Smith 
9713a40ed3dSBarry Smith   PetscFunctionBegin;
9729566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9739566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9749566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
975383922c3SLisandro Dalcin 
976416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
978fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
979d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9800513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
981b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
982416022c9SBarry Smith     for (i = 0; i < m; i++) {
9839371c9d4SSatish Balay       y_l = m - i - 1.0;
9849371c9d4SSatish Balay       y_r = y_l + 1.0;
985bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9869371c9d4SSatish Balay         x_l = a->j[j];
9879371c9d4SSatish Balay         x_r = x_l + 1.0;
988fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9899566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
990cddf8d76SBarry Smith       }
991cddf8d76SBarry Smith     }
992b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
993cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
9949371c9d4SSatish Balay       y_l = m - i - 1.0;
9959371c9d4SSatish Balay       y_r = y_l + 1.0;
996bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9979371c9d4SSatish Balay         x_l = a->j[j];
9989371c9d4SSatish Balay         x_r = x_l + 1.0;
999fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
10009566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1001cddf8d76SBarry Smith       }
1002cddf8d76SBarry Smith     }
1003b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1004cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10059371c9d4SSatish Balay       y_l = m - i - 1.0;
10069371c9d4SSatish Balay       y_r = y_l + 1.0;
1007bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10089371c9d4SSatish Balay         x_l = a->j[j];
10099371c9d4SSatish Balay         x_r = x_l + 1.0;
1010fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10119566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1012416022c9SBarry Smith       }
1013416022c9SBarry Smith     }
1014d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10150513a670SBarry Smith   } else {
10160513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10170513a670SBarry Smith     /* first determine max of all nonzero values */
1018b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1019383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1020b0a32e0cSBarry Smith     PetscDraw popup;
10210513a670SBarry Smith 
10220513a670SBarry Smith     for (i = 0; i < nz; i++) {
1023fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10240513a670SBarry Smith     }
1025383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10269566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10279566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1028383922c3SLisandro Dalcin 
1029d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10300513a670SBarry Smith     for (i = 0; i < m; i++) {
1031383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1032383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1033bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1034383922c3SLisandro Dalcin         x_l   = a->j[j];
1035383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1036fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10379566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10380513a670SBarry Smith         count++;
10390513a670SBarry Smith       }
10400513a670SBarry Smith     }
1041d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10420513a670SBarry Smith   }
10439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
10443ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1045480ef9eaSBarry Smith }
1046cddf8d76SBarry Smith 
10479804daf3SBarry Smith #include <petscdraw.h>
1048ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1049d71ae5a4SJacob Faibussowitsch {
1050b0a32e0cSBarry Smith   PetscDraw draw;
105136db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1052ace3abfcSBarry Smith   PetscBool isnull;
1053480ef9eaSBarry Smith 
1054480ef9eaSBarry Smith   PetscFunctionBegin;
10559566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10569566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
10573ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
1058480ef9eaSBarry Smith 
10599371c9d4SSatish Balay   xr = A->cmap->n;
10609371c9d4SSatish Balay   yr = A->rmap->n;
10619371c9d4SSatish Balay   h  = yr / 10.0;
10629371c9d4SSatish Balay   w  = xr / 10.0;
10639371c9d4SSatish Balay   xr += w;
10649371c9d4SSatish Balay   yr += h;
10659371c9d4SSatish Balay   xl = -w;
10669371c9d4SSatish Balay   yl = -h;
10679566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10689566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10699566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10709566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10719566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1073416022c9SBarry Smith }
1074416022c9SBarry Smith 
1075d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1076d71ae5a4SJacob Faibussowitsch {
1077ace3abfcSBarry Smith   PetscBool iascii, isbinary, isdraw;
1078416022c9SBarry Smith 
10793a40ed3dSBarry Smith   PetscFunctionBegin;
10809566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii));
10819566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10829566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10831baa6e33SBarry Smith   if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10841baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10851baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10869566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10873ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
108817ab2063SBarry Smith }
108919bcc07fSBarry Smith 
1090d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1091d71ae5a4SJacob Faibussowitsch {
1092416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1093580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
1094bc43efbbSJunchao Zhang   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0, n;
109554f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
10963447b6efSHong Zhang   PetscReal   ratio = 0.6;
109717ab2063SBarry Smith 
10983a40ed3dSBarry Smith   PetscFunctionBegin;
10993ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
11009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
1101b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
1102b215bc84SStefano Zampini     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */
11039566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11043ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1105b215bc84SStefano Zampini   }
110617ab2063SBarry Smith 
110743ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
110817ab2063SBarry Smith   for (i = 1; i < m; i++) {
1109416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
111017ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
111194a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111217ab2063SBarry Smith     if (fshift) {
1113bfeeae90SHong Zhang       ip = aj + ai[i];
1114bfeeae90SHong Zhang       ap = aa + ai[i];
111517ab2063SBarry Smith       N  = ailen[i];
11169566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
111748a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
111817ab2063SBarry Smith     }
111917ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
112017ab2063SBarry Smith   }
112117ab2063SBarry Smith   if (m) {
112217ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112317ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
112417ab2063SBarry Smith   }
112517ab2063SBarry Smith   /* reset ilen and imax for each row */
11267b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1127396832f4SHong Zhang   if (A->structure_only) {
11289566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11299566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1130396832f4SHong Zhang   } else { /* !A->structure_only */
113117ab2063SBarry Smith     for (i = 0; i < m; i++) {
113217ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11337b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
113417ab2063SBarry Smith     }
1135396832f4SHong Zhang   }
1136bfeeae90SHong Zhang   a->nz = ai[m];
1137aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
1138bc43efbbSJunchao Zhang   PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly
1139bc43efbbSJunchao Zhang   a->diagonaldense = PETSC_TRUE;
1140bc43efbbSJunchao Zhang   n                = PetscMin(A->rmap->n, A->cmap->n);
1141bc43efbbSJunchao Zhang   for (i = 0; i < n; i++) {
1142bc43efbbSJunchao Zhang     if (a->diag[i] >= ai[i + 1]) {
1143bc43efbbSJunchao Zhang       a->diagonaldense = PETSC_FALSE;
1144bc43efbbSJunchao Zhang       break;
1145bc43efbbSJunchao Zhang     }
1146bc43efbbSJunchao Zhang   }
11479566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11489566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11499566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11502205254eSKarl Rupp 
11518e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1152dd5f02e7SSatish Balay   a->reallocs         = 0;
11536712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
115436db0b34SBarry Smith   a->rmax             = rmax;
11554e220ebcSLois Curfman McInnes 
115648a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11579566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11583ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
115917ab2063SBarry Smith }
116017ab2063SBarry Smith 
1161ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1162d71ae5a4SJacob Faibussowitsch {
116399cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
116499cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11652e5835c6SStefano Zampini   MatScalar  *aa;
116699cafbc1SBarry Smith 
116799cafbc1SBarry Smith   PetscFunctionBegin;
11689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
116999cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
117399cafbc1SBarry Smith }
117499cafbc1SBarry Smith 
1175ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1176d71ae5a4SJacob Faibussowitsch {
117799cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
117899cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11792e5835c6SStefano Zampini   MatScalar  *aa;
118099cafbc1SBarry Smith 
118199cafbc1SBarry Smith   PetscFunctionBegin;
11829566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
118399cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11859566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11863ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
118799cafbc1SBarry Smith }
118899cafbc1SBarry Smith 
1189d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1190d71ae5a4SJacob Faibussowitsch {
1191fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1192fff043a9SJunchao Zhang   MatScalar  *aa;
11933a40ed3dSBarry Smith 
11943a40ed3dSBarry Smith   PetscFunctionBegin;
11959566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
11969566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
11979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
11989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11993ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
120017ab2063SBarry Smith }
1201416022c9SBarry Smith 
1202d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1203d71ae5a4SJacob Faibussowitsch {
1204416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1205d5d45c9bSBarry Smith 
12063a40ed3dSBarry Smith   PetscFunctionBegin;
1207b4e2f619SBarry Smith   if (A->hash_active) {
1208e3c72094SPierre Jolivet     A->ops[0] = a->cops;
1209b4e2f619SBarry Smith     PetscCall(PetscHMapIJVDestroy(&a->ht));
1210b4e2f619SBarry Smith     PetscCall(PetscFree(a->dnz));
1211b4e2f619SBarry Smith     A->hash_active = PETSC_FALSE;
1212b4e2f619SBarry Smith   }
1213b4e2f619SBarry Smith 
12143ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz));
12159566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12169566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12179566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12189566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12199566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12209566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12219566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12229566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12239566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12249566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12259566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12269566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
12279566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12289566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
12299566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1230901853e0SKris Buschelman 
12316718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12326718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12336718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12346718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12356718818eSStefano Zampini      due to different matrix sizes */
12369566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12376718818eSStefano Zampini 
12389566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12392e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12402e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12459566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12469566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12472e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12482e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12492e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12502e956fe4SStefano Zampini #endif
12514222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12549566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12554222ddf1SHong Zhang #endif
1256d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
1257d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL));
1258d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL));
1259d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL));
1260d5e393b6SSuyash Tandon #endif
12613d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12629566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12633d0639e7SStefano Zampini #endif
12649566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1265af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12669566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1267af8000cdSHong Zhang #endif
1268d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
12699566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1270d24d4204SJose E. Roman #endif
127163c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12729566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12739566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
127463c07aadSStefano Zampini #endif
12759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
12779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
12789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
12792e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
12809566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
12819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
12829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
12839566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
12849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
12859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
12869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
12879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
12889566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
12899566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
12902e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
12912e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
12922e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
12932e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
12942e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
12952e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
12962e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
12973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
129817ab2063SBarry Smith }
129917ab2063SBarry Smith 
1300d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1301d71ae5a4SJacob Faibussowitsch {
1302416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
13033a40ed3dSBarry Smith 
13043a40ed3dSBarry Smith   PetscFunctionBegin;
1305a65d3064SKris Buschelman   switch (op) {
1306d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1307d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1308d71ae5a4SJacob Faibussowitsch     break;
1309d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1310d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1311d71ae5a4SJacob Faibussowitsch     break;
1312d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1313d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1314d71ae5a4SJacob Faibussowitsch     break;
1315d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1316d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1317d71ae5a4SJacob Faibussowitsch     break;
1318d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1319d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1320d71ae5a4SJacob Faibussowitsch     break;
1321d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1322d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1323d71ae5a4SJacob Faibussowitsch     break;
1324d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1325d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1326d71ae5a4SJacob Faibussowitsch     break;
13273d472b54SHong Zhang   case MAT_SPD:
1328b1646e73SJed Brown   case MAT_SYMMETRIC:
1329b1646e73SJed Brown   case MAT_STRUCTURALLY_SYMMETRIC:
1330b1646e73SJed Brown   case MAT_HERMITIAN:
1331b1646e73SJed Brown   case MAT_SYMMETRY_ETERNAL:
1332957cac9fSHong Zhang   case MAT_STRUCTURE_ONLY:
1333b94d7dedSBarry Smith   case MAT_STRUCTURAL_SYMMETRY_ETERNAL:
1334b94d7dedSBarry Smith   case MAT_SPD_ETERNAL:
1335b94d7dedSBarry Smith     /* if the diagonal matrix is square it inherits some of the properties above */
13365021d80fSJed Brown     break;
13378c78258cSHong Zhang   case MAT_FORCE_DIAGONAL_ENTRIES:
1338a65d3064SKris Buschelman   case MAT_IGNORE_OFF_PROC_ENTRIES:
1339d71ae5a4SJacob Faibussowitsch   case MAT_USE_HASH_TABLE:
1340d71ae5a4SJacob Faibussowitsch     PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op]));
1341d71ae5a4SJacob Faibussowitsch     break;
1342d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1343d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1344d71ae5a4SJacob Faibussowitsch     break;
1345d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1346d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1347d71ae5a4SJacob Faibussowitsch     break;
1348071fcb05SBarry Smith   case MAT_SORTED_FULL:
1349071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1350071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1351071fcb05SBarry Smith     break;
1352d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1353d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1354d71ae5a4SJacob Faibussowitsch     break;
1355d71ae5a4SJacob Faibussowitsch   default:
1356d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op);
1357a65d3064SKris Buschelman   }
13583ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
135917ab2063SBarry Smith }
136017ab2063SBarry Smith 
1361ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1362d71ae5a4SJacob Faibussowitsch {
1363416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1364fdc842d1SBarry Smith   PetscInt           i, j, n, *ai = a->i, *aj = a->j;
1365c898d852SStefano Zampini   PetscScalar       *x;
1366c898d852SStefano Zampini   const PetscScalar *aa;
136717ab2063SBarry Smith 
13683a40ed3dSBarry Smith   PetscFunctionBegin;
13699566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
137008401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13719566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1372d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1373d3e70bfaSHong Zhang     PetscInt *diag = a->diag;
13749566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
13752c990fa1SHong Zhang     for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13769566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13779566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13783ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
137935e7444dSHong Zhang   }
138035e7444dSHong Zhang 
13819566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
138235e7444dSHong Zhang   for (i = 0; i < n; i++) {
1383fdc842d1SBarry Smith     x[i] = 0.0;
138435e7444dSHong Zhang     for (j = ai[i]; j < ai[i + 1]; j++) {
138535e7444dSHong Zhang       if (aj[j] == i) {
138635e7444dSHong Zhang         x[i] = aa[j];
138717ab2063SBarry Smith         break;
138817ab2063SBarry Smith       }
138917ab2063SBarry Smith     }
139017ab2063SBarry Smith   }
13919566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
13929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
139417ab2063SBarry Smith }
139517ab2063SBarry Smith 
1396c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1397d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1398d71ae5a4SJacob Faibussowitsch {
1399416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
14005f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1401d9ca1df4SBarry Smith   PetscScalar       *y;
1402d9ca1df4SBarry Smith   const PetscScalar *x;
1403d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
14045c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
14055f22a7b3SSebastian Grimberg   const MatScalar  *v;
1406a77337e4SBarry Smith   PetscScalar       alpha;
1407d9ca1df4SBarry Smith   PetscInt          n, i, j;
1408d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14093447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1410ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14115c897100SBarry Smith #endif
141217ab2063SBarry Smith 
14133a40ed3dSBarry Smith   PetscFunctionBegin;
14149566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14159566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14169566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14179566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14185c897100SBarry Smith 
14195c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1420fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14215c897100SBarry Smith #else
14223447b6efSHong Zhang   if (usecprow) {
14233447b6efSHong Zhang     m    = cprow.nrows;
14243447b6efSHong Zhang     ii   = cprow.i;
14257b2bb3b9SHong Zhang     ridx = cprow.rindex;
14263447b6efSHong Zhang   } else {
14273447b6efSHong Zhang     ii = a->i;
14283447b6efSHong Zhang   }
142917ab2063SBarry Smith   for (i = 0; i < m; i++) {
14303447b6efSHong Zhang     idx = a->j + ii[i];
1431fff043a9SJunchao Zhang     v   = aa + ii[i];
14323447b6efSHong Zhang     n   = ii[i + 1] - ii[i];
14333447b6efSHong Zhang     if (usecprow) {
14347b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14353447b6efSHong Zhang     } else {
143617ab2063SBarry Smith       alpha = x[i];
14373447b6efSHong Zhang     }
143804fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
143917ab2063SBarry Smith   }
14405c897100SBarry Smith #endif
14419566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14429566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14439566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
144617ab2063SBarry Smith }
144717ab2063SBarry Smith 
1448d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1449d71ae5a4SJacob Faibussowitsch {
14505c897100SBarry Smith   PetscFunctionBegin;
14519566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14529566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14533ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14545c897100SBarry Smith }
14555c897100SBarry Smith 
1456c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
145778b84d54SShri Abhyankar 
1458d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1459d71ae5a4SJacob Faibussowitsch {
1460416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1461d9fead3dSBarry Smith   PetscScalar       *y;
146254f21887SBarry Smith   const PetscScalar *x;
14635914357eSBarry Smith   const MatScalar   *a_a;
1464003131ecSBarry Smith   PetscInt           m = A->rmap->n;
14655914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
1466ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
146717ab2063SBarry Smith 
1468b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
146997952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1470fee21e36SBarry Smith #endif
1471fee21e36SBarry Smith 
14723a40ed3dSBarry Smith   PetscFunctionBegin;
1473b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14749566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
14753ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1476b215bc84SStefano Zampini   }
14779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14789566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14799566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1480416022c9SBarry Smith   ii = a->i;
14814eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14829566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
148397952fefSHong Zhang     m    = a->compressedrow.nrows;
148497952fefSHong Zhang     ii   = a->compressedrow.i;
148597952fefSHong Zhang     ridx = a->compressedrow.rindex;
14865914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
14875914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
14885914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
14895914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
14905914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
14915914357eSBarry Smith       PetscScalar        sum = 0.0;
1492003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1493003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
149497952fefSHong Zhang       y[*ridx++] = sum;
149597952fefSHong Zhang     }
149697952fefSHong Zhang   } else { /* do not use compressed row format */
1497b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
14985914357eSBarry Smith     fortranmultaij_(&m, x, ii, a->j, a_a, y);
1499b05257ddSBarry Smith #else
15005914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
15015914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
15025914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
15035914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
15045914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
15055914357eSBarry Smith       PetscScalar        sum = 0.0;
1506003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
150717ab2063SBarry Smith       y[i] = sum;
150817ab2063SBarry Smith     }
15098d195f9aSBarry Smith #endif
1510b05257ddSBarry Smith   }
15119566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15129566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15139566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
151617ab2063SBarry Smith }
151717ab2063SBarry Smith 
1518ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1519ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1520d71ae5a4SJacob Faibussowitsch {
1521b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1522b434eb95SMatthew G. Knepley   PetscScalar       *y;
1523b434eb95SMatthew G. Knepley   const PetscScalar *x;
1524fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1525b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1526b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1527b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1528b434eb95SMatthew G. Knepley   PetscScalar        sum;
1529b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1530b434eb95SMatthew G. Knepley 
1531b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1532b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1533b434eb95SMatthew G. Knepley #endif
1534b434eb95SMatthew G. Knepley 
1535b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15379566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15389566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1539b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1540b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1541b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1542b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1543b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1544b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1545b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1546fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1547b434eb95SMatthew G. Knepley       sum = 0.0;
1548b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1549b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1550b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1551b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1552b434eb95SMatthew G. Knepley     }
1553b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15543d3eaba7SBarry Smith     ii = a->i;
1555b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1556b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1557b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1558fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1559b434eb95SMatthew G. Knepley       sum = 0.0;
1560b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1561b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1562b434eb95SMatthew G. Knepley       y[i] = sum;
1563b434eb95SMatthew G. Knepley     }
1564b434eb95SMatthew G. Knepley   }
15659566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15669566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15679566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1570b434eb95SMatthew G. Knepley }
1571b434eb95SMatthew G. Knepley 
1572ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1573ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1574d71ae5a4SJacob Faibussowitsch {
1575b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1576b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1577b434eb95SMatthew G. Knepley   const PetscScalar *x;
1578fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1579b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1580b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1581b434eb95SMatthew G. Knepley   PetscScalar        sum;
1582b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1583b434eb95SMatthew G. Knepley 
1584b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15859566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15869566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15879566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1588b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
158948a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1590b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1591b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1592b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1593b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1594b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1595b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1596fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1597b434eb95SMatthew G. Knepley       sum = y[*ridx];
1598b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1599b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1600b434eb95SMatthew G. Knepley     }
1601b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
16023d3eaba7SBarry Smith     ii = a->i;
1603b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1604b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1605b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1606fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1607b434eb95SMatthew G. Knepley       sum = y[i];
1608b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1609b434eb95SMatthew G. Knepley       z[i] = sum;
1610b434eb95SMatthew G. Knepley     }
1611b434eb95SMatthew G. Knepley   }
16129566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16139566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16149566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1617b434eb95SMatthew G. Knepley }
1618b434eb95SMatthew G. Knepley 
1619c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1620d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1621d71ae5a4SJacob Faibussowitsch {
1622416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1623f15663dcSBarry Smith   PetscScalar       *y, *z;
1624f15663dcSBarry Smith   const PetscScalar *x;
16255914357eSBarry Smith   const MatScalar   *a_a;
16265914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
16275914357eSBarry Smith   PetscInt           m        = A->rmap->n;
1628ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16299ea0dfa2SSatish Balay 
16303a40ed3dSBarry Smith   PetscFunctionBegin;
1631b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16329566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
16333ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1634b215bc84SStefano Zampini   }
16359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16369566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16379566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16384eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
163948a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
164097952fefSHong Zhang     m    = a->compressedrow.nrows;
164197952fefSHong Zhang     ii   = a->compressedrow.i;
164297952fefSHong Zhang     ridx = a->compressedrow.rindex;
16435914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16445914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16455914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16465914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16475914357eSBarry Smith       PetscScalar        sum = y[*ridx];
1648f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
164997952fefSHong Zhang       z[*ridx++] = sum;
165097952fefSHong Zhang     }
165197952fefSHong Zhang   } else { /* do not use compressed row format */
16523d3eaba7SBarry Smith     ii = a->i;
1653f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
16545914357eSBarry Smith     fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z);
1655f15663dcSBarry Smith #else
16565914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
16575914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16585914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16595914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16605914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16615914357eSBarry Smith       PetscScalar        sum = y[i];
1662f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
166317ab2063SBarry Smith       z[i] = sum;
166417ab2063SBarry Smith     }
166502ab625aSSatish Balay #endif
1666f15663dcSBarry Smith   }
16679566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16689566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16699566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
167217ab2063SBarry Smith }
167317ab2063SBarry Smith 
167417ab2063SBarry Smith /*
167517ab2063SBarry Smith      Adds diagonal pointers to sparse matrix structure.
167617ab2063SBarry Smith */
1677d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
1678d71ae5a4SJacob Faibussowitsch {
1679416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1680d0f46423SBarry Smith   PetscInt    i, j, m = A->rmap->n;
1681c0c07093SJunchao Zhang   PetscBool   alreadySet = PETSC_TRUE;
168217ab2063SBarry Smith 
16833a40ed3dSBarry Smith   PetscFunctionBegin;
168409f38230SBarry Smith   if (!a->diag) {
16859566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &a->diag));
1686c0c07093SJunchao Zhang     alreadySet = PETSC_FALSE;
168709f38230SBarry Smith   }
1688d0f46423SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
1689c0c07093SJunchao Zhang     /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */
1690c0c07093SJunchao Zhang     if (alreadySet) {
1691c0c07093SJunchao Zhang       PetscInt pos = a->diag[i];
1692c0c07093SJunchao Zhang       if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue;
1693c0c07093SJunchao Zhang     }
1694c0c07093SJunchao Zhang 
169509f38230SBarry Smith     a->diag[i] = a->i[i + 1];
1696bfeeae90SHong Zhang     for (j = a->i[i]; j < a->i[i + 1]; j++) {
1697bfeeae90SHong Zhang       if (a->j[j] == i) {
169809f38230SBarry Smith         a->diag[i] = j;
169917ab2063SBarry Smith         break;
170017ab2063SBarry Smith       }
170117ab2063SBarry Smith     }
170217ab2063SBarry Smith   }
17033ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
170417ab2063SBarry Smith }
170517ab2063SBarry Smith 
1706ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1707d71ae5a4SJacob Faibussowitsch {
170861ecd0c6SBarry Smith   Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
170961ecd0c6SBarry Smith   const PetscInt *diag = (const PetscInt *)a->diag;
171061ecd0c6SBarry Smith   const PetscInt *ii   = (const PetscInt *)a->i;
171161ecd0c6SBarry Smith   PetscInt        i, *mdiag = NULL;
171261ecd0c6SBarry Smith   PetscInt        cnt = 0; /* how many diagonals are missing */
171361ecd0c6SBarry Smith 
171461ecd0c6SBarry Smith   PetscFunctionBegin;
171561ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
17169566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
17179566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
17183ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
171961ecd0c6SBarry Smith   }
172061ecd0c6SBarry Smith 
172161ecd0c6SBarry Smith   if (a->diagonaldense) {
172261ecd0c6SBarry Smith     cnt = 0;
172361ecd0c6SBarry Smith   } else {
17249566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
172561ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
1726349d3b71SJunchao Zhang       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
172761ecd0c6SBarry Smith         cnt++;
172861ecd0c6SBarry Smith         mdiag[i] = 1;
172961ecd0c6SBarry Smith       }
173061ecd0c6SBarry Smith     }
173161ecd0c6SBarry Smith   }
173261ecd0c6SBarry Smith   if (!cnt) {
17339566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
173461ecd0c6SBarry Smith   } else {
1735b6f2aa54SBarry Smith     PetscScalar       *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1736b6f2aa54SBarry Smith     PetscInt          *oldj = a->j, *oldi = a->i;
17379f0612e4SBarry Smith     PetscBool          free_a = a->free_a, free_ij = a->free_ij;
17386ea2a7edSJunchao Zhang     const PetscScalar *Aa;
17396ea2a7edSJunchao Zhang 
17406ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host
17416ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa));
174261ecd0c6SBarry Smith 
174361ecd0c6SBarry Smith     a->a = NULL;
174461ecd0c6SBarry Smith     a->j = NULL;
174561ecd0c6SBarry Smith     a->i = NULL;
174661ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
1747ad540459SPierre Jolivet     for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17489566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
174961ecd0c6SBarry Smith 
175061ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
175161ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
17529566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
175348a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1754447d62f5SStefano Zampini     }
17559566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17569566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
17579f0612e4SBarry Smith     if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda));
17589f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj));
17599f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi));
176061ecd0c6SBarry Smith   }
17619566063dSJacob Faibussowitsch   PetscCall(PetscFree(mdiag));
176261ecd0c6SBarry Smith   a->diagonaldense = PETSC_TRUE;
17633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
176461ecd0c6SBarry Smith }
176561ecd0c6SBarry Smith 
1766be5855fcSBarry Smith /*
1767be5855fcSBarry Smith      Checks for missing diagonals
1768be5855fcSBarry Smith */
1769d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d)
1770d71ae5a4SJacob Faibussowitsch {
1771be5855fcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
17727734d3b5SMatthew G. Knepley   PetscInt   *diag, *ii = a->i, i;
1773be5855fcSBarry Smith 
1774be5855fcSBarry Smith   PetscFunctionBegin;
177509f38230SBarry Smith   *missing = PETSC_FALSE;
17767734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
177709f38230SBarry Smith     *missing = PETSC_TRUE;
177809f38230SBarry Smith     if (d) *d = 0;
17799566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
178009f38230SBarry Smith   } else {
178101445905SHong Zhang     PetscInt n;
178201445905SHong Zhang     n    = PetscMin(A->rmap->n, A->cmap->n);
1783f1e2ffcdSBarry Smith     diag = a->diag;
178401445905SHong Zhang     for (i = 0; i < n; i++) {
17857734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
178609f38230SBarry Smith         *missing = PETSC_TRUE;
178709f38230SBarry Smith         if (d) *d = i;
17889566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i));
1789358d2f5dSShri Abhyankar         break;
179009f38230SBarry Smith       }
1791be5855fcSBarry Smith     }
1792be5855fcSBarry Smith   }
17933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1794be5855fcSBarry Smith }
1795be5855fcSBarry Smith 
17960da83c2eSBarry Smith #include <petscblaslapack.h>
17970da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
17980da83c2eSBarry Smith 
17990da83c2eSBarry Smith /*
18000da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
18010da83c2eSBarry Smith */
1802ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1803d71ae5a4SJacob Faibussowitsch {
18040da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
18050da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
18060da83c2eSBarry Smith   const PetscReal shift = 0.0;
18070da83c2eSBarry Smith   PetscInt        ipvt[5];
18084e208921SJed Brown   PetscCount      flops = 0;
18090da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
18100da83c2eSBarry Smith 
18110da83c2eSBarry Smith   PetscFunctionBegin;
18120da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
18130da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
181408401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1815ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
18169566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
181748a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
18180da83c2eSBarry Smith   ncnt = 0;
18190da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
18200da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
18219566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
18220da83c2eSBarry Smith     switch (bsizes[i]) {
1823d71ae5a4SJacob Faibussowitsch     case 1:
1824d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1825d71ae5a4SJacob Faibussowitsch       break;
18260da83c2eSBarry Smith     case 2:
18279566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
18280da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18299566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
18300da83c2eSBarry Smith       break;
18310da83c2eSBarry Smith     case 3:
18329566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
18330da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18349566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
18350da83c2eSBarry Smith       break;
18360da83c2eSBarry Smith     case 4:
18379566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
18380da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18399566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
18400da83c2eSBarry Smith       break;
18410da83c2eSBarry Smith     case 5:
18429566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
18430da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18449566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
18450da83c2eSBarry Smith       break;
18460da83c2eSBarry Smith     case 6:
18479566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
18480da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18499566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
18500da83c2eSBarry Smith       break;
18510da83c2eSBarry Smith     case 7:
18529566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
18530da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18549566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
18550da83c2eSBarry Smith       break;
18560da83c2eSBarry Smith     default:
18579566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
18580da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18599566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
18600da83c2eSBarry Smith     }
18610da83c2eSBarry Smith     ncnt += bsizes[i];
18620da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
1863baa50dc0SBrad Aagaard     flops += 2 * PetscPowInt64(bsizes[i], 3) / 3;
18640da83c2eSBarry Smith   }
18653ba16761SJacob Faibussowitsch   PetscCall(PetscLogFlops(flops));
186648a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18679566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18690da83c2eSBarry Smith }
18700da83c2eSBarry Smith 
1871422a814eSBarry Smith /*
1872422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1873422a814eSBarry Smith */
1874ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1875d71ae5a4SJacob Faibussowitsch {
187671f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1877d0f46423SBarry Smith   PetscInt         i, *diag, m = A->rmap->n;
18782e5835c6SStefano Zampini   const MatScalar *v;
187954f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
188071f1c65dSBarry Smith 
188171f1c65dSBarry Smith   PetscFunctionBegin;
18823ba16761SJacob Faibussowitsch   if (a->idiagvalid) PetscFunctionReturn(PETSC_SUCCESS);
18839566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
188471f1c65dSBarry Smith   diag = a->diag;
18854dfa11a4SJacob Faibussowitsch   if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); }
18862e5835c6SStefano Zampini 
188771f1c65dSBarry Smith   mdiag = a->mdiag;
188871f1c65dSBarry Smith   idiag = a->idiag;
18899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1890422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
189171f1c65dSBarry Smith     for (i = 0; i < m; i++) {
189271f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1893899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1894899639b0SHong Zhang         if (PetscRealPart(fshift)) {
18959566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
18967b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18977b6c816cSBarry Smith           A->factorerror_zeropivot_value = 0.0;
18987b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
189998921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
1900899639b0SHong Zhang       }
190171f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
190271f1c65dSBarry Smith     }
19039566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
190471f1c65dSBarry Smith   } else {
190571f1c65dSBarry Smith     for (i = 0; i < m; i++) {
190671f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
190771f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
190871f1c65dSBarry Smith     }
19099566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
191071f1c65dSBarry Smith   }
191171f1c65dSBarry Smith   a->idiagvalid = PETSC_TRUE;
19129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
19133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
191471f1c65dSBarry Smith }
191571f1c65dSBarry Smith 
1916d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1917d71ae5a4SJacob Faibussowitsch {
1918416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1919e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
19202e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
192154f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
19223d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
192397f1f81fSBarry Smith   const PetscInt    *idx, *diag;
192417ab2063SBarry Smith 
19253a40ed3dSBarry Smith   PetscFunctionBegin;
1926b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
19279566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
19283ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1929b215bc84SStefano Zampini   }
1930b965ef7fSBarry Smith   its = its * lits;
193191723122SBarry Smith 
193271f1c65dSBarry Smith   if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
19339566063dSJacob Faibussowitsch   if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift));
193471f1c65dSBarry Smith   a->fshift = fshift;
193571f1c65dSBarry Smith   a->omega  = omega;
1936ed480e8bSBarry Smith 
193771f1c65dSBarry Smith   diag  = a->diag;
193871f1c65dSBarry Smith   t     = a->ssor_work;
1939ed480e8bSBarry Smith   idiag = a->idiag;
194071f1c65dSBarry Smith   mdiag = a->mdiag;
1941ed480e8bSBarry Smith 
19429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
19439566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
19449566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1945ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
194617ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
194717ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1948ed480e8bSBarry Smith     bs = b;
194917ab2063SBarry Smith     for (i = 0; i < m; i++) {
195071f1c65dSBarry Smith       d   = fshift + mdiag[i];
1951416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1952ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19532e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
195417ab2063SBarry Smith       sum = b[i] * d / omega;
1955003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
195617ab2063SBarry Smith       x[i] = sum;
195717ab2063SBarry Smith     }
19589566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19599566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19609566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
19619566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
19623ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
196317ab2063SBarry Smith   }
1964c783ea89SBarry Smith 
196508401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1966f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19674c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1968887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
196917ab2063SBarry Smith 
197017ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
197117ab2063SBarry Smith 
1972887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
197317ab2063SBarry Smith     */
197417ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
197517ab2063SBarry Smith 
197617ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
197717ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1978416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1979ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19802e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
198117ab2063SBarry Smith       sum = b[i];
1982e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1983ed480e8bSBarry Smith       x[i] = sum * idiag[i];
198417ab2063SBarry Smith     }
198517ab2063SBarry Smith 
198617ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19872e5835c6SStefano Zampini     v = aa;
19882205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
198917ab2063SBarry Smith 
199017ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1991ed480e8bSBarry Smith     ts   = t;
1992416022c9SBarry Smith     diag = a->diag;
199317ab2063SBarry Smith     for (i = 0; i < m; i++) {
1994416022c9SBarry Smith       n   = diag[i] - a->i[i];
1995ed480e8bSBarry Smith       idx = a->j + a->i[i];
19962e5835c6SStefano Zampini       v   = aa + a->i[i];
199717ab2063SBarry Smith       sum = t[i];
1998003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
1999ed480e8bSBarry Smith       t[i] = sum * idiag[i];
2000733d66baSBarry Smith       /*  x = x + t */
2001733d66baSBarry Smith       x[i] += t[i];
200217ab2063SBarry Smith     }
200317ab2063SBarry Smith 
20049566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
20059566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
20069566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
20073ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
200817ab2063SBarry Smith   }
200917ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
201017ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
201117ab2063SBarry Smith       for (i = 0; i < m; i++) {
2012416022c9SBarry Smith         n   = diag[i] - a->i[i];
2013ed480e8bSBarry Smith         idx = a->j + a->i[i];
20142e5835c6SStefano Zampini         v   = aa + a->i[i];
201517ab2063SBarry Smith         sum = b[i];
2016e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20175c99c7daSBarry Smith         t[i] = sum;
2018ed480e8bSBarry Smith         x[i] = sum * idiag[i];
201917ab2063SBarry Smith       }
20205c99c7daSBarry Smith       xb = t;
20219566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
20223a40ed3dSBarry Smith     } else xb = b;
202317ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
202417ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2025416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
2026ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
20272e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
202817ab2063SBarry Smith         sum = xb[i];
2029e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20305c99c7daSBarry Smith         if (xb == b) {
2031ed480e8bSBarry Smith           x[i] = sum * idiag[i];
20325c99c7daSBarry Smith         } else {
2033b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
203417ab2063SBarry Smith         }
20355c99c7daSBarry Smith       }
20369566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
203717ab2063SBarry Smith     }
203817ab2063SBarry Smith     its--;
203917ab2063SBarry Smith   }
204017ab2063SBarry Smith   while (its--) {
204117ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
204217ab2063SBarry Smith       for (i = 0; i < m; i++) {
2043b19a5dc2SMark Adams         /* lower */
2044b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
2045ed480e8bSBarry Smith         idx = a->j + a->i[i];
20462e5835c6SStefano Zampini         v   = aa + a->i[i];
204717ab2063SBarry Smith         sum = b[i];
2048e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2049b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
2050b19a5dc2SMark Adams         /* upper */
2051b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
2052b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
20532e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
2054b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2055b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
205617ab2063SBarry Smith       }
2057b19a5dc2SMark Adams       xb = t;
20589566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
2059b19a5dc2SMark Adams     } else xb = b;
206017ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
206117ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2062b19a5dc2SMark Adams         sum = xb[i];
2063b19a5dc2SMark Adams         if (xb == b) {
2064b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
2065416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
2066ed480e8bSBarry Smith           idx = a->j + a->i[i];
20672e5835c6SStefano Zampini           v   = aa + a->i[i];
2068e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2069ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2070b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2071b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2072b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20732e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2074b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2075b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
207617ab2063SBarry Smith         }
2077b19a5dc2SMark Adams       }
2078b19a5dc2SMark Adams       if (xb == b) {
20799566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2080b19a5dc2SMark Adams       } else {
20819566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2082b19a5dc2SMark Adams       }
208317ab2063SBarry Smith     }
208417ab2063SBarry Smith   }
20859566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20869566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20879566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
20883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
208917ab2063SBarry Smith }
209017ab2063SBarry Smith 
2091ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2092d71ae5a4SJacob Faibussowitsch {
2093416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
20944e220ebcSLois Curfman McInnes 
20953a40ed3dSBarry Smith   PetscFunctionBegin;
20964e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
20973966268fSBarry Smith   info->nz_allocated = a->maxnz;
20983966268fSBarry Smith   info->nz_used      = a->nz;
20993966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
21003966268fSBarry Smith   info->assemblies   = A->num_ass;
21013966268fSBarry Smith   info->mallocs      = A->info.mallocs;
21024dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2103d5f3da31SBarry Smith   if (A->factortype) {
21044e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
21054e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
21064e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
21074e220ebcSLois Curfman McInnes   } else {
21084e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
21094e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
21104e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
21114e220ebcSLois Curfman McInnes   }
21123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
211317ab2063SBarry Smith }
211417ab2063SBarry Smith 
2115ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2116d71ae5a4SJacob Faibussowitsch {
2117416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2118c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
211997b48c8fSBarry Smith   const PetscScalar *xx;
21202e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2121c7da8527SEric Chamberland   PetscInt           d = 0;
212217ab2063SBarry Smith 
21233a40ed3dSBarry Smith   PetscFunctionBegin;
212497b48c8fSBarry Smith   if (x && b) {
21259566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21269566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
212797b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2128aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2129447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
213097b48c8fSBarry Smith       bb[rows[i]] = diag * xx[rows[i]];
213197b48c8fSBarry Smith     }
21329566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21339566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
213497b48c8fSBarry Smith   }
213597b48c8fSBarry Smith 
21369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2137a9817697SBarry Smith   if (a->keepnonzeropattern) {
2138f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2139aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21409566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2141f1e2ffcdSBarry Smith     }
2142f4df32b1SMatthew Knepley     if (diag != 0.0) {
2143c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2144c7da8527SEric Chamberland         d = rows[i];
2145447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
214608401ef6SPierre Jolivet         PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
2147c7da8527SEric Chamberland       }
2148f1e2ffcdSBarry Smith       for (i = 0; i < N; i++) {
2149447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
21502e5835c6SStefano Zampini         aa[a->diag[rows[i]]] = diag;
2151f1e2ffcdSBarry Smith       }
2152f1e2ffcdSBarry Smith     }
2153f1e2ffcdSBarry Smith   } else {
2154f4df32b1SMatthew Knepley     if (diag != 0.0) {
215517ab2063SBarry Smith       for (i = 0; i < N; i++) {
2156aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21577ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2158447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2159447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2160447d62f5SStefano Zampini           } else {
2161416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
21622e5835c6SStefano Zampini             aa[a->i[rows[i]]]   = diag;
2163bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2164447d62f5SStefano Zampini           }
2165447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
21669566063dSJacob Faibussowitsch           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
216717ab2063SBarry Smith         }
216817ab2063SBarry Smith       }
21693a40ed3dSBarry Smith     } else {
217017ab2063SBarry Smith       for (i = 0; i < N; i++) {
2171aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2172416022c9SBarry Smith         a->ilen[rows[i]] = 0;
217317ab2063SBarry Smith       }
217417ab2063SBarry Smith     }
2175e56f5c9eSBarry Smith     A->nonzerostate++;
2176f1e2ffcdSBarry Smith   }
21779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2178dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
218017ab2063SBarry Smith }
218117ab2063SBarry Smith 
2182ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2183d71ae5a4SJacob Faibussowitsch {
21846e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21856e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
21862b40b63fSBarry Smith   PetscBool          missing, *zeroed, vecs = PETSC_FALSE;
21876e169961SBarry Smith   const PetscScalar *xx;
21882e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
21896e169961SBarry Smith 
21906e169961SBarry Smith   PetscFunctionBegin;
21913ba16761SJacob Faibussowitsch   if (!N) PetscFunctionReturn(PETSC_SUCCESS);
21929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
21936e169961SBarry Smith   if (x && b) {
21949566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21959566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
21962b40b63fSBarry Smith     vecs = PETSC_TRUE;
21976e169961SBarry Smith   }
21989566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
21996e169961SBarry Smith   for (i = 0; i < N; i++) {
2200aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
22018e3a54c0SPierre Jolivet     PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]]));
22022205254eSKarl Rupp 
22036e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
22046e169961SBarry Smith   }
22056e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
22066e169961SBarry Smith     if (!zeroed[i]) {
22076e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
22084cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
22092e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
22102e5835c6SStefano Zampini           aa[j] = 0.0;
22116e169961SBarry Smith         }
22126e169961SBarry Smith       }
22134cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i];
22146e169961SBarry Smith   }
22156e169961SBarry Smith   if (x && b) {
22169566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
22179566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
22186e169961SBarry Smith   }
22199566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
22206e169961SBarry Smith   if (diag != 0.0) {
22219566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d));
22221d5a398dSstefano_zampini     if (missing) {
22231d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
22244cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2225aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
22269566063dSJacob Faibussowitsch         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
22271d5a398dSstefano_zampini       }
22281d5a398dSstefano_zampini     } else {
2229ad540459SPierre Jolivet       for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag;
22306e169961SBarry Smith     }
22311d5a398dSstefano_zampini   }
22329566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2233dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
22343ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22356e169961SBarry Smith }
22366e169961SBarry Smith 
2237d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2238d71ae5a4SJacob Faibussowitsch {
2239fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2240fff043a9SJunchao Zhang   const PetscScalar *aa;
224117ab2063SBarry Smith 
22423a40ed3dSBarry Smith   PetscFunctionBegin;
22439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2244416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
22458e3a54c0SPierre Jolivet   if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]);
224617ab2063SBarry Smith   if (idx) {
22475c0db29aSPierre Jolivet     if (*nz && a->j) *idx = a->j + a->i[row];
2248f4259b30SLisandro Dalcin     else *idx = NULL;
224917ab2063SBarry Smith   }
22509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
22513ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225217ab2063SBarry Smith }
225317ab2063SBarry Smith 
2254d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2255d71ae5a4SJacob Faibussowitsch {
22563a40ed3dSBarry Smith   PetscFunctionBegin;
22573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
225817ab2063SBarry Smith }
225917ab2063SBarry Smith 
2260ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2261d71ae5a4SJacob Faibussowitsch {
2262416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
22632e5835c6SStefano Zampini   const MatScalar *v;
226436db0b34SBarry Smith   PetscReal        sum = 0.0;
226597f1f81fSBarry Smith   PetscInt         i, j;
226617ab2063SBarry Smith 
22673a40ed3dSBarry Smith   PetscFunctionBegin;
22689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
226917ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2270570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2271570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2272792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2273570b7f6dSBarry Smith #else
2274416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22759371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22769371c9d4SSatish Balay       v++;
227717ab2063SBarry Smith     }
22788f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2279570b7f6dSBarry Smith #endif
22809566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22813a40ed3dSBarry Smith   } else if (type == NORM_1) {
228236db0b34SBarry Smith     PetscReal *tmp;
228397f1f81fSBarry Smith     PetscInt  *jj = a->j;
22849566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp));
2285064f8208SBarry Smith     *nrm = 0.0;
2286416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22879371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22889371c9d4SSatish Balay       v++;
228917ab2063SBarry Smith     }
2290d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2291064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
229217ab2063SBarry Smith     }
22939566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
22949566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
22953a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2296064f8208SBarry Smith     *nrm = 0.0;
2297d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
22988e3a54c0SPierre Jolivet       const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]);
229917ab2063SBarry Smith       sum                   = 0.0;
2300416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
23019371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
23029371c9d4SSatish Balay         v2++;
230317ab2063SBarry Smith       }
2304064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
230517ab2063SBarry Smith     }
23069566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
2307f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
23089566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
23093ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
231017ab2063SBarry Smith }
231117ab2063SBarry Smith 
2312ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2313d71ae5a4SJacob Faibussowitsch {
23143d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
231554f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
23162e5835c6SStefano Zampini   const MatScalar *va, *vb;
231797f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2318cd0d46ebSvictorle 
2319cd0d46ebSvictorle   PetscFunctionBegin;
23209566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23219566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23225485867bSBarry Smith   if (ma != nb || na != mb) {
23235485867bSBarry Smith     *f = PETSC_FALSE;
23243ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23255485867bSBarry Smith   }
23269566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
23279566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
23289371c9d4SSatish Balay   aii = aij->i;
23299371c9d4SSatish Balay   bii = bij->i;
23309371c9d4SSatish Balay   adx = aij->j;
23319371c9d4SSatish Balay   bdx = bij->j;
23329566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23339566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2334cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2335cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2336cd0d46ebSvictorle 
2337cd0d46ebSvictorle   *f = PETSC_TRUE;
2338cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2339cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
234097f1f81fSBarry Smith       PetscInt    idc, idr;
23415485867bSBarry Smith       PetscScalar vc, vr;
2342cd0d46ebSvictorle       /* column/row index/value */
23435485867bSBarry Smith       idc = adx[aptr[i]];
23445485867bSBarry Smith       idr = bdx[bptr[idc]];
23455485867bSBarry Smith       vc  = va[aptr[i]];
23465485867bSBarry Smith       vr  = vb[bptr[idc]];
23475485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
23485485867bSBarry Smith         *f = PETSC_FALSE;
23495485867bSBarry Smith         goto done;
2350cd0d46ebSvictorle       } else {
23515485867bSBarry Smith         aptr[i]++;
23525485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2353cd0d46ebSvictorle       }
2354cd0d46ebSvictorle     }
2355cd0d46ebSvictorle   }
2356cd0d46ebSvictorle done:
23579566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23589566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23599566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
23609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
23613ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2362cd0d46ebSvictorle }
2363cd0d46ebSvictorle 
2364ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2365d71ae5a4SJacob Faibussowitsch {
23663d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
236754f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
236854f21887SBarry Smith   MatScalar  *va, *vb;
23691cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23701cbb95d3SBarry Smith 
23711cbb95d3SBarry Smith   PetscFunctionBegin;
23729566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23739566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23741cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23751cbb95d3SBarry Smith     *f = PETSC_FALSE;
23763ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23771cbb95d3SBarry Smith   }
23789371c9d4SSatish Balay   aii = aij->i;
23799371c9d4SSatish Balay   bii = bij->i;
23809371c9d4SSatish Balay   adx = aij->j;
23819371c9d4SSatish Balay   bdx = bij->j;
23829371c9d4SSatish Balay   va  = aij->a;
23839371c9d4SSatish Balay   vb  = bij->a;
23849566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23859566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23861cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23871cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23881cbb95d3SBarry Smith 
23891cbb95d3SBarry Smith   *f = PETSC_TRUE;
23901cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
23911cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
23921cbb95d3SBarry Smith       PetscInt    idc, idr;
23931cbb95d3SBarry Smith       PetscScalar vc, vr;
23941cbb95d3SBarry Smith       /* column/row index/value */
23951cbb95d3SBarry Smith       idc = adx[aptr[i]];
23961cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
23971cbb95d3SBarry Smith       vc  = va[aptr[i]];
23981cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
23991cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
24001cbb95d3SBarry Smith         *f = PETSC_FALSE;
24011cbb95d3SBarry Smith         goto done;
24021cbb95d3SBarry Smith       } else {
24031cbb95d3SBarry Smith         aptr[i]++;
24041cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
24051cbb95d3SBarry Smith       }
24061cbb95d3SBarry Smith     }
24071cbb95d3SBarry Smith   }
24081cbb95d3SBarry Smith done:
24099566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
24109566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
24113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
24121cbb95d3SBarry Smith }
24131cbb95d3SBarry Smith 
2414d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2415d71ae5a4SJacob Faibussowitsch {
2416416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2417fff8e43fSBarry Smith   const PetscScalar *l, *r;
2418fff8e43fSBarry Smith   PetscScalar        x;
241954f21887SBarry Smith   MatScalar         *v;
2420fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2421fff8e43fSBarry Smith   const PetscInt    *jj;
242217ab2063SBarry Smith 
24233a40ed3dSBarry Smith   PetscFunctionBegin;
242417ab2063SBarry Smith   if (ll) {
24253ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
24263ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
24279566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
242808401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
24299566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
24309566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
243117ab2063SBarry Smith     for (i = 0; i < m; i++) {
243217ab2063SBarry Smith       x = l[i];
2433416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
24342205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
243517ab2063SBarry Smith     }
24369566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
24379566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
24389566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
243917ab2063SBarry Smith   }
244017ab2063SBarry Smith   if (rr) {
24419566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
244208401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
24439566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
24449566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
24452e5835c6SStefano Zampini     jj = a->j;
24462205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
24479566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
24489566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
24499566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
245017ab2063SBarry Smith   }
24519566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
24523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
245317ab2063SBarry Smith }
245417ab2063SBarry Smith 
2455d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2456d71ae5a4SJacob Faibussowitsch {
2457db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2458d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
245997f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
24605d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
24612e5835c6SStefano Zampini   const PetscScalar *aa;
24625d0c19d7SBarry Smith   PetscInt           nrows, ncols;
246397f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
2464fb3c7e2dSJunchao Zhang   MatScalar         *a_new, *mat_a, *c_a;
2465416022c9SBarry Smith   Mat                C;
2466cdc6f3adSToby Isaac   PetscBool          stride;
246717ab2063SBarry Smith 
24683a40ed3dSBarry Smith   PetscFunctionBegin;
24699566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24709566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24719566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
247217ab2063SBarry Smith 
24739566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2474ff718158SBarry Smith   if (stride) {
24759566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2476ff718158SBarry Smith   } else {
2477ff718158SBarry Smith     first = 0;
2478ff718158SBarry Smith     step  = 0;
2479ff718158SBarry Smith   }
2480fee21e36SBarry Smith   if (stride && step == 1) {
248102834360SBarry Smith     /* special case of contiguous rows */
24829566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
248302834360SBarry Smith     /* loop over new rows determining lens and starting points */
248402834360SBarry Smith     for (i = 0; i < nrows; i++) {
2485bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2486a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2487a91a9bebSLisandro Dalcin       starts[i] = kstart;
248802834360SBarry Smith       for (k = kstart; k < kend; k++) {
2489bfeeae90SHong Zhang         if (aj[k] >= first) {
249002834360SBarry Smith           starts[i] = k;
249102834360SBarry Smith           break;
249202834360SBarry Smith         }
249302834360SBarry Smith       }
2494a2744918SBarry Smith       sum = 0;
249502834360SBarry Smith       while (k < kend) {
2496bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2497a2744918SBarry Smith         sum++;
249802834360SBarry Smith       }
2499a2744918SBarry Smith       lens[i] = sum;
250002834360SBarry Smith     }
250102834360SBarry Smith     /* create submatrix */
2502cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
250397f1f81fSBarry Smith       PetscInt n_cols, n_rows;
25049566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2505aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
25069566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
250708480c60SBarry Smith       C = *B;
25083a40ed3dSBarry Smith     } else {
25093bef6203SJed Brown       PetscInt rbs, cbs;
25109566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25119566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25129566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25139566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25149566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25159566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25169566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
251708480c60SBarry Smith     }
2518db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2519db02288aSLois Curfman McInnes 
252002834360SBarry Smith     /* loop over rows inserting into submatrix */
2521fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C
2522db02288aSLois Curfman McInnes     j_new = c->j;
2523db02288aSLois Curfman McInnes     i_new = c->i;
25249566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
252502834360SBarry Smith     for (i = 0; i < nrows; i++) {
2526a2744918SBarry Smith       ii    = starts[i];
2527a2744918SBarry Smith       lensi = lens[i];
2528810441c8SPierre Jolivet       if (lensi) {
2529ad540459SPierre Jolivet         for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
25309566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2531a2744918SBarry Smith         a_new += lensi;
2532810441c8SPierre Jolivet       }
2533a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2534a2744918SBarry Smith       c->ilen[i]   = lensi;
253502834360SBarry Smith     }
2536fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly
25379566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
25389566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
25393a40ed3dSBarry Smith   } else {
25409566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
25419566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
25429566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
25434dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
25446bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
25454dcab191SBarry Smith       smap[icol[i]] = i + 1;
25464dcab191SBarry Smith     }
25474dcab191SBarry Smith 
254802834360SBarry Smith     /* determine lens of each row */
254902834360SBarry Smith     for (i = 0; i < nrows; i++) {
2550bfeeae90SHong Zhang       kstart  = ai[irow[i]];
255102834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
255202834360SBarry Smith       lens[i] = 0;
255302834360SBarry Smith       for (k = kstart; k < kend; k++) {
2554ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
255502834360SBarry Smith       }
255602834360SBarry Smith     }
255717ab2063SBarry Smith     /* Create and fill new matrix */
2558a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2559ace3abfcSBarry Smith       PetscBool equal;
25600f5bd95cSBarry Smith 
256199141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2562aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
25639566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
2564fdfbdca6SPierre Jolivet       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros");
25659566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
256608480c60SBarry Smith       C = *B;
25673a40ed3dSBarry Smith     } else {
25683bef6203SJed Brown       PetscInt rbs, cbs;
25699566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25709566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25719566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25729566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
257337a5e0faSPierre Jolivet       if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs));
25749566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25759566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
257608480c60SBarry Smith     }
25779566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2578fb3c7e2dSJunchao Zhang 
2579f4f49eeaSPierre Jolivet     c = (Mat_SeqAIJ *)C->data;
2580fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C
258117ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
258299141d43SSatish Balay       row      = irow[i];
2583bfeeae90SHong Zhang       kstart   = ai[row];
258499141d43SSatish Balay       kend     = kstart + a->ilen[row];
2585bfeeae90SHong Zhang       mat_i    = c->i[i];
25868e3a54c0SPierre Jolivet       mat_j    = PetscSafePointerPlusOffset(c->j, mat_i);
25878e3a54c0SPierre Jolivet       mat_a    = PetscSafePointerPlusOffset(c_a, mat_i);
258899141d43SSatish Balay       mat_ilen = c->ilen + i;
258917ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2590bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2591ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
25922e5835c6SStefano Zampini           *mat_a++ = aa[k];
259399141d43SSatish Balay           (*mat_ilen)++;
259417ab2063SBarry Smith         }
259517ab2063SBarry Smith       }
259617ab2063SBarry Smith     }
25979566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
259802834360SBarry Smith     /* Free work space */
25999566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
26009566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
26019566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2602cdc6f3adSToby Isaac     /* sort */
2603cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2604cdc6f3adSToby Isaac       PetscInt ilen;
2605cdc6f3adSToby Isaac 
2606cdc6f3adSToby Isaac       mat_i = c->i[i];
26078e3a54c0SPierre Jolivet       mat_j = PetscSafePointerPlusOffset(c->j, mat_i);
26088e3a54c0SPierre Jolivet       mat_a = PetscSafePointerPlusOffset(c_a, mat_i);
2609cdc6f3adSToby Isaac       ilen  = c->ilen[i];
26109566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2611cdc6f3adSToby Isaac     }
2612fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a));
261302834360SBarry Smith   }
26148c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
26159566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2616305c6ccfSStefano Zampini #endif
26179566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
26189566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
261917ab2063SBarry Smith 
26209566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2621416022c9SBarry Smith   *B = C;
26223ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
262317ab2063SBarry Smith }
262417ab2063SBarry Smith 
2625ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2626d71ae5a4SJacob Faibussowitsch {
262782d44351SHong Zhang   Mat B;
262882d44351SHong Zhang 
262982d44351SHong Zhang   PetscFunctionBegin;
2630c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
26319566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
26329566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
26339566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
26349566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
26359566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
263682d44351SHong Zhang     *subMat = B;
2637c2d650bdSHong Zhang   } else {
26389566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2639c2d650bdSHong Zhang   }
26403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
264182d44351SHong Zhang }
264282d44351SHong Zhang 
2643ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2644d71ae5a4SJacob Faibussowitsch {
264563b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
264663b91edcSBarry Smith   Mat         outA;
2647ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
264863b91edcSBarry Smith 
26493a40ed3dSBarry Smith   PetscFunctionBegin;
265008401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
26511df811f5SHong Zhang 
26529566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
26539566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2654a871dcd8SBarry Smith 
265563b91edcSBarry Smith   outA             = inA;
2656d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26579566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
26589566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
26592205254eSKarl Rupp 
26609566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
26619566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
26622205254eSKarl Rupp 
2663c3122656SLisandro Dalcin   a->row = row;
26642205254eSKarl Rupp 
26659566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
26669566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
26672205254eSKarl Rupp 
2668c3122656SLisandro Dalcin   a->col = col;
266963b91edcSBarry Smith 
267036db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26719566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26729566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2673f0ec6fceSSatish Balay 
267494a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
26759566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work));
267694a9d846SBarry Smith   }
267763b91edcSBarry Smith 
26789566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(inA));
2679137fb511SHong Zhang   if (row_identity && col_identity) {
26809566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2681137fb511SHong Zhang   } else {
26829566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2683137fb511SHong Zhang   }
26843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2685a871dcd8SBarry Smith }
2686a871dcd8SBarry Smith 
2687d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2688d71ae5a4SJacob Faibussowitsch {
2689f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2690dfa0f9e5SStefano Zampini   PetscScalar *v;
2691c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
26923a40ed3dSBarry Smith 
26933a40ed3dSBarry Smith   PetscFunctionBegin;
26949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
26959566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2696792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
26979566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
26989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
26999566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(inA));
27003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2701f0b747eeSBarry Smith }
2702f0b747eeSBarry Smith 
2703d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2704d71ae5a4SJacob Faibussowitsch {
270516b64355SHong Zhang   PetscInt i;
270616b64355SHong Zhang 
270716b64355SHong Zhang   PetscFunctionBegin;
270816b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
27099566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
271016b64355SHong Zhang 
271148a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
27129566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
271316b64355SHong Zhang 
271416b64355SHong Zhang     if (submatj->rbuf1) {
27159566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
27169566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
271716b64355SHong Zhang     }
271816b64355SHong Zhang 
271948a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
27209566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
27219566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
272216b64355SHong Zhang   }
272316b64355SHong Zhang 
272416b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2725eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&submatj->rmap));
27269566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
27279566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
272816b64355SHong Zhang #else
27299566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
273016b64355SHong Zhang #endif
273116b64355SHong Zhang 
273216b64355SHong Zhang   if (!submatj->allcolumns) {
273316b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2734eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIDestroy((PetscHMapI *)&submatj->cmap));
273516b64355SHong Zhang #else
27369566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
273716b64355SHong Zhang #endif
273816b64355SHong Zhang   }
27399566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
274016b64355SHong Zhang 
27419566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
27423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
274316b64355SHong Zhang }
274416b64355SHong Zhang 
2745d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2746d71ae5a4SJacob Faibussowitsch {
274716b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
27485c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
274916b64355SHong Zhang 
275016b64355SHong Zhang   PetscFunctionBegin;
27519566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
27529566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
27533ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
275416b64355SHong Zhang }
275516b64355SHong Zhang 
275689a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
2757ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2758d71ae5a4SJacob Faibussowitsch {
27592d033e1fSHong Zhang   PetscInt     i;
27600fb991dcSHong Zhang   Mat          C;
27610fb991dcSHong Zhang   Mat_SeqAIJ  *c;
27620fb991dcSHong Zhang   Mat_SubSppt *submatj;
27632d033e1fSHong Zhang 
27642d033e1fSHong Zhang   PetscFunctionBegin;
27652d033e1fSHong Zhang   for (i = 0; i < n; i++) {
27660fb991dcSHong Zhang     C       = (*mat)[i];
27670fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
27680fb991dcSHong Zhang     submatj = c->submatis1;
27692d033e1fSHong Zhang     if (submatj) {
2770682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
277126cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27729566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27739566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27749566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27753faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27769566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27779566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27789566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2779682e4c99SStefano Zampini       }
27802d033e1fSHong Zhang     } else {
27819566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
27822d033e1fSHong Zhang     }
27832d033e1fSHong Zhang   }
278486e85357SHong Zhang 
278563a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
27869566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
278763a75b2aSHong Zhang 
27889566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
27893ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
27902d033e1fSHong Zhang }
27912d033e1fSHong Zhang 
2792ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2793d71ae5a4SJacob Faibussowitsch {
279497f1f81fSBarry Smith   PetscInt i;
2795cddf8d76SBarry Smith 
27963a40ed3dSBarry Smith   PetscFunctionBegin;
279748a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2798cddf8d76SBarry Smith 
279948a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
28003ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2801cddf8d76SBarry Smith }
2802cddf8d76SBarry Smith 
2803ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2804d71ae5a4SJacob Faibussowitsch {
2805e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28069a88ca10SBarry Smith   PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
28075d0c19d7SBarry Smith   const PetscInt *idx;
28089a88ca10SBarry Smith   PetscInt        start, end, *ai, *aj, bs = (A->rmap->bs > 0 && A->rmap->bs == A->cmap->bs) ? A->rmap->bs : 1;
2809f1af5d2fSBarry Smith   PetscBT         table;
2810bbd702dbSSatish Balay 
28113a40ed3dSBarry Smith   PetscFunctionBegin;
28129a88ca10SBarry Smith   m  = A->rmap->n / bs;
2813e4d965acSSatish Balay   ai = a->i;
2814bfeeae90SHong Zhang   aj = a->j;
28158a047759SSatish Balay 
281608401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
281706763907SSatish Balay 
28189566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
28199566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
282006763907SSatish Balay 
2821e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2822b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2823e4d965acSSatish Balay     isz = 0;
28249566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2825e4d965acSSatish Balay 
2826e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28279566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
28289566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2829e4d965acSSatish Balay 
28309a88ca10SBarry Smith     if (bs > 1) {
28319a88ca10SBarry Smith       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
28329a88ca10SBarry Smith       for (j = 0; j < n; ++j) {
28339a88ca10SBarry Smith         if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
28349a88ca10SBarry Smith       }
28359a88ca10SBarry Smith       PetscCall(ISRestoreIndices(is[i], &idx));
28369a88ca10SBarry Smith       PetscCall(ISDestroy(&is[i]));
28379a88ca10SBarry Smith 
28389a88ca10SBarry Smith       k = 0;
28399a88ca10SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
28409a88ca10SBarry Smith         n = isz;
28419a88ca10SBarry Smith         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
28429a88ca10SBarry Smith           for (ll = 0; ll < bs; ll++) {
28439a88ca10SBarry Smith             row   = bs * nidx[k] + ll;
28449a88ca10SBarry Smith             start = ai[row];
28459a88ca10SBarry Smith             end   = ai[row + 1];
28469a88ca10SBarry Smith             for (l = start; l < end; l++) {
28479a88ca10SBarry Smith               val = aj[l] / bs;
28489a88ca10SBarry Smith               if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
28499a88ca10SBarry Smith             }
28509a88ca10SBarry Smith           }
28519a88ca10SBarry Smith         }
28529a88ca10SBarry Smith       }
285357508eceSPierre Jolivet       PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i));
28549a88ca10SBarry Smith     } else {
2855dd097bc3SLois Curfman McInnes       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2856e4d965acSSatish Balay       for (j = 0; j < n; ++j) {
28572205254eSKarl Rupp         if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
28584dcbc457SBarry Smith       }
28599566063dSJacob Faibussowitsch       PetscCall(ISRestoreIndices(is[i], &idx));
28609566063dSJacob Faibussowitsch       PetscCall(ISDestroy(&is[i]));
2861e4d965acSSatish Balay 
286204a348a9SBarry Smith       k = 0;
286304a348a9SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
286404a348a9SBarry Smith         n = isz;
286506763907SSatish Balay         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2866e4d965acSSatish Balay           row   = nidx[k];
2867e4d965acSSatish Balay           start = ai[row];
2868e4d965acSSatish Balay           end   = ai[row + 1];
286904a348a9SBarry Smith           for (l = start; l < end; l++) {
2870efb16452SHong Zhang             val = aj[l];
28712205254eSKarl Rupp             if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2872e4d965acSSatish Balay           }
2873e4d965acSSatish Balay         }
2874e4d965acSSatish Balay       }
287557508eceSPierre Jolivet       PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i));
2876e4d965acSSatish Balay     }
28779a88ca10SBarry Smith   }
28789566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
28799566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
28803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28814dcbc457SBarry Smith }
288217ab2063SBarry Smith 
2883ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2884d71ae5a4SJacob Faibussowitsch {
28850513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28863b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
28875d0c19d7SBarry Smith   const PetscInt *row, *col;
28885d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
288956cd22aeSBarry Smith   IS              icolp, irowp;
28900298fd71SBarry Smith   PetscInt       *cwork = NULL;
28910298fd71SBarry Smith   PetscScalar    *vwork = NULL;
28920513a670SBarry Smith 
28933a40ed3dSBarry Smith   PetscFunctionBegin;
28949566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
28959566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
28969566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
28979566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
28980513a670SBarry Smith 
28990513a670SBarry Smith   /* determine lengths of permuted rows */
29009566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
29012205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
29029566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
29039566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
29049566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
29059566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
29069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
29079566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
29080513a670SBarry Smith 
29099566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
29100513a670SBarry Smith   for (i = 0; i < m; i++) {
29119566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29122205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
29139566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
29149566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
29150513a670SBarry Smith   }
29169566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
29172205254eSKarl Rupp 
29183c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
29192205254eSKarl Rupp 
29208c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
29219566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
29229fe5e383SStefano Zampini #endif
29239566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
29249566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
29259566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
29269566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
29279566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
29289566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
292948a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
29303ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29310513a670SBarry Smith }
29320513a670SBarry Smith 
2933d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2934d71ae5a4SJacob Faibussowitsch {
2935cb5b572fSBarry Smith   PetscFunctionBegin;
293633f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
293733f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2938be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2939be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
29402e5835c6SStefano Zampini     const PetscScalar *aa;
2941be6bf707SBarry Smith 
29429566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
294308401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
29449566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n]));
29459566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
29469566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
2947cb5b572fSBarry Smith   } else {
29489566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2949cb5b572fSBarry Smith   }
29503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2951cb5b572fSBarry Smith }
2952cb5b572fSBarry Smith 
2953d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2954d71ae5a4SJacob Faibussowitsch {
29556c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
29566e111a19SKarl Rupp 
29576c0721eeSBarry Smith   PetscFunctionBegin;
29586c0721eeSBarry Smith   *array = a->a;
29593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29606c0721eeSBarry Smith }
29616c0721eeSBarry Smith 
2962d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2963d71ae5a4SJacob Faibussowitsch {
29646c0721eeSBarry Smith   PetscFunctionBegin;
2965f38c1e66SStefano Zampini   *array = NULL;
29663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29676c0721eeSBarry Smith }
2968273d9f13SBarry Smith 
29698229c054SShri Abhyankar /*
29708229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29718229c054SShri Abhyankar    have different nonzero structure.
29728229c054SShri Abhyankar */
2973d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2974d71ae5a4SJacob Faibussowitsch {
2975b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2976ec7775f6SShri Abhyankar 
2977ec7775f6SShri Abhyankar   PetscFunctionBegin;
2978ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2979ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
29808e3a54c0SPierre Jolivet     const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]);
2981b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
2982b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
29838af7cee1SJed Brown     nnz[i] = 0;
29848af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
2985b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
2986b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
29878af7cee1SJed Brown       nnz[i]++;
29888af7cee1SJed Brown     }
29898af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
2990ec7775f6SShri Abhyankar   }
29913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2992ec7775f6SShri Abhyankar }
2993ec7775f6SShri Abhyankar 
2994d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
2995d71ae5a4SJacob Faibussowitsch {
2996b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
2997b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
2998b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
2999b264fe52SHong Zhang 
3000b264fe52SHong Zhang   PetscFunctionBegin;
3001b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
30029566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
30033ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3004b264fe52SHong Zhang }
3005b264fe52SHong Zhang 
3006d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
3007d71ae5a4SJacob Faibussowitsch {
3008ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
3009ac90fabeSBarry Smith 
3010ac90fabeSBarry Smith   PetscFunctionBegin;
3011134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
3012134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
3013134adf20SPierre Jolivet     if (e) {
30149566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
301581fa06acSBarry Smith       if (e) {
30169566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
3017134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
301881fa06acSBarry Smith       }
301981fa06acSBarry Smith     }
302054c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
302181fa06acSBarry Smith   }
3022ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
30232e5835c6SStefano Zampini     const PetscScalar *xa;
30242e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
302581fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
302681fa06acSBarry Smith 
30279566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
30289566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
30299566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
3030792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
30319566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
30329566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
30339566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
30349566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
30359566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
3036ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
30379566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
3038ac90fabeSBarry Smith   } else {
30398229c054SShri Abhyankar     Mat       B;
30408229c054SShri Abhyankar     PetscInt *nnz;
30419566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
30429566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
30439566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
30449566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
30459566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
30469566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
30479566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
30489566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
30499566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
30509bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
30519566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
3052ac90fabeSBarry Smith   }
30533ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3054ac90fabeSBarry Smith }
3055ac90fabeSBarry Smith 
3056d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
3057d71ae5a4SJacob Faibussowitsch {
3058354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3059354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
3060354c94deSBarry Smith   PetscInt     i, nz;
3061354c94deSBarry Smith   PetscScalar *a;
3062354c94deSBarry Smith 
3063354c94deSBarry Smith   PetscFunctionBegin;
3064354c94deSBarry Smith   nz = aij->nz;
30659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
30662205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
30679566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
3068354c94deSBarry Smith #else
3069354c94deSBarry Smith   PetscFunctionBegin;
3070354c94deSBarry Smith #endif
30713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3072354c94deSBarry Smith }
3073354c94deSBarry Smith 
3074ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3075d71ae5a4SJacob Faibussowitsch {
3076e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3077d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3078e34fafa9SBarry Smith   PetscReal        atmp;
3079985db425SBarry Smith   PetscScalar     *x;
3080ce496241SStefano Zampini   const MatScalar *aa, *av;
3081e34fafa9SBarry Smith 
3082e34fafa9SBarry Smith   PetscFunctionBegin;
308328b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
30849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3085ce496241SStefano Zampini   aa = av;
3086e34fafa9SBarry Smith   ai = a->i;
3087e34fafa9SBarry Smith   aj = a->j;
3088e34fafa9SBarry Smith 
30899566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
30909566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
30919566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
309208401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3093e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
30949371c9d4SSatish Balay     ncols = ai[1] - ai[0];
30959371c9d4SSatish Balay     ai++;
3096e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3097985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
30989371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
30999371c9d4SSatish Balay         x[i] = atmp;
31009371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31019371c9d4SSatish Balay       }
31029371c9d4SSatish Balay       aa++;
31039371c9d4SSatish Balay       aj++;
3104985db425SBarry Smith     }
3105985db425SBarry Smith   }
31069566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31079566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31083ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3109985db425SBarry Smith }
3110985db425SBarry Smith 
3111eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v)
3112eede4a3fSMark Adams {
3113eede4a3fSMark Adams   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3114eede4a3fSMark Adams   PetscInt         i, j, m = A->rmap->n, *ai, ncols, n;
3115eede4a3fSMark Adams   PetscScalar     *x;
3116eede4a3fSMark Adams   const MatScalar *aa, *av;
3117eede4a3fSMark Adams 
3118eede4a3fSMark Adams   PetscFunctionBegin;
3119eede4a3fSMark Adams   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3120eede4a3fSMark Adams   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3121eede4a3fSMark Adams   aa = av;
3122eede4a3fSMark Adams   ai = a->i;
3123eede4a3fSMark Adams 
3124eede4a3fSMark Adams   PetscCall(VecSet(v, 0.0));
3125eede4a3fSMark Adams   PetscCall(VecGetArrayWrite(v, &x));
3126eede4a3fSMark Adams   PetscCall(VecGetLocalSize(v, &n));
3127eede4a3fSMark Adams   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3128eede4a3fSMark Adams   for (i = 0; i < m; i++) {
3129eede4a3fSMark Adams     ncols = ai[1] - ai[0];
3130eede4a3fSMark Adams     ai++;
3131eede4a3fSMark Adams     for (j = 0; j < ncols; j++) {
3132eede4a3fSMark Adams       x[i] += PetscAbsScalar(*aa);
3133eede4a3fSMark Adams       aa++;
3134eede4a3fSMark Adams     }
3135eede4a3fSMark Adams   }
3136eede4a3fSMark Adams   PetscCall(VecRestoreArrayWrite(v, &x));
3137eede4a3fSMark Adams   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3138eede4a3fSMark Adams   PetscFunctionReturn(PETSC_SUCCESS);
3139eede4a3fSMark Adams }
3140eede4a3fSMark Adams 
3141ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3142d71ae5a4SJacob Faibussowitsch {
3143985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3144d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3145985db425SBarry Smith   PetscScalar     *x;
3146ce496241SStefano Zampini   const MatScalar *aa, *av;
3147985db425SBarry Smith 
3148985db425SBarry Smith   PetscFunctionBegin;
314928b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3151ce496241SStefano Zampini   aa = av;
3152985db425SBarry Smith   ai = a->i;
3153985db425SBarry Smith   aj = a->j;
3154985db425SBarry Smith 
31559566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31569566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31579566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
315808401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3159985db425SBarry Smith   for (i = 0; i < m; i++) {
31609371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31619371c9d4SSatish Balay     ai++;
3162d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31639371c9d4SSatish Balay       x[i] = *aa;
31649371c9d4SSatish Balay       if (idx) idx[i] = 0;
3165985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3166985db425SBarry Smith       x[i] = 0.0;
3167985db425SBarry Smith       if (idx) {
3168985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3169985db425SBarry Smith           if (aj[j] > j) {
3170985db425SBarry Smith             idx[i] = j;
3171985db425SBarry Smith             break;
3172985db425SBarry Smith           }
3173985db425SBarry Smith         }
31741a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31751a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3176985db425SBarry Smith       }
3177985db425SBarry Smith     }
3178985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31799371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31809371c9d4SSatish Balay         x[i] = *aa;
31819371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31829371c9d4SSatish Balay       }
31839371c9d4SSatish Balay       aa++;
31849371c9d4SSatish Balay       aj++;
3185985db425SBarry Smith     }
3186985db425SBarry Smith   }
31879566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31893ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3190985db425SBarry Smith }
3191985db425SBarry Smith 
3192ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3193d71ae5a4SJacob Faibussowitsch {
3194c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3195c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3196ce496241SStefano Zampini   PetscScalar     *x;
3197ce496241SStefano Zampini   const MatScalar *aa, *av;
3198c87e5d42SMatthew Knepley 
3199c87e5d42SMatthew Knepley   PetscFunctionBegin;
32009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3201ce496241SStefano Zampini   aa = av;
3202c87e5d42SMatthew Knepley   ai = a->i;
3203c87e5d42SMatthew Knepley   aj = a->j;
3204c87e5d42SMatthew Knepley 
32059566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
32069566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32079566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
320808401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3209c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
32109371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32119371c9d4SSatish Balay     ai++;
3212f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
32139371c9d4SSatish Balay       x[i] = *aa;
32149371c9d4SSatish Balay       if (idx) idx[i] = 0;
3215f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3216f07e67edSHong Zhang       x[i] = 0.0;
3217f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3218289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3219f07e67edSHong Zhang           if (aj[j] > j) {
3220f07e67edSHong Zhang             idx[i] = j;
32212205254eSKarl Rupp             break;
32222205254eSKarl Rupp           }
3223289a08f5SMatthew Knepley         }
3224f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3225f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3226f07e67edSHong Zhang       }
3227289a08f5SMatthew Knepley     }
3228c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
32299371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
32309371c9d4SSatish Balay         x[i] = *aa;
32319371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32329371c9d4SSatish Balay       }
32339371c9d4SSatish Balay       aa++;
32349371c9d4SSatish Balay       aj++;
3235c87e5d42SMatthew Knepley     }
3236c87e5d42SMatthew Knepley   }
32379566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32389566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3240c87e5d42SMatthew Knepley }
3241c87e5d42SMatthew Knepley 
3242ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3243d71ae5a4SJacob Faibussowitsch {
3244985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3245d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3246d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3247985db425SBarry Smith   PetscScalar     *x;
3248ce496241SStefano Zampini   const MatScalar *aa, *av;
3249985db425SBarry Smith 
3250985db425SBarry Smith   PetscFunctionBegin;
325128b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
32529566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3253ce496241SStefano Zampini   aa = av;
3254985db425SBarry Smith   ai = a->i;
3255985db425SBarry Smith   aj = a->j;
3256985db425SBarry Smith 
32579566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
32589566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32599566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
326008401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3261985db425SBarry Smith   for (i = 0; i < m; i++) {
32629371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32639371c9d4SSatish Balay     ai++;
3264d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
32659371c9d4SSatish Balay       x[i] = *aa;
32669371c9d4SSatish Balay       if (idx) idx[i] = 0;
3267985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3268985db425SBarry Smith       x[i] = 0.0;
3269985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3270985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3271985db425SBarry Smith           if (aj[j] > j) {
3272985db425SBarry Smith             idx[i] = j;
3273985db425SBarry Smith             break;
3274985db425SBarry Smith           }
3275985db425SBarry Smith         }
3276fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3277fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3278985db425SBarry Smith       }
3279985db425SBarry Smith     }
3280985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32819371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32829371c9d4SSatish Balay         x[i] = *aa;
32839371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32849371c9d4SSatish Balay       }
32859371c9d4SSatish Balay       aa++;
32869371c9d4SSatish Balay       aj++;
3287e34fafa9SBarry Smith     }
3288e34fafa9SBarry Smith   }
32899566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3292e34fafa9SBarry Smith }
3293bbead8a2SBarry Smith 
3294ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3295d71ae5a4SJacob Faibussowitsch {
3296bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
329733d57670SJed Brown   PetscInt        i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3298bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
32990da83c2eSBarry Smith   const PetscReal shift = 0.0;
33001a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3301bbead8a2SBarry Smith 
3302bbead8a2SBarry Smith   PetscFunctionBegin;
3303a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
33044a0d0026SBarry Smith   if (a->ibdiagvalid) {
33054a0d0026SBarry Smith     if (values) *values = a->ibdiag;
33063ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
33074a0d0026SBarry Smith   }
33089566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
33094dfa11a4SJacob Faibussowitsch   if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); }
3310bbead8a2SBarry Smith   diag = a->ibdiag;
3311bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3312bbead8a2SBarry Smith   /* factor and invert each block */
3313bbead8a2SBarry Smith   switch (bs) {
3314bbead8a2SBarry Smith   case 1:
3315bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33169566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3317ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3318ec1892c8SHong Zhang         if (allowzeropivot) {
33197b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33207b6c816cSBarry Smith           A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
33217b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
33229566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
332398921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
3324ec1892c8SHong Zhang       }
3325bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3326bbead8a2SBarry Smith     }
3327bbead8a2SBarry Smith     break;
3328bbead8a2SBarry Smith   case 2:
3329bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33309371c9d4SSatish Balay       ij[0] = 2 * i;
33319371c9d4SSatish Balay       ij[1] = 2 * i + 1;
33329566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
33339566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
33347b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33359566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3336bbead8a2SBarry Smith       diag += 4;
3337bbead8a2SBarry Smith     }
3338bbead8a2SBarry Smith     break;
3339bbead8a2SBarry Smith   case 3:
3340bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33419371c9d4SSatish Balay       ij[0] = 3 * i;
33429371c9d4SSatish Balay       ij[1] = 3 * i + 1;
33439371c9d4SSatish Balay       ij[2] = 3 * i + 2;
33449566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
33459566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
33467b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33479566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3348bbead8a2SBarry Smith       diag += 9;
3349bbead8a2SBarry Smith     }
3350bbead8a2SBarry Smith     break;
3351bbead8a2SBarry Smith   case 4:
3352bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33539371c9d4SSatish Balay       ij[0] = 4 * i;
33549371c9d4SSatish Balay       ij[1] = 4 * i + 1;
33559371c9d4SSatish Balay       ij[2] = 4 * i + 2;
33569371c9d4SSatish Balay       ij[3] = 4 * i + 3;
33579566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
33589566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
33597b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33609566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3361bbead8a2SBarry Smith       diag += 16;
3362bbead8a2SBarry Smith     }
3363bbead8a2SBarry Smith     break;
3364bbead8a2SBarry Smith   case 5:
3365bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33669371c9d4SSatish Balay       ij[0] = 5 * i;
33679371c9d4SSatish Balay       ij[1] = 5 * i + 1;
33689371c9d4SSatish Balay       ij[2] = 5 * i + 2;
33699371c9d4SSatish Balay       ij[3] = 5 * i + 3;
33709371c9d4SSatish Balay       ij[4] = 5 * i + 4;
33719566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
33729566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
33737b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33749566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3375bbead8a2SBarry Smith       diag += 25;
3376bbead8a2SBarry Smith     }
3377bbead8a2SBarry Smith     break;
3378bbead8a2SBarry Smith   case 6:
3379bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33809371c9d4SSatish Balay       ij[0] = 6 * i;
33819371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33829371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33839371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33849371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33859371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33869566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33879566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33887b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33899566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3390bbead8a2SBarry Smith       diag += 36;
3391bbead8a2SBarry Smith     }
3392bbead8a2SBarry Smith     break;
3393bbead8a2SBarry Smith   case 7:
3394bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33959371c9d4SSatish Balay       ij[0] = 7 * i;
33969371c9d4SSatish Balay       ij[1] = 7 * i + 1;
33979371c9d4SSatish Balay       ij[2] = 7 * i + 2;
33989371c9d4SSatish Balay       ij[3] = 7 * i + 3;
33999371c9d4SSatish Balay       ij[4] = 7 * i + 4;
34009371c9d4SSatish Balay       ij[5] = 7 * i + 5;
3401cdd8bf47SJunchao Zhang       ij[6] = 7 * i + 6;
34029566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
34039566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
34047b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34059566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3406bbead8a2SBarry Smith       diag += 49;
3407bbead8a2SBarry Smith     }
3408bbead8a2SBarry Smith     break;
3409bbead8a2SBarry Smith   default:
34109566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3411bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3412ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
34139566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
34149566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
34157b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
34169566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3417bbead8a2SBarry Smith       diag += bs2;
3418bbead8a2SBarry Smith     }
34199566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3420bbead8a2SBarry Smith   }
3421bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
34223ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3423bbead8a2SBarry Smith }
3424bbead8a2SBarry Smith 
3425d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3426d71ae5a4SJacob Faibussowitsch {
342773a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3428fff043a9SJunchao Zhang   PetscScalar a, *aa;
342973a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
343073a71a0fSBarry Smith 
343173a71a0fSBarry Smith   PetscFunctionBegin;
343273a71a0fSBarry Smith   if (!x->assembled) {
34339566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
343473a71a0fSBarry Smith     for (i = 0; i < m; i++) {
343573a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
34369566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
343773a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
34389566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
343973a71a0fSBarry Smith       }
344073a71a0fSBarry Smith     }
3441e2ce353bSJunchao Zhang   } else {
34429566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
34439566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
34449566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3445e2ce353bSJunchao Zhang   }
34469566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34479566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34483ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
344973a71a0fSBarry Smith }
345073a71a0fSBarry Smith 
3451679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3452d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3453d71ae5a4SJacob Faibussowitsch {
3454679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3455679944adSJunchao Zhang   PetscScalar a;
3456679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3457679944adSJunchao Zhang 
3458679944adSJunchao Zhang   PetscFunctionBegin;
3459679944adSJunchao Zhang   nskip = high - low;
34609566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3461679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3462679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3463679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
34649566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3465679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3466679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
34679566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3468679944adSJunchao Zhang     }
3469e2ce353bSJunchao Zhang   }
34709566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34719566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3473679944adSJunchao Zhang }
3474679944adSJunchao Zhang 
34750a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3476cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3477cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3478cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
347997304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34807c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34817c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3482f4259b30SLisandro Dalcin                                        NULL,
3483f4259b30SLisandro Dalcin                                        NULL,
3484f4259b30SLisandro Dalcin                                        NULL,
3485f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3486cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3487f4259b30SLisandro Dalcin                                        NULL,
348841f059aeSBarry Smith                                        MatSOR_SeqAIJ,
348991e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
349097304618SKris Buschelman                                        /*1 5*/ MatGetInfo_SeqAIJ,
3491cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3492cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3493cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3494cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3495f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3496cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3497cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3498cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3499d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3500f4259b30SLisandro Dalcin                                        NULL,
3501f4259b30SLisandro Dalcin                                        NULL,
3502f4259b30SLisandro Dalcin                                        NULL,
3503f4259b30SLisandro Dalcin                                        NULL,
350426cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
3505f4259b30SLisandro Dalcin                                        NULL,
3506f4259b30SLisandro Dalcin                                        NULL,
3507f4259b30SLisandro Dalcin                                        NULL,
3508f4259b30SLisandro Dalcin                                        NULL,
3509d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3510f4259b30SLisandro Dalcin                                        NULL,
3511f4259b30SLisandro Dalcin                                        NULL,
3512cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3513f4259b30SLisandro Dalcin                                        NULL,
3514d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
35157dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3516cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3517cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3518cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3519d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3520cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
35217d68702bSBarry Smith                                        MatShift_SeqAIJ,
352279299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
35236e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
352473a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
35253b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
35263b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
35273b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3528a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
352993dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3530f4259b30SLisandro Dalcin                                        NULL,
3531f4259b30SLisandro Dalcin                                        NULL,
3532cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3533f4259b30SLisandro Dalcin                                        NULL,
3534f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3535b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3536b9b97703SBarry Smith                                        MatView_SeqAIJ,
3537f4259b30SLisandro Dalcin                                        NULL,
3538f4259b30SLisandro Dalcin                                        NULL,
3539f4259b30SLisandro Dalcin                                        /* 64*/ NULL,
3540321b30b9SSatish Balay                                        MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3541f4259b30SLisandro Dalcin                                        NULL,
3542f4259b30SLisandro Dalcin                                        NULL,
3543f4259b30SLisandro Dalcin                                        NULL,
3544d519adbfSMatthew Knepley                                        /* 69*/ MatGetRowMaxAbs_SeqAIJ,
3545c87e5d42SMatthew Knepley                                        MatGetRowMinAbs_SeqAIJ,
3546f4259b30SLisandro Dalcin                                        NULL,
3547f4259b30SLisandro Dalcin                                        NULL,
3548f4259b30SLisandro Dalcin                                        NULL,
3549f4259b30SLisandro Dalcin                                        /* 74*/ NULL,
35503acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3551f4259b30SLisandro Dalcin                                        NULL,
3552f4259b30SLisandro Dalcin                                        NULL,
3553f4259b30SLisandro Dalcin                                        NULL,
35546ce1633cSBarry Smith                                        /* 79*/ MatFindZeroDiagonals_SeqAIJ,
3555f4259b30SLisandro Dalcin                                        NULL,
3556f4259b30SLisandro Dalcin                                        NULL,
3557f4259b30SLisandro Dalcin                                        NULL,
3558bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
35596cff0a6bSPierre Jolivet                                        /* 84*/ NULL,
35606cff0a6bSPierre Jolivet                                        NULL,
3561f4259b30SLisandro Dalcin                                        NULL,
3562f4259b30SLisandro Dalcin                                        NULL,
3563f4259b30SLisandro Dalcin                                        NULL,
3564f4259b30SLisandro Dalcin                                        /* 89*/ NULL,
3565f4259b30SLisandro Dalcin                                        NULL,
356626be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
3567f4259b30SLisandro Dalcin                                        NULL,
3568f4259b30SLisandro Dalcin                                        NULL,
35698fa4b5a6SHong Zhang                                        /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3570f4259b30SLisandro Dalcin                                        NULL,
3571f4259b30SLisandro Dalcin                                        NULL,
35726fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
3573f4259b30SLisandro Dalcin                                        NULL,
35744222ddf1SHong Zhang                                        /* 99*/ MatProductSetFromOptions_SeqAIJ,
3575f4259b30SLisandro Dalcin                                        NULL,
3576f4259b30SLisandro Dalcin                                        NULL,
357787d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
3578f4259b30SLisandro Dalcin                                        NULL,
3579d519adbfSMatthew Knepley                                        /*104*/ MatSetValuesRow_SeqAIJ,
358099cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3581f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3582f4259b30SLisandro Dalcin                                        NULL,
3583f4259b30SLisandro Dalcin                                        NULL,
3584cbd44569SHong Zhang                                        /*109*/ MatMatSolve_SeqAIJ,
3585f4259b30SLisandro Dalcin                                        NULL,
35862af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3587f4259b30SLisandro Dalcin                                        NULL,
3588599ef60dSHong Zhang                                        MatMissingDiagonal_SeqAIJ,
3589f4259b30SLisandro Dalcin                                        /*114*/ NULL,
3590f4259b30SLisandro Dalcin                                        NULL,
3591f4259b30SLisandro Dalcin                                        NULL,
3592f4259b30SLisandro Dalcin                                        NULL,
3593f4259b30SLisandro Dalcin                                        NULL,
3594f4259b30SLisandro Dalcin                                        /*119*/ NULL,
3595f4259b30SLisandro Dalcin                                        NULL,
3596f4259b30SLisandro Dalcin                                        NULL,
3597f4259b30SLisandro Dalcin                                        NULL,
3598b3a44c85SBarry Smith                                        MatGetMultiProcBlock_SeqAIJ,
35990716a85fSBarry Smith                                        /*124*/ MatFindNonzeroRows_SeqAIJ,
3600a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
360137868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
36020da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
3603f4259b30SLisandro Dalcin                                        NULL,
3604f4259b30SLisandro Dalcin                                        /*129*/ NULL,
3605f4259b30SLisandro Dalcin                                        NULL,
3606f4259b30SLisandro Dalcin                                        NULL,
360775648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3608b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
3609b9af6bddSHong Zhang                                        /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
36102b8ad9a3SHong Zhang                                        MatTransColoringApplyDenToSp_SeqAIJ,
3611f4259b30SLisandro Dalcin                                        NULL,
3612f4259b30SLisandro Dalcin                                        NULL,
36133964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
3614f4259b30SLisandro Dalcin                                        /*139*/ NULL,
3615f4259b30SLisandro Dalcin                                        NULL,
3616f4259b30SLisandro Dalcin                                        NULL,
36173a062f41SBarry Smith                                        MatFDColoringSetUp_SeqXAIJ,
36189c8f2541SHong Zhang                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
36194222ddf1SHong Zhang                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
36204222ddf1SHong Zhang                                        /*145*/ MatDestroySubMatrices_SeqAIJ,
3621f4259b30SLisandro Dalcin                                        NULL,
362272833a62Smarkadams4                                        NULL,
362372833a62Smarkadams4                                        MatCreateGraph_Simple_AIJ,
36242d776b49SBarry Smith                                        NULL,
3625dec0b466SHong Zhang                                        /*150*/ MatTransposeSymbolic_SeqAIJ,
3626eede4a3fSMark Adams                                        MatEliminateZeros_SeqAIJ,
36274cc2b5b5SPierre Jolivet                                        MatGetRowSumAbs_SeqAIJ,
362842ce410bSJunchao Zhang                                        NULL,
362942ce410bSJunchao Zhang                                        NULL,
36304cc2b5b5SPierre Jolivet                                        NULL};
363117ab2063SBarry Smith 
3632ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3633d71ae5a4SJacob Faibussowitsch {
3634bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
363597f1f81fSBarry Smith   PetscInt    i, nz, n;
3636bef8e0ddSBarry Smith 
3637bef8e0ddSBarry Smith   PetscFunctionBegin;
3638bef8e0ddSBarry Smith   nz = aij->maxnz;
3639d0f46423SBarry Smith   n  = mat->rmap->n;
3640ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3641bef8e0ddSBarry Smith   aij->nz = nz;
3642ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
36433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3644bef8e0ddSBarry Smith }
3645bef8e0ddSBarry Smith 
3646a3bb6f32SFande Kong /*
3647ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3648ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3649ddea5d60SJunchao Zhang  */
3650d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3651d71ae5a4SJacob Faibussowitsch {
3652a3bb6f32SFande Kong   Mat_SeqAIJ   *aij = (Mat_SeqAIJ *)mat->data;
3653eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1;
3654eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
365525b670f0SStefano Zampini   PetscInt      gid, lid, i, ec, nz = aij->nz;
365625b670f0SStefano Zampini   PetscInt     *garray, *jj = aij->j;
3657a3bb6f32SFande Kong 
3658a3bb6f32SFande Kong   PetscFunctionBegin;
3659a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
36604f572ea9SToby Isaac   PetscAssertPointer(mapping, 2);
3661a3bb6f32SFande Kong   /* use a table */
3662eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1));
3663a3bb6f32SFande Kong   ec = 0;
366425b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
366525b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
3666eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
3667a3bb6f32SFande Kong     if (!data) {
3668a3bb6f32SFande Kong       /* one based table */
3669c76ffc5fSJacob Faibussowitsch       PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec));
3670a3bb6f32SFande Kong     }
3671a3bb6f32SFande Kong   }
3672a3bb6f32SFande Kong   /* form array of columns we need */
36739566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
3674eec179cfSJacob Faibussowitsch   PetscHashIterBegin(gid1_lid1, tpos);
3675eec179cfSJacob Faibussowitsch   while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
3676eec179cfSJacob Faibussowitsch     PetscHashIterGetKey(gid1_lid1, tpos, gid);
3677eec179cfSJacob Faibussowitsch     PetscHashIterGetVal(gid1_lid1, tpos, lid);
3678eec179cfSJacob Faibussowitsch     PetscHashIterNext(gid1_lid1, tpos);
3679a3bb6f32SFande Kong     gid--;
3680a3bb6f32SFande Kong     lid--;
3681a3bb6f32SFande Kong     garray[lid] = gid;
3682a3bb6f32SFande Kong   }
36839566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
3684eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIClear(gid1_lid1));
3685c76ffc5fSJacob Faibussowitsch   for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1));
3686a3bb6f32SFande Kong   /* compact out the extra columns in B */
368725b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
368825b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
3689eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
3690a3bb6f32SFande Kong     lid--;
369125b670f0SStefano Zampini     jj[i] = lid;
3692a3bb6f32SFande Kong   }
36939566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
3694eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&gid1_lid1));
36959566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
36969566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
36979566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
36983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3699a3bb6f32SFande Kong }
3700a3bb6f32SFande Kong 
3701bef8e0ddSBarry Smith /*@
3702bef8e0ddSBarry Smith   MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3703bef8e0ddSBarry Smith   in the matrix.
3704bef8e0ddSBarry Smith 
3705bef8e0ddSBarry Smith   Input Parameters:
370611a5261eSBarry Smith + mat     - the `MATSEQAIJ` matrix
3707bef8e0ddSBarry Smith - indices - the column indices
3708bef8e0ddSBarry Smith 
370915091d37SBarry Smith   Level: advanced
371015091d37SBarry Smith 
3711bef8e0ddSBarry Smith   Notes:
3712bef8e0ddSBarry Smith   This can be called if you have precomputed the nonzero structure of the
3713bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
371411a5261eSBarry Smith   of the `MatSetValues()` operation.
3715bef8e0ddSBarry Smith 
3716bef8e0ddSBarry Smith   You MUST have set the correct numbers of nonzeros per row in the call to
371711a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the column indices MUST be sorted.
3718bef8e0ddSBarry Smith 
371911a5261eSBarry Smith   MUST be called before any calls to `MatSetValues()`
3720bef8e0ddSBarry Smith 
3721b9617806SBarry Smith   The indices should start with zero, not one.
3722b9617806SBarry Smith 
37231cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`, `MatCreateSeqAIJ()`, `MatSeqAIJSetPreallocation()`, `MatSetValues()`
3724bef8e0ddSBarry Smith @*/
3725d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3726d71ae5a4SJacob Faibussowitsch {
3727bef8e0ddSBarry Smith   PetscFunctionBegin;
37280700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
37294f572ea9SToby Isaac   PetscAssertPointer(indices, 2);
3730cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
37313ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3732bef8e0ddSBarry Smith }
3733bef8e0ddSBarry Smith 
3734ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3735d71ae5a4SJacob Faibussowitsch {
3736be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3737d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3738be6bf707SBarry Smith 
3739be6bf707SBarry Smith   PetscFunctionBegin;
374028b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3741be6bf707SBarry Smith 
3742be6bf707SBarry Smith   /* allocate space for values if not already there */
37434dfa11a4SJacob Faibussowitsch   if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }
3744be6bf707SBarry Smith 
3745be6bf707SBarry Smith   /* copy values over */
37469566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
37473ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3748be6bf707SBarry Smith }
3749be6bf707SBarry Smith 
3750be6bf707SBarry Smith /*@
375120f4b53cSBarry Smith   MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
3752be6bf707SBarry Smith   nonlinear portion.
3753be6bf707SBarry Smith 
3754c3339decSBarry Smith   Logically Collective
3755be6bf707SBarry Smith 
375627430b45SBarry Smith   Input Parameter:
375711a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3758be6bf707SBarry Smith 
375915091d37SBarry Smith   Level: advanced
376015091d37SBarry Smith 
37612920cce0SJacob Faibussowitsch   Example Usage:
376227430b45SBarry Smith .vb
37632ef1f0ffSBarry Smith     Using SNES
376427430b45SBarry Smith     Create Jacobian matrix
376527430b45SBarry Smith     Set linear terms into matrix
376627430b45SBarry Smith     Apply boundary conditions to matrix, at this time matrix must have
376727430b45SBarry Smith       final nonzero structure (i.e. setting the nonlinear terms and applying
376827430b45SBarry Smith       boundary conditions again will not change the nonzero structure)
376927430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
377027430b45SBarry Smith     MatStoreValues(mat);
377127430b45SBarry Smith     Call SNESSetJacobian() with matrix
377227430b45SBarry Smith     In your Jacobian routine
377327430b45SBarry Smith       MatRetrieveValues(mat);
377427430b45SBarry Smith       Set nonlinear terms in matrix
3775be6bf707SBarry Smith 
377627430b45SBarry Smith     Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
377727430b45SBarry Smith     // build linear portion of Jacobian
377827430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
377927430b45SBarry Smith     MatStoreValues(mat);
378027430b45SBarry Smith     loop over nonlinear iterations
378127430b45SBarry Smith        MatRetrieveValues(mat);
378227430b45SBarry Smith        // call MatSetValues(mat,...) to set nonlinear portion of Jacobian
378327430b45SBarry Smith        // call MatAssemblyBegin/End() on matrix
378427430b45SBarry Smith        Solve linear system with Jacobian
378527430b45SBarry Smith     endloop
378627430b45SBarry Smith .ve
3787be6bf707SBarry Smith 
3788be6bf707SBarry Smith   Notes:
3789da81f932SPierre Jolivet   Matrix must already be assembled before calling this routine
379011a5261eSBarry Smith   Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3791be6bf707SBarry Smith   calling this routine.
3792be6bf707SBarry Smith 
37930c468ba9SBarry Smith   When this is called multiple times it overwrites the previous set of stored values
37940c468ba9SBarry Smith   and does not allocate additional space.
37950c468ba9SBarry Smith 
3796fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
3797be6bf707SBarry Smith @*/
3798d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3799d71ae5a4SJacob Faibussowitsch {
3800be6bf707SBarry Smith   PetscFunctionBegin;
38010700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
380228b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
380328b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3804cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
38053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3806be6bf707SBarry Smith }
3807be6bf707SBarry Smith 
3808ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3809d71ae5a4SJacob Faibussowitsch {
3810be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3811d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3812be6bf707SBarry Smith 
3813be6bf707SBarry Smith   PetscFunctionBegin;
381428b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
381528b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3816be6bf707SBarry Smith   /* copy values over */
38179566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
38183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3819be6bf707SBarry Smith }
3820be6bf707SBarry Smith 
3821be6bf707SBarry Smith /*@
382220f4b53cSBarry Smith   MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`
3823be6bf707SBarry Smith 
3824c3339decSBarry Smith   Logically Collective
3825be6bf707SBarry Smith 
38262fe279fdSBarry Smith   Input Parameter:
382711a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3828be6bf707SBarry Smith 
382915091d37SBarry Smith   Level: advanced
383015091d37SBarry Smith 
38311cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
3832be6bf707SBarry Smith @*/
3833d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3834d71ae5a4SJacob Faibussowitsch {
3835be6bf707SBarry Smith   PetscFunctionBegin;
38360700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
383728b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
383828b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3839cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
38403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3841be6bf707SBarry Smith }
3842be6bf707SBarry Smith 
38435d83a8b1SBarry Smith /*@
384411a5261eSBarry Smith   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
38450d15e28bSLois Curfman McInnes   (the default parallel PETSc format).  For good matrix assembly performance
384620f4b53cSBarry Smith   the user should preallocate the matrix storage by setting the parameter `nz`
384720f4b53cSBarry Smith   (or the array `nnz`).
384817ab2063SBarry Smith 
3849d083f849SBarry Smith   Collective
3850db81eaa0SLois Curfman McInnes 
385117ab2063SBarry Smith   Input Parameters:
385211a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF`
385317ab2063SBarry Smith . m    - number of rows
385417ab2063SBarry Smith . n    - number of columns
385517ab2063SBarry Smith . nz   - number of nonzeros per row (same for all rows)
385651c19458SBarry Smith - nnz  - array containing the number of nonzeros in the various rows
38570298fd71SBarry Smith          (possibly different for each row) or `NULL`
385817ab2063SBarry Smith 
385917ab2063SBarry Smith   Output Parameter:
3860416022c9SBarry Smith . A - the matrix
386117ab2063SBarry Smith 
38622ef1f0ffSBarry Smith   Options Database Keys:
38632ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
38642ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38652ef1f0ffSBarry Smith 
38662ef1f0ffSBarry Smith   Level: intermediate
3867175b88e8SBarry Smith 
3868b259b22eSLois Curfman McInnes   Notes:
386977433607SBarry Smith   It is recommended to use `MatCreateFromOptions()` instead of this routine
387077433607SBarry Smith 
38712ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
387249a6f317SBarry Smith 
38732ef1f0ffSBarry Smith   The `MATSEQAIJ` format, also called
38742ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
38750002213bSLois Curfman McInnes   storage.  That is, the stored row and column indices can begin at
38762ef1f0ffSBarry Smith   either one (as in Fortran) or zero.
387717ab2063SBarry Smith 
387820f4b53cSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
38792ef1f0ffSBarry Smith   Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
388020f4b53cSBarry Smith   allocation.
388117ab2063SBarry Smith 
3882682d7d0cSBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
38834fca80b9SLois Curfman McInnes   improve numerical efficiency of matrix-vector products and solves. We
3884682d7d0cSBarry Smith   search for consecutive rows with the same nonzero structure, thereby
38856c7ebb05SLois Curfman McInnes   reusing matrix information to achieve increased efficiency.
38866c7ebb05SLois Curfman McInnes 
38871cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
388817ab2063SBarry Smith @*/
3889d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3890d71ae5a4SJacob Faibussowitsch {
38913a40ed3dSBarry Smith   PetscFunctionBegin;
38929566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
38939566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
38949566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
38959566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
38963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3897273d9f13SBarry Smith }
3898273d9f13SBarry Smith 
38995d83a8b1SBarry Smith /*@
3900273d9f13SBarry Smith   MatSeqAIJSetPreallocation - For good matrix assembly performance
3901273d9f13SBarry Smith   the user should preallocate the matrix storage by setting the parameter `nz`
3902273d9f13SBarry Smith   (or the array `nnz`).  By setting these parameters accurately, performance
3903273d9f13SBarry Smith   during matrix assembly can be increased by more than a factor of 50.
3904273d9f13SBarry Smith 
3905d083f849SBarry Smith   Collective
3906273d9f13SBarry Smith 
3907273d9f13SBarry Smith   Input Parameters:
39081c4f3114SJed Brown + B   - The matrix
3909273d9f13SBarry Smith . nz  - number of nonzeros per row (same for all rows)
3910273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows
39110298fd71SBarry Smith          (possibly different for each row) or `NULL`
3912273d9f13SBarry Smith 
39132ef1f0ffSBarry Smith   Options Database Keys:
39142ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
39152ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
39162ef1f0ffSBarry Smith 
39172ef1f0ffSBarry Smith   Level: intermediate
39182ef1f0ffSBarry Smith 
3919273d9f13SBarry Smith   Notes:
39202ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
392149a6f317SBarry Smith 
392211a5261eSBarry Smith   The `MATSEQAIJ` format, also called
39232ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
3924273d9f13SBarry Smith   storage.  That is, the stored row and column indices can begin at
3925273d9f13SBarry Smith   either one (as in Fortran) or zero.  See the users' manual for details.
3926273d9f13SBarry Smith 
39272ef1f0ffSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
39282ef1f0ffSBarry Smith   Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
39292ef1f0ffSBarry Smith   allocation.
3930273d9f13SBarry Smith 
393111a5261eSBarry Smith   You can call `MatGetInfo()` to get information on how effective the preallocation was;
3932aa95bbe8SBarry Smith   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3933aa95bbe8SBarry Smith   You can also run with the option -info and look for messages with the string
3934aa95bbe8SBarry Smith   malloc in them to see if additional memory allocation was needed.
3935aa95bbe8SBarry Smith 
393611a5261eSBarry Smith   Developer Notes:
393711a5261eSBarry Smith   Use `nz` of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3938a96a251dSBarry Smith   entries or column indices
3939a96a251dSBarry Smith 
3940273d9f13SBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
3941273d9f13SBarry Smith   improve numerical efficiency of matrix-vector products and solves. We
3942273d9f13SBarry Smith   search for consecutive rows with the same nonzero structure, thereby
3943273d9f13SBarry Smith   reusing matrix information to achieve increased efficiency.
3944273d9f13SBarry Smith 
39451cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3946db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3947273d9f13SBarry Smith @*/
3948d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3949d71ae5a4SJacob Faibussowitsch {
3950a23d5eceSKris Buschelman   PetscFunctionBegin;
39516ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
39526ba663aaSJed Brown   PetscValidType(B, 1);
3953cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
39543ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3955a23d5eceSKris Buschelman }
3956a23d5eceSKris Buschelman 
3957d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3958d71ae5a4SJacob Faibussowitsch {
3959ad79cf63SBarry Smith   Mat_SeqAIJ *b              = (Mat_SeqAIJ *)B->data;
39602576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
396197f1f81fSBarry Smith   PetscInt    i;
3962273d9f13SBarry Smith 
3963273d9f13SBarry Smith   PetscFunctionBegin;
3964ad79cf63SBarry Smith   if (B->hash_active) {
3965aea10558SJacob Faibussowitsch     B->ops[0] = b->cops;
3966ad79cf63SBarry Smith     PetscCall(PetscHMapIJVDestroy(&b->ht));
3967ad79cf63SBarry Smith     PetscCall(PetscFree(b->dnz));
3968ad79cf63SBarry Smith     B->hash_active = PETSC_FALSE;
3969ad79cf63SBarry Smith   }
39702576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3971a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3972c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3973c461c341SBarry Smith     nz             = 0;
3974c461c341SBarry Smith   }
39759566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
39769566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3977899cda47SBarry Smith 
3978435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
397908401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
39809f0612e4SBarry Smith   if (nnz) {
3981d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
398208401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
398308401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3984b73539f3SBarry Smith     }
3985b73539f3SBarry Smith   }
3986b73539f3SBarry Smith 
3987273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
3988ab93d7beSBarry Smith   if (!skipallocation) {
39894dfa11a4SJacob Faibussowitsch     if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); }
3990071fcb05SBarry Smith     if (!b->ilen) {
3991071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
39929566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
3993071fcb05SBarry Smith     } else {
39949566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
39952ee49352SLisandro Dalcin     }
3996aa624791SPierre Jolivet     if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre));
3997273d9f13SBarry Smith     if (!nnz) {
3998435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
3999c62bd62aSJed Brown       else if (nz < 0) nz = 1;
40005d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
4001d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
4002c43c4a61SBarry Smith       PetscCall(PetscIntMultError(nz, B->rmap->n, &nz));
4003273d9f13SBarry Smith     } else {
4004c73702f5SBarry Smith       PetscInt64 nz64 = 0;
40059371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
40069371c9d4SSatish Balay         b->imax[i] = nnz[i];
40079371c9d4SSatish Balay         nz64 += nnz[i];
40089371c9d4SSatish Balay       }
40099566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
4010273d9f13SBarry Smith     }
4011ab93d7beSBarry Smith 
4012273d9f13SBarry Smith     /* allocate the matrix space */
40139566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
40149f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j));
40159f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i));
40169f0612e4SBarry Smith     b->free_ij = PETSC_TRUE;
4017396832f4SHong Zhang     if (B->structure_only) {
40189f0612e4SBarry Smith       b->free_a = PETSC_FALSE;
4019396832f4SHong Zhang     } else {
40209f0612e4SBarry Smith       PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a));
40219f0612e4SBarry Smith       b->free_a = PETSC_TRUE;
4022396832f4SHong Zhang     }
4023bfeeae90SHong Zhang     b->i[0] = 0;
4024ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
4025c461c341SBarry Smith   } else {
4026e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
4027e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
4028c461c341SBarry Smith   }
4029273d9f13SBarry Smith 
4030846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
4031846b4da1SFande Kong     /* reserve user-requested sparsity */
40329566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
4033846b4da1SFande Kong   }
4034846b4da1SFande Kong 
4035273d9f13SBarry Smith   b->nz               = 0;
4036273d9f13SBarry Smith   b->maxnz            = nz;
4037273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
40381baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
4039cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
4040cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
40415519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
40425519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
40435519a089SJose E. Roman   */
40445519a089SJose E. Roman   B->nonzerostate++;
40453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4046273d9f13SBarry Smith }
4047273d9f13SBarry Smith 
4048ba38deedSJacob Faibussowitsch static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
4049d71ae5a4SJacob Faibussowitsch {
4050846b4da1SFande Kong   Mat_SeqAIJ *a;
4051a5bbaf83SFande Kong   PetscInt    i;
40521f14be2bSBarry Smith   PetscBool   skipreset;
4053846b4da1SFande Kong 
4054846b4da1SFande Kong   PetscFunctionBegin;
4055846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
405614d0e64fSAlex Lindsay 
405714d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
40583ba16761SJacob Faibussowitsch   if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS);
405914d0e64fSAlex Lindsay 
4060846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
40612c814fdeSFande Kong   /* if no saved info, we error out */
406228b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
40632c814fdeSFande Kong 
40641f14be2bSBarry Smith   PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation ");
40652c814fdeSFande Kong 
40661f14be2bSBarry Smith   PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset));
40671f14be2bSBarry Smith   if (!skipreset) {
40689566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
40699566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
4070846b4da1SFande Kong     a->i[0] = 0;
4071ad540459SPierre Jolivet     for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
4072846b4da1SFande Kong     A->preallocated     = PETSC_TRUE;
4073846b4da1SFande Kong     a->nz               = 0;
4074846b4da1SFande Kong     a->maxnz            = a->i[A->rmap->n];
4075846b4da1SFande Kong     A->info.nz_unneeded = (double)a->maxnz;
4076846b4da1SFande Kong     A->was_assembled    = PETSC_FALSE;
4077846b4da1SFande Kong     A->assembled        = PETSC_FALSE;
40781f14be2bSBarry Smith   }
40793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4080846b4da1SFande Kong }
4081846b4da1SFande Kong 
408258d36128SBarry Smith /*@
408311a5261eSBarry Smith   MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4084a1661176SMatthew Knepley 
4085a1661176SMatthew Knepley   Input Parameters:
4086a1661176SMatthew Knepley + B - the matrix
4087d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero)
4088d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row
4089d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided
4090a1661176SMatthew Knepley 
4091a1661176SMatthew Knepley   Level: developer
4092a1661176SMatthew Knepley 
40936a9b8d82SBarry Smith   Notes:
40942ef1f0ffSBarry Smith   The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
409558d36128SBarry Smith 
40966a9b8d82SBarry Smith   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
40976a9b8d82SBarry Smith   structure will be the union of all the previous nonzero structures.
40986a9b8d82SBarry Smith 
40996a9b8d82SBarry Smith   Developer Notes:
41002ef1f0ffSBarry Smith   An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and
41012ef1f0ffSBarry Smith   then just copies the `v` values directly with `PetscMemcpy()`.
41026a9b8d82SBarry Smith 
410311a5261eSBarry Smith   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
41046a9b8d82SBarry Smith 
4105fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()`
4106a1661176SMatthew Knepley @*/
4107d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4108d71ae5a4SJacob Faibussowitsch {
4109a1661176SMatthew Knepley   PetscFunctionBegin;
41100700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
41116ba663aaSJed Brown   PetscValidType(B, 1);
4112cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
41133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4114a1661176SMatthew Knepley }
4115a1661176SMatthew Knepley 
4116ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4117d71ae5a4SJacob Faibussowitsch {
4118a1661176SMatthew Knepley   PetscInt  i;
4119a1661176SMatthew Knepley   PetscInt  m, n;
4120a1661176SMatthew Knepley   PetscInt  nz;
41216a9b8d82SBarry Smith   PetscInt *nnz;
4122a1661176SMatthew Knepley 
4123a1661176SMatthew Knepley   PetscFunctionBegin;
4124aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4125779a8d59SSatish Balay 
41269566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
41279566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4128779a8d59SSatish Balay 
41299566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
41309566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4131a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4132b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
413308401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4134a1661176SMatthew Knepley     nnz[i] = nz;
4135a1661176SMatthew Knepley   }
41369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
41379566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4138a1661176SMatthew Knepley 
41398e3a54c0SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES));
4140a1661176SMatthew Knepley 
41419566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
41429566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4143a1661176SMatthew Knepley 
41449566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
41453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4146a1661176SMatthew Knepley }
4147a1661176SMatthew Knepley 
4148ad7e164aSPierre Jolivet /*@
41492ef1f0ffSBarry Smith   MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`.
4150ad7e164aSPierre Jolivet 
4151ad7e164aSPierre Jolivet   Input Parameters:
4152ad7e164aSPierre Jolivet + A     - left-hand side matrix
4153ad7e164aSPierre Jolivet . B     - right-hand side matrix
415411a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4155ad7e164aSPierre Jolivet 
4156ad7e164aSPierre Jolivet   Output Parameter:
41572ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B`
4158ad7e164aSPierre Jolivet 
4159ad7e164aSPierre Jolivet   Level: intermediate
4160ad7e164aSPierre Jolivet 
416111a5261eSBarry Smith   Note:
  `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from the last call to `MatSeqAIJKron()`.
4163ad7e164aSPierre Jolivet 
41641cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4165ad7e164aSPierre Jolivet @*/
4166d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4167d71ae5a4SJacob Faibussowitsch {
4168ad7e164aSPierre Jolivet   PetscFunctionBegin;
4169ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4170ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4171ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4172ad7e164aSPierre Jolivet   PetscValidType(B, 2);
41734f572ea9SToby Isaac   PetscAssertPointer(C, 4);
4174ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4175ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4176ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4177ad7e164aSPierre Jolivet   }
4178cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
41793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4180ad7e164aSPierre Jolivet }
4181ad7e164aSPierre Jolivet 
4182ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4183d71ae5a4SJacob Faibussowitsch {
4184ad7e164aSPierre Jolivet   Mat                newmat;
4185ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4186ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4187ad7e164aSPierre Jolivet   PetscScalar       *v;
4188fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4189ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4190ad7e164aSPierre Jolivet   PetscBool          flg;
4191ad7e164aSPierre Jolivet 
4192ad7e164aSPierre Jolivet   PetscFunctionBegin;
419328b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
419428b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
419528b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
419628b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
41979566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
419828b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4199aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4200ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
42019566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
42029566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
42039566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
42049566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4205ad7e164aSPierre Jolivet     i[0] = 0;
4206ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4207ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4208ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4209ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4210ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4211ad7e164aSPierre Jolivet         }
4212ad7e164aSPierre Jolivet       }
4213ad7e164aSPierre Jolivet     }
42149566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4215ad7e164aSPierre Jolivet     *C = newmat;
42169566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4217ad7e164aSPierre Jolivet     nnz = 0;
4218ad7e164aSPierre Jolivet   }
42199566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
42209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
42219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4222ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4223ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4224ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4225ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4226ad7e164aSPierre Jolivet       }
4227ad7e164aSPierre Jolivet     }
4228ad7e164aSPierre Jolivet   }
42299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
42309566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
42319566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
42323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4233ad7e164aSPierre Jolivet }
4234ad7e164aSPierre Jolivet 
4235c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4236af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4237170fe5c8SBarry Smith 
4238170fe5c8SBarry Smith /*
4239170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4240170fe5c8SBarry Smith 
4241170fe5c8SBarry Smith                n                       p                          p
42422da392ccSBarry Smith         [             ]       [             ]         [                 ]
42432da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
42442da392ccSBarry Smith         [             ]       [             ]         [                 ]
4245170fe5c8SBarry Smith 
4246170fe5c8SBarry Smith */
4247d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4248d71ae5a4SJacob Faibussowitsch {
4249170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4250170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4251170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
425286214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4253170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4254170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4255170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
425686214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
425786214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4258170fe5c8SBarry Smith 
4259170fe5c8SBarry Smith   PetscFunctionBegin;
4260d0f46423SBarry Smith   m = A->rmap->n;
4261d0f46423SBarry Smith   n = A->cmap->n;
4262d0f46423SBarry Smith   p = B->cmap->n;
4263170fe5c8SBarry Smith   a = sub_a->v;
4264170fe5c8SBarry Smith   b = sub_b->a;
4265170fe5c8SBarry Smith   c = sub_c->v;
426686214ceeSStefano Zampini   if (clda == m) {
42679566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
426886214ceeSStefano Zampini   } else {
426986214ceeSStefano Zampini     for (j = 0; j < p; j++)
42709371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
427186214ceeSStefano Zampini   }
4272170fe5c8SBarry Smith   ii  = sub_b->i;
4273170fe5c8SBarry Smith   idx = sub_b->j;
4274170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4275170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4276170fe5c8SBarry Smith     while (q-- > 0) {
427786214ceeSStefano Zampini       c_q = c + clda * (*idx);
427886214ceeSStefano Zampini       a_q = a + alda * i;
4279854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4280170fe5c8SBarry Smith       idx++;
4281170fe5c8SBarry Smith       b++;
4282170fe5c8SBarry Smith     }
4283170fe5c8SBarry Smith   }
42843ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4285170fe5c8SBarry Smith }
4286170fe5c8SBarry Smith 
4287d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4288d71ae5a4SJacob Faibussowitsch {
4289d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
429086214ceeSStefano Zampini   PetscBool cisdense;
4291170fe5c8SBarry Smith 
4292170fe5c8SBarry Smith   PetscFunctionBegin;
429308401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
42949566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
42959566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
4296d5e393b6SSuyash Tandon   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, ""));
429748a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
42989566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4299d73949e8SHong Zhang 
43004222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
43013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4302170fe5c8SBarry Smith }
4303170fe5c8SBarry Smith 
43040bad9183SKris Buschelman /*MC
4305fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
43060bad9183SKris Buschelman    based on compressed sparse row format.
43070bad9183SKris Buschelman 
43082ef1f0ffSBarry Smith    Options Database Key:
43090bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
43100bad9183SKris Buschelman 
43110bad9183SKris Buschelman    Level: beginner
43120bad9183SKris Buschelman 
43130cd7f59aSBarry Smith    Notes:
43142ef1f0ffSBarry Smith     `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values,
43150cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
43160cd7f59aSBarry Smith     in the matrix
43170cd7f59aSBarry Smith 
    `MatSetOption`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored
43200cd7f59aSBarry Smith 
432111a5261eSBarry Smith   Developer Note:
43222ef1f0ffSBarry Smith     It would be nice if all matrix formats supported passing `NULL` in for the numerical values
43230cd7f59aSBarry Smith 
43241cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
43250bad9183SKris Buschelman M*/
43260bad9183SKris Buschelman 
4327ccd284c7SBarry Smith /*MC
4328ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4329ccd284c7SBarry Smith 
433011a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
433111a5261eSBarry Smith    and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
433211a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4333ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4334ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4335ccd284c7SBarry Smith 
43362ef1f0ffSBarry Smith    Options Database Key:
433711a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`
4338ccd284c7SBarry Smith 
43392ef1f0ffSBarry Smith   Level: beginner
43402ef1f0ffSBarry Smith 
434111a5261eSBarry Smith    Note:
434211a5261eSBarry Smith    Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, `MATAIJCRL`, and also automatically switches over to use inodes when
4343ccd284c7SBarry Smith    enough exist.
4344ccd284c7SBarry Smith 
43451cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
4346ccd284c7SBarry Smith M*/
4347ccd284c7SBarry Smith 
4348ccd284c7SBarry Smith /*MC
4349ccd284c7SBarry Smith    MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.
4350ccd284c7SBarry Smith 
43512ef1f0ffSBarry Smith    Options Database Key:
43522ef1f0ffSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`
43532ef1f0ffSBarry Smith 
43542ef1f0ffSBarry Smith   Level: beginner
43552ef1f0ffSBarry Smith 
43562ef1f0ffSBarry Smith    Note:
435711a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
435811a5261eSBarry Smith    and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
435911a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4360ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4361ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4362ccd284c7SBarry Smith 
.seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
4364ccd284c7SBarry Smith M*/
4365ccd284c7SBarry Smith 
43667906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
43677906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
43687906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
43697906f579SHong Zhang #endif
4370d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
4371d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4372d24d4204SJose E. Roman #endif
43737906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
43747906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
43757906f579SHong Zhang #endif
43767906f579SHong Zhang 
4377d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4378c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
43794222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
43807906f579SHong Zhang 
43818c778c55SBarry Smith /*@C
438211a5261eSBarry Smith   MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
43838c778c55SBarry Smith 
43848c778c55SBarry Smith   Not Collective
43858c778c55SBarry Smith 
43868c778c55SBarry Smith   Input Parameter:
4387fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
43888c778c55SBarry Smith 
43898c778c55SBarry Smith   Output Parameter:
43908c778c55SBarry Smith . array - pointer to the data
43918c778c55SBarry Smith 
43928c778c55SBarry Smith   Level: intermediate
43938c778c55SBarry Smith 
4394fe59aa6dSJacob Faibussowitsch   Fortran Notes:
43950ab4885dSBarry Smith   `MatSeqAIJGetArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJGetArrayF90()`
43960ab4885dSBarry Smith 
43971cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
43988c778c55SBarry Smith @*/
43995d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[])
4400d71ae5a4SJacob Faibussowitsch {
4401d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44028c778c55SBarry Smith 
44038c778c55SBarry Smith   PetscFunctionBegin;
4404d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
44059566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4406d67d9f35SJunchao Zhang   } else {
4407d67d9f35SJunchao Zhang     *array = aij->a;
4408d67d9f35SJunchao Zhang   }
44093ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4410d67d9f35SJunchao Zhang }
4411d67d9f35SJunchao Zhang 
4412d67d9f35SJunchao Zhang /*@C
441311a5261eSBarry Smith   MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4414d67d9f35SJunchao Zhang 
4415d67d9f35SJunchao Zhang   Not Collective
4416d67d9f35SJunchao Zhang 
4417d67d9f35SJunchao Zhang   Input Parameters:
4418fe59aa6dSJacob Faibussowitsch + A     - a `MATSEQAIJ` matrix
4419d67d9f35SJunchao Zhang - array - pointer to the data
4420d67d9f35SJunchao Zhang 
4421d67d9f35SJunchao Zhang   Level: intermediate
4422d67d9f35SJunchao Zhang 
4423fe59aa6dSJacob Faibussowitsch   Fortran Notes:
44240ab4885dSBarry Smith   `MatSeqAIJRestoreArray()` Fortran binding is deprecated (since PETSc 3.19), use `MatSeqAIJRestoreArrayF90()`
44250ab4885dSBarry Smith 
44261cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()`
4427d67d9f35SJunchao Zhang @*/
44285d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[])
4429d71ae5a4SJacob Faibussowitsch {
4430d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4431d67d9f35SJunchao Zhang 
4432d67d9f35SJunchao Zhang   PetscFunctionBegin;
4433d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
44349566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4435d67d9f35SJunchao Zhang   } else {
4436d67d9f35SJunchao Zhang     *array = NULL;
4437d67d9f35SJunchao Zhang   }
44389566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
44399566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
44403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44418c778c55SBarry Smith }
44428c778c55SBarry Smith 
444321e72a00SBarry Smith /*@C
444411a5261eSBarry Smith   MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
44458f1ea47aSStefano Zampini 
44460ab4885dSBarry Smith   Not Collective; No Fortran Support
44478f1ea47aSStefano Zampini 
44488f1ea47aSStefano Zampini   Input Parameter:
4449fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44508f1ea47aSStefano Zampini 
44518f1ea47aSStefano Zampini   Output Parameter:
44528f1ea47aSStefano Zampini . array - pointer to the data
44538f1ea47aSStefano Zampini 
44548f1ea47aSStefano Zampini   Level: intermediate
44558f1ea47aSStefano Zampini 
44561cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
44578f1ea47aSStefano Zampini @*/
44585d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[])
4459d71ae5a4SJacob Faibussowitsch {
4460d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44618f1ea47aSStefano Zampini 
44628f1ea47aSStefano Zampini   PetscFunctionBegin;
4463d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
44649566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4465d67d9f35SJunchao Zhang   } else {
4466d67d9f35SJunchao Zhang     *array = aij->a;
4467d67d9f35SJunchao Zhang   }
44683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44698f1ea47aSStefano Zampini }
44708f1ea47aSStefano Zampini 
44718f1ea47aSStefano Zampini /*@C
447211a5261eSBarry Smith   MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
44738f1ea47aSStefano Zampini 
44740ab4885dSBarry Smith   Not Collective; No Fortran Support
44758f1ea47aSStefano Zampini 
44768f1ea47aSStefano Zampini   Input Parameter:
4477fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44788f1ea47aSStefano Zampini 
44798f1ea47aSStefano Zampini   Output Parameter:
44808f1ea47aSStefano Zampini . array - pointer to the data
44818f1ea47aSStefano Zampini 
44828f1ea47aSStefano Zampini   Level: intermediate
44838f1ea47aSStefano Zampini 
44841cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
44858f1ea47aSStefano Zampini @*/
44865d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[])
4487d71ae5a4SJacob Faibussowitsch {
4488d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44898f1ea47aSStefano Zampini 
44908f1ea47aSStefano Zampini   PetscFunctionBegin;
4491d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
44929566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4493d67d9f35SJunchao Zhang   } else {
4494d67d9f35SJunchao Zhang     *array = NULL;
4495d67d9f35SJunchao Zhang   }
44963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4497d67d9f35SJunchao Zhang }
4498d67d9f35SJunchao Zhang 
4499d67d9f35SJunchao Zhang /*@C
450011a5261eSBarry Smith   MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4501d67d9f35SJunchao Zhang 
45020ab4885dSBarry Smith   Not Collective; No Fortran Support
4503d67d9f35SJunchao Zhang 
4504d67d9f35SJunchao Zhang   Input Parameter:
4505fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
4506d67d9f35SJunchao Zhang 
4507d67d9f35SJunchao Zhang   Output Parameter:
4508d67d9f35SJunchao Zhang . array - pointer to the data
4509d67d9f35SJunchao Zhang 
4510d67d9f35SJunchao Zhang   Level: intermediate
4511d67d9f35SJunchao Zhang 
45121cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayWrite()`
4513d67d9f35SJunchao Zhang @*/
45145d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[])
4515d71ae5a4SJacob Faibussowitsch {
4516d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4517d67d9f35SJunchao Zhang 
4518d67d9f35SJunchao Zhang   PetscFunctionBegin;
4519d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
45209566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4521d67d9f35SJunchao Zhang   } else {
4522d67d9f35SJunchao Zhang     *array = aij->a;
4523d67d9f35SJunchao Zhang   }
45249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
45259566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
45263ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4527d67d9f35SJunchao Zhang }
4528d67d9f35SJunchao Zhang 
4529d67d9f35SJunchao Zhang /*@C
4530d67d9f35SJunchao Zhang   MatSeqAIJRestoreArrayWrite - restore the write-only access array obtained from `MatSeqAIJGetArrayWrite()`
4531d67d9f35SJunchao Zhang 
45320ab4885dSBarry Smith   Not Collective; No Fortran Support
4533d67d9f35SJunchao Zhang 
4534d67d9f35SJunchao Zhang   Input Parameter:
4535fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
4536d67d9f35SJunchao Zhang 
4537d67d9f35SJunchao Zhang   Output Parameter:
4538d67d9f35SJunchao Zhang . array - pointer to the data
4539d67d9f35SJunchao Zhang 
4540d67d9f35SJunchao Zhang   Level: intermediate
4541d67d9f35SJunchao Zhang 
45421cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayWrite()`
4543d67d9f35SJunchao Zhang @*/
45445d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[])
4545d71ae5a4SJacob Faibussowitsch {
4546d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4547d67d9f35SJunchao Zhang 
4548d67d9f35SJunchao Zhang   PetscFunctionBegin;
4549d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
45509566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4551d67d9f35SJunchao Zhang   } else {
4552d67d9f35SJunchao Zhang     *array = NULL;
4553d67d9f35SJunchao Zhang   }
45543ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45558f1ea47aSStefano Zampini }
45568f1ea47aSStefano Zampini 
45578f1ea47aSStefano Zampini /*@C
455811a5261eSBarry Smith   MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
45597ee59b9bSJunchao Zhang 
45600ab4885dSBarry Smith   Not Collective; No Fortran Support
45617ee59b9bSJunchao Zhang 
45627ee59b9bSJunchao Zhang   Input Parameter:
456311a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses
45647ee59b9bSJunchao Zhang 
45657ee59b9bSJunchao Zhang   Output Parameters:
45667ee59b9bSJunchao Zhang + i     - row map array of the matrix
45677ee59b9bSJunchao Zhang . j     - column index array of the matrix
45687ee59b9bSJunchao Zhang . a     - data array of the matrix
4569fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays
45707ee59b9bSJunchao Zhang 
4571fe59aa6dSJacob Faibussowitsch   Level: developer
45722ef1f0ffSBarry Smith 
45737ee59b9bSJunchao Zhang   Notes:
45742ef1f0ffSBarry Smith   Any of the output parameters can be `NULL`, in which case the corresponding value is not returned.
45757ee59b9bSJunchao Zhang   If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
45767ee59b9bSJunchao Zhang 
45777ee59b9bSJunchao Zhang   One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
45782ef1f0ffSBarry Smith   If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix.
45797ee59b9bSJunchao Zhang 
45801cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45817ee59b9bSJunchao Zhang @*/
45825d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype)
4583d71ae5a4SJacob Faibussowitsch {
45847ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
45857ee59b9bSJunchao Zhang 
45867ee59b9bSJunchao Zhang   PetscFunctionBegin;
45877ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
45887ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
45897ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
45907ee59b9bSJunchao Zhang   } else {
45917ee59b9bSJunchao Zhang     if (i) *i = aij->i;
45927ee59b9bSJunchao Zhang     if (j) *j = aij->j;
45937ee59b9bSJunchao Zhang     if (a) *a = aij->a;
45947ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
45957ee59b9bSJunchao Zhang   }
45963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45977ee59b9bSJunchao Zhang }
45987ee59b9bSJunchao Zhang 
4599cc4c1da9SBarry Smith /*@
460021e72a00SBarry Smith   MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
460121e72a00SBarry Smith 
460221e72a00SBarry Smith   Not Collective
460321e72a00SBarry Smith 
460421e72a00SBarry Smith   Input Parameter:
4605fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
460621e72a00SBarry Smith 
460721e72a00SBarry Smith   Output Parameter:
460821e72a00SBarry Smith . nz - the maximum number of nonzeros in any row
460921e72a00SBarry Smith 
461021e72a00SBarry Smith   Level: intermediate
461121e72a00SBarry Smith 
46121cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
461321e72a00SBarry Smith @*/
4614d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4615d71ae5a4SJacob Faibussowitsch {
461621e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
461721e72a00SBarry Smith 
461821e72a00SBarry Smith   PetscFunctionBegin;
461921e72a00SBarry Smith   *nz = aij->rmax;
46203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
462121e72a00SBarry Smith }
462221e72a00SBarry Smith 
4623*49abdd8aSBarry Smith static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void **data)
46242c4ab24aSJunchao Zhang {
4625*49abdd8aSBarry Smith   MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)*data;
46264d86920dSPierre Jolivet 
46272c4ab24aSJunchao Zhang   PetscFunctionBegin;
46282c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->perm));
46292c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->jmap));
46302c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo));
46312c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
46322c4ab24aSJunchao Zhang }
46332c4ab24aSJunchao Zhang 
/*
  MatSetPreallocationCOO_SeqAIJ - Builds the CSR structure (Ai, Aj, zeroed Aa) of a SeqAIJ matrix from a list of
  COO (row, column) index pairs, and records the mapping later used to sum COO values into the CSR value array.

  Input Parameters:
+ mat   - the matrix
. coo_n - number of entries in coo_i[] and coo_j[]
. coo_i - row indices; modified in place (an entry whose column is negative gets row -1, and the array may be sorted)
- coo_j - column indices; modified in place (sorted within a row when needed, and swapped by the HYPRE hack)

  Notes:
  Entries with a negative row or column index are ignored.

  Repeated (row, column) pairs are merged into a single nonzero. After the prefix sum, jmap[q]..jmap[q+1] is the
  range of perm[] that contributes to the q-th unique nonzero, and perm[] holds positions in the caller's COO ordering.

  perm[] and jmap[] are stored in a MatCOOStruct_SeqAIJ that is attached to the matrix under the key
  "__PETSc_MatCOOStruct_Host"; MatCOOStructDestroy_SeqAIJ() is registered as its destructor.
*/
4634d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4635d71ae5a4SJacob Faibussowitsch {
4636394ed5ebSJunchao Zhang   MPI_Comm             comm;
4637394ed5ebSJunchao Zhang   PetscInt            *i, *j;
46380d88f7f4SJunchao Zhang   PetscInt             M, N, row, iprev;
4639394ed5ebSJunchao Zhang   PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4640394ed5ebSJunchao Zhang   PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
4641394ed5ebSJunchao Zhang   PetscInt            *Aj;
4642394ed5ebSJunchao Zhang   PetscScalar         *Aa;
4643f4f49eeaSPierre Jolivet   Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)mat->data;
4644cbc6b225SStefano Zampini   MatType              rtype;
4645394ed5ebSJunchao Zhang   PetscCount          *perm, *jmap;
46462c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
46470d88f7f4SJunchao Zhang   PetscBool            isorted;
46489f0612e4SBarry Smith   PetscBool            hypre;
46499f0612e4SBarry Smith   const char          *name;
4650394ed5ebSJunchao Zhang 
4651394ed5ebSJunchao Zhang   PetscFunctionBegin;
46529566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
46539566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4654e8729f6fSJunchao Zhang   i = coo_i;
4655e8729f6fSJunchao Zhang   j = coo_j;
46569566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
46570d88f7f4SJunchao Zhang 
46580d88f7f4SJunchao Zhang   /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AIJ_HYPRE results in this case) */
46590d88f7f4SJunchao Zhang   isorted = PETSC_TRUE;
46600d88f7f4SJunchao Zhang   iprev   = PETSC_INT_MIN;
46610d88f7f4SJunchao Zhang   for (k = 0; k < coo_n; k++) {
4662394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
46630d88f7f4SJunchao Zhang     if (isorted) {
46640d88f7f4SJunchao Zhang       if (i[k] < iprev) isorted = PETSC_FALSE;
46650d88f7f4SJunchao Zhang       else iprev = i[k];
46660d88f7f4SJunchao Zhang     }
4667394ed5ebSJunchao Zhang     perm[k] = k;
4668394ed5ebSJunchao Zhang   }
4669394ed5ebSJunchao Zhang 
46700d88f7f4SJunchao Zhang   /* Sort by row if not already */
46710d88f7f4SJunchao Zhang   if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
4672651b1cf9SStefano Zampini 
4673651b1cf9SStefano Zampini   /* Advance k to the first row with a non-negative index */
4674651b1cf9SStefano Zampini   for (k = 0; k < coo_n; k++)
46759371c9d4SSatish Balay     if (i[k] >= 0) break;
4676394ed5ebSJunchao Zhang   nneg = k;
46779566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4678394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
467935cb6cd3SPierre Jolivet   jmap++;                                           /* Inc jmap by 1 for convenience */
4680394ed5ebSJunchao Zhang 
46819f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */
46829f0612e4SBarry Smith   PetscCall(PetscArrayzero(Ai, M + 1));
46839f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */
4684394ed5ebSJunchao Zhang 
  /* The HYPRE-specific column reordering below is enabled only when the matrix object carries this exact name */
4685651b1cf9SStefano Zampini   PetscCall(PetscObjectGetName((PetscObject)mat, &name));
4686651b1cf9SStefano Zampini   PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", name, &hypre));
4687651b1cf9SStefano Zampini 
4688394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
468935cb6cd3SPierre Jolivet   Ai++;  /* Inc by 1 for convenience */
4690394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4691394ed5ebSJunchao Zhang   while (k < coo_n) {
46920d88f7f4SJunchao Zhang     PetscBool strictly_sorted; // this row is strictly sorted?
46930d88f7f4SJunchao Zhang     PetscInt  jprev;
46940d88f7f4SJunchao Zhang 
46950d88f7f4SJunchao Zhang     /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */
4696394ed5ebSJunchao Zhang     row             = i[k];
46970d88f7f4SJunchao Zhang     start           = k;
46980d88f7f4SJunchao Zhang     jprev           = PETSC_INT_MIN;
46990d88f7f4SJunchao Zhang     strictly_sorted = PETSC_TRUE;
47000d88f7f4SJunchao Zhang     while (k < coo_n && i[k] == row) {
47010d88f7f4SJunchao Zhang       if (strictly_sorted) {
47020d88f7f4SJunchao Zhang         if (j[k] <= jprev) strictly_sorted = PETSC_FALSE;
47030d88f7f4SJunchao Zhang         else jprev = j[k];
47040d88f7f4SJunchao Zhang       }
47050d88f7f4SJunchao Zhang       k++;
47060d88f7f4SJunchao Zhang     }
4707394ed5ebSJunchao Zhang     end = k;
47080d88f7f4SJunchao Zhang 
4709651b1cf9SStefano Zampini     /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
4710651b1cf9SStefano Zampini     if (hypre) {
47111690c2aeSBarry Smith       PetscInt  minj    = PETSC_INT_MAX;
4712651b1cf9SStefano Zampini       PetscBool hasdiag = PETSC_FALSE;
47130d88f7f4SJunchao Zhang 
47140d88f7f4SJunchao Zhang       if (strictly_sorted) { // fast path to swap the first and the diag
47150d88f7f4SJunchao Zhang         PetscCount tmp;
47160d88f7f4SJunchao Zhang         for (p = start; p < end; p++) {
47170d88f7f4SJunchao Zhang           if (j[p] == row && p != start) {
47180d88f7f4SJunchao Zhang             j[p]        = j[start];
47190d88f7f4SJunchao Zhang             j[start]    = row;
47200d88f7f4SJunchao Zhang             tmp         = perm[start];
47210d88f7f4SJunchao Zhang             perm[start] = perm[p];
47220d88f7f4SJunchao Zhang             perm[p]     = tmp;
47230d88f7f4SJunchao Zhang             break;
47240d88f7f4SJunchao Zhang           }
47250d88f7f4SJunchao Zhang         }
47260d88f7f4SJunchao Zhang       } else {
4727651b1cf9SStefano Zampini         for (p = start; p < end; p++) {
4728651b1cf9SStefano Zampini           hasdiag = (PetscBool)(hasdiag || (j[p] == row));
4729651b1cf9SStefano Zampini           minj    = PetscMin(minj, j[p]);
4730651b1cf9SStefano Zampini         }
47310d88f7f4SJunchao Zhang 
4732651b1cf9SStefano Zampini         if (hasdiag) {
4733651b1cf9SStefano Zampini           for (p = start; p < end; p++) {
4734651b1cf9SStefano Zampini             if (j[p] == minj) j[p] = row;
4735651b1cf9SStefano Zampini             else if (j[p] == row) j[p] = minj;
4736651b1cf9SStefano Zampini           }
4737651b1cf9SStefano Zampini         }
4738651b1cf9SStefano Zampini       }
47390d88f7f4SJunchao Zhang     }
47400d88f7f4SJunchao Zhang     // sort by columns in a row
47410d88f7f4SJunchao Zhang     if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
4742651b1cf9SStefano Zampini 
47430d88f7f4SJunchao Zhang     if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q
47440d88f7f4SJunchao Zhang       for (p = start; p < end; p++, q++) {
47450d88f7f4SJunchao Zhang         Aj[q]   = j[p];
47460d88f7f4SJunchao Zhang         jmap[q] = 1;
47470d88f7f4SJunchao Zhang       }
47486497c311SBarry Smith       PetscCall(PetscIntCast(end - start, Ai + row));
47490d88f7f4SJunchao Zhang       nnz += Ai[row]; // q is already advanced
47500d88f7f4SJunchao Zhang     } else {
4751394ed5ebSJunchao Zhang       /* Find number of unique col entries in this row */
4752394ed5ebSJunchao Zhang       Aj[q]   = j[start]; /* Log the first nonzero in this row */
4753651b1cf9SStefano Zampini       jmap[q] = 1;        /* Number of repeats of this nonzero entry */
4754394ed5ebSJunchao Zhang       Ai[row] = 1;
4755394ed5ebSJunchao Zhang       nnz++;
4756394ed5ebSJunchao Zhang 
4757394ed5ebSJunchao Zhang       for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4758394ed5ebSJunchao Zhang         if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4759394ed5ebSJunchao Zhang           q++;
4760394ed5ebSJunchao Zhang           jmap[q] = 1;
4761394ed5ebSJunchao Zhang           Aj[q]   = j[p];
4762394ed5ebSJunchao Zhang           Ai[row]++;
4763394ed5ebSJunchao Zhang           nnz++;
4764394ed5ebSJunchao Zhang         } else {
4765394ed5ebSJunchao Zhang           jmap[q]++;
4766394ed5ebSJunchao Zhang         }
4767394ed5ebSJunchao Zhang       }
4768394ed5ebSJunchao Zhang       q++; /* Move to next row and thus next unique nonzero */
4769394ed5ebSJunchao Zhang     }
47700d88f7f4SJunchao Zhang   }
47710d88f7f4SJunchao Zhang 
  /* Turn the per-row counts in Ai[] and the per-nonzero repeat counts in jmap[] into offsets via prefix sums */
4772394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4773394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
47740d88f7f4SJunchao Zhang   jmap--; // Back to the beginning of jmap[]
4775394ed5ebSJunchao Zhang   jmap[0] = 0;
4776394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
47770d88f7f4SJunchao Zhang 
47789f0612e4SBarry Smith   if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */
4779394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4780394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4781394ed5ebSJunchao Zhang 
47829566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
47839566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
47849566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4785394ed5ebSJunchao Zhang     jmap = jmap_new;
4786394ed5ebSJunchao Zhang 
47879f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new));
47889566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
47899f0612e4SBarry Smith     PetscCall(PetscShmgetDeallocateArray((void **)&Aj));
4790394ed5ebSJunchao Zhang     Aj = Aj_new;
4791394ed5ebSJunchao Zhang   }
4792394ed5ebSJunchao Zhang 
4793394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4794394ed5ebSJunchao Zhang     PetscCount *perm_new;
4795cbc6b225SStefano Zampini 
47969566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
47979566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
47989566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4799394ed5ebSJunchao Zhang     perm = perm_new;
4800394ed5ebSJunchao Zhang   }
4801394ed5ebSJunchao Zhang 
  /* Allocate a zeroed value array of length nnz and pass Ai, Aj, Aa to the matrix */
48029566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
48039f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa));
48049f0612e4SBarry Smith   PetscCall(PetscArrayzero(Aa, nnz));
48059566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4806394ed5ebSJunchao Zhang 
4807394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
48082c4ab24aSJunchao Zhang 
48092c4ab24aSJunchao Zhang   // Put the COO struct in a container and then attach that to the matrix
48102c4ab24aSJunchao Zhang   PetscCall(PetscMalloc1(1, &coo));
48116497c311SBarry Smith   PetscCall(PetscIntCast(nnz, &coo->nz));
48122c4ab24aSJunchao Zhang   coo->n    = coo_n;
48132c4ab24aSJunchao Zhang   coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
48142c4ab24aSJunchao Zhang   coo->jmap = jmap;         // of length nnz+1
48152c4ab24aSJunchao Zhang   coo->perm = perm;
481603e76207SPierre Jolivet   PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ));
48173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4818394ed5ebSJunchao Zhang }
4819394ed5ebSJunchao Zhang 
4820d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4821d71ae5a4SJacob Faibussowitsch {
4822394ed5ebSJunchao Zhang   Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
4823394ed5ebSJunchao Zhang   PetscCount           i, j, Annz = aseq->nz;
48242c4ab24aSJunchao Zhang   PetscCount          *perm, *jmap;
4825394ed5ebSJunchao Zhang   PetscScalar         *Aa;
48262c4ab24aSJunchao Zhang   PetscContainer       container;
48272c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4828394ed5ebSJunchao Zhang 
4829394ed5ebSJunchao Zhang   PetscFunctionBegin;
48302c4ab24aSJunchao Zhang   PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
48312c4ab24aSJunchao Zhang   PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
48322c4ab24aSJunchao Zhang   PetscCall(PetscContainerGetPointer(container, (void **)&coo));
48332c4ab24aSJunchao Zhang   perm = coo->perm;
48342c4ab24aSJunchao Zhang   jmap = coo->jmap;
48359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4836394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4837b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4838b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4839b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4840394ed5ebSJunchao Zhang   }
48419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
48423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4843394ed5ebSJunchao Zhang }
4844394ed5ebSJunchao Zhang 
/*
  Prototypes for the optional converters to the CUSPARSE, HIPSPARSE and Kokkos SeqAIJ variants that
  MatCreate_SeqAIJ() registers below; each is declared only when the matching PETSC_HAVE_* macro is defined.
*/
484534b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
48465063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *);
484702fe1965SBarry Smith #endif
4848d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4849d5e393b6SSuyash Tandon PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *);
4850d5e393b6SSuyash Tandon #endif
48513d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
48525063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *);
48533d0639e7SStefano Zampini #endif
485402fe1965SBarry Smith 
4855d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4856d71ae5a4SJacob Faibussowitsch {
4857273d9f13SBarry Smith   Mat_SeqAIJ *b;
485838baddfdSBarry Smith   PetscMPIInt size;
4859273d9f13SBarry Smith 
4860273d9f13SBarry Smith   PetscFunctionBegin;
48619566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
486208401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4863273d9f13SBarry Smith 
48644dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
48652205254eSKarl Rupp 
4866b0a32e0cSBarry Smith   B->data   = (void *)b;
4867aea10558SJacob Faibussowitsch   B->ops[0] = MatOps_Values;
4868071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
48692205254eSKarl Rupp 
4870f4259b30SLisandro Dalcin   b->row                = NULL;
4871f4259b30SLisandro Dalcin   b->col                = NULL;
4872f4259b30SLisandro Dalcin   b->icol               = NULL;
4873b810aeb4SBarry Smith   b->reallocs           = 0;
487436db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4875f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4876416022c9SBarry Smith   b->nonew              = 0;
4877f4259b30SLisandro Dalcin   b->diag               = NULL;
4878f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4879f4259b30SLisandro Dalcin   B->spptr              = NULL;
4880f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4881f4259b30SLisandro Dalcin   b->idiag              = NULL;
4882f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4883f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
488471f1c65dSBarry Smith   b->omega              = 1.0;
488571f1c65dSBarry Smith   b->fshift             = 0.0;
488671f1c65dSBarry Smith   b->idiagvalid         = PETSC_FALSE;
4887bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4888a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
488917ab2063SBarry Smith 
48909566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4891d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
48929566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
48939566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4894b3866ffcSBarry Smith #endif
48959566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
48969566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
48979566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
48989566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
48999566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
49009566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
49019566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
49029779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
49039566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4904191b95cbSRichard Tran Mills #endif
490534b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
49069566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
49079566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49089566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
490902fe1965SBarry Smith #endif
4910d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4911d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
4912d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
4913d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
4914d5e393b6SSuyash Tandon #endif
49153d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
49169566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
49173d0639e7SStefano Zampini #endif
49189566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4919af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
49209566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4921af8000cdSHong Zhang #endif
4922d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
49239566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4924d24d4204SJose E. Roman #endif
492563c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
49269566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
49279566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
492863c07aadSStefano Zampini #endif
49299566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
49309566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
49319566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
49329566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
493314e4dea2SJose E. Roman   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ));
49349566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
49359566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
49369566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
49379566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
49389566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
49399566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
49409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
49429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
49439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
49449566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
49459566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
49469566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
49473ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
494817ab2063SBarry Smith }
494917ab2063SBarry Smith 
4950b24902e0SBarry Smith /*
49513893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4952b24902e0SBarry Smith */
4953d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4954d71ae5a4SJacob Faibussowitsch {
49552a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4956071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
495717ab2063SBarry Smith 
49583a40ed3dSBarry Smith   PetscFunctionBegin;
4959aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4960273d9f13SBarry Smith 
4961d5f3da31SBarry Smith   C->factortype    = A->factortype;
4962f4259b30SLisandro Dalcin   c->row           = NULL;
4963f4259b30SLisandro Dalcin   c->col           = NULL;
4964f4259b30SLisandro Dalcin   c->icol          = NULL;
49656ad4291fSHong Zhang   c->reallocs      = 0;
4966bc43efbbSJunchao Zhang   c->diagonaldense = a->diagonaldense;
496717ab2063SBarry Smith 
496869272f91SPierre Jolivet   C->assembled = A->assembled;
496917ab2063SBarry Smith 
497069272f91SPierre Jolivet   if (A->preallocated) {
49719566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
49729566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4973eec197d1SBarry Smith 
497431fe6a7dSBarry Smith     if (!A->hash_active) {
49759566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->imax));
49769566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
49779566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->ilen));
49789566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));
497917ab2063SBarry Smith 
498017ab2063SBarry Smith       /* allocate the matrix space */
4981f77e22a1SHong Zhang       if (mallocmatspace) {
49829f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a));
49839f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j));
49849f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i));
49859566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->i, a->i, m + 1));
49869f0612e4SBarry Smith         c->free_a  = PETSC_TRUE;
49879f0612e4SBarry Smith         c->free_ij = PETSC_TRUE;
498817ab2063SBarry Smith         if (m > 0) {
49899566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
4990be6bf707SBarry Smith           if (cpvalues == MAT_COPY_VALUES) {
49912e5835c6SStefano Zampini             const PetscScalar *aa;
49922e5835c6SStefano Zampini 
49939566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
49949566063dSJacob Faibussowitsch             PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
49959566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
4996be6bf707SBarry Smith           } else {
49979566063dSJacob Faibussowitsch             PetscCall(PetscArrayzero(c->a, a->i[m]));
499817ab2063SBarry Smith           }
499908480c60SBarry Smith         }
5000f77e22a1SHong Zhang       }
500131fe6a7dSBarry Smith       C->preallocated = PETSC_TRUE;
500231fe6a7dSBarry Smith     } else {
500331fe6a7dSBarry Smith       PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix");
500431fe6a7dSBarry Smith       PetscCall(MatSetUp(C));
500531fe6a7dSBarry Smith     }
500617ab2063SBarry Smith 
50076ad4291fSHong Zhang     c->ignorezeroentries = a->ignorezeroentries;
5008416022c9SBarry Smith     c->roworiented       = a->roworiented;
5009416022c9SBarry Smith     c->nonew             = a->nonew;
5010416022c9SBarry Smith     if (a->diag) {
50119566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &c->diag));
50129566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt)));
5013071fcb05SBarry Smith     } else c->diag = NULL;
50142205254eSKarl Rupp 
5015f4259b30SLisandro Dalcin     c->solve_work         = NULL;
5016f4259b30SLisandro Dalcin     c->saved_values       = NULL;
5017f4259b30SLisandro Dalcin     c->idiag              = NULL;
5018f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
5019a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
50206ad4291fSHong Zhang 
5021893ad86cSHong Zhang     c->rmax  = a->rmax;
5022416022c9SBarry Smith     c->nz    = a->nz;
50238ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
5024754ec7b1SSatish Balay 
50256ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
50266ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
5027cd6b891eSBarry Smith     if (a->compressedrow.use) {
50286ad4291fSHong Zhang       i = a->compressedrow.nrows;
50299566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
50309566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
50319566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
503227ea64f8SHong Zhang     } else {
503327ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
50340298fd71SBarry Smith       c->compressedrow.i      = NULL;
50350298fd71SBarry Smith       c->compressedrow.rindex = NULL;
50366ad4291fSHong Zhang     }
5037ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
5038e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
50394846f1f5SKris Buschelman 
50409566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
504169272f91SPierre Jolivet   }
50429566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
50433ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
504417ab2063SBarry Smith }
504517ab2063SBarry Smith 
5046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
5047d71ae5a4SJacob Faibussowitsch {
5048b24902e0SBarry Smith   PetscFunctionBegin;
50499566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
50509566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
505148a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
50529566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
50539566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
50543ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5055b24902e0SBarry Smith }
5056b24902e0SBarry Smith 
5057d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
5058d71ae5a4SJacob Faibussowitsch {
505952f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
506052f91c60SVaclav Hapla 
506152f91c60SVaclav Hapla   PetscFunctionBegin;
506252f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
506352f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
5064c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
50659566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
50669566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
50679566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
506852f91c60SVaclav Hapla   if (isbinary) {
50699566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
507052f91c60SVaclav Hapla   } else if (ishdf5) {
507152f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
50729566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
507352f91c60SVaclav Hapla #else
507452f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
507552f91c60SVaclav Hapla #endif
507652f91c60SVaclav Hapla   } else {
507798921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
507852f91c60SVaclav Hapla   }
50793ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
508052f91c60SVaclav Hapla }
508152f91c60SVaclav Hapla 
5082d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
5083d71ae5a4SJacob Faibussowitsch {
50843ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
50853ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
5086fbdbba38SShri Abhyankar 
5087fbdbba38SShri Abhyankar   PetscFunctionBegin;
50889566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
5089bbead8a2SBarry Smith 
50903ea6fe3dSLisandro Dalcin   /* read in matrix header */
50919566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
509208401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
50939371c9d4SSatish Balay   M  = header[1];
50949371c9d4SSatish Balay   N  = header[2];
50959371c9d4SSatish Balay   nz = header[3];
509608401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
509708401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
509808401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
5099fbdbba38SShri Abhyankar 
51003ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
51019566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
51023ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
51033ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
51043ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
51053ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
51063ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
51079566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
51089566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
51093ea6fe3dSLisandro Dalcin 
51103ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
51119566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5112aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51133ea6fe3dSLisandro Dalcin 
5114fbdbba38SShri Abhyankar   /* read in row lengths */
51159566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
51169566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
51173ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
51189371c9d4SSatish Balay   sum = 0;
51199371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
512008401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
51213ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
51229566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
51239566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5124aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51253ea6fe3dSLisandro Dalcin   /* store row lengths */
51269566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
51279566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
5128fbdbba38SShri Abhyankar 
51293ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
51309371c9d4SSatish Balay   a->i[0] = 0;
51319371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
51323ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
51339566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
51343ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
51359566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
5136fbdbba38SShri Abhyankar 
51379566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
51389566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
51393ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5140fbdbba38SShri Abhyankar }
5141fbdbba38SShri Abhyankar 
5142d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
5143d71ae5a4SJacob Faibussowitsch {
51447264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
5145fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
5146eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5147eeffb40dSHong Zhang   PetscInt k;
5148eeffb40dSHong Zhang #endif
51497264ac53SSatish Balay 
51503a40ed3dSBarry Smith   PetscFunctionBegin;
5151bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
5152d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
5153ca44d042SBarry Smith     *flg = PETSC_FALSE;
51543ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
5155bcd2baecSBarry Smith   }
51567264ac53SSatish Balay 
51577264ac53SSatish Balay   /* if the a->i are the same */
51589566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
51593ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
51607264ac53SSatish Balay 
51617264ac53SSatish Balay   /* if a->j are the same */
51629566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
51633ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
5164bcd2baecSBarry Smith 
51659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
51669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5167bcd2baecSBarry Smith   /* if a->a are the same */
5168eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5169eeffb40dSHong Zhang   for (k = 0; k < a->nz; k++) {
5170fff043a9SJunchao Zhang     if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) {
5171eeffb40dSHong Zhang       *flg = PETSC_FALSE;
51723ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
5173eeffb40dSHong Zhang     }
5174eeffb40dSHong Zhang   }
5175eeffb40dSHong Zhang #else
51769566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
5177eeffb40dSHong Zhang #endif
51789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
51799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
51803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51817264ac53SSatish Balay }
518236db0b34SBarry Smith 
518305869f15SSatish Balay /*@
518411a5261eSBarry Smith   MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
518536db0b34SBarry Smith   provided by the user.
518636db0b34SBarry Smith 
5187d083f849SBarry Smith   Collective
518836db0b34SBarry Smith 
518936db0b34SBarry Smith   Input Parameters:
519036db0b34SBarry Smith + comm - must be an MPI communicator of size 1
519136db0b34SBarry Smith . m    - number of rows
519236db0b34SBarry Smith . n    - number of columns
5193483a2f95SBarry Smith . i    - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
519436db0b34SBarry Smith . j    - column indices
519536db0b34SBarry Smith - a    - matrix values
519636db0b34SBarry Smith 
519736db0b34SBarry Smith   Output Parameter:
519836db0b34SBarry Smith . mat - the matrix
519936db0b34SBarry Smith 
520036db0b34SBarry Smith   Level: intermediate
520136db0b34SBarry Smith 
520236db0b34SBarry Smith   Notes:
52032ef1f0ffSBarry Smith   The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
5204292fb18eSBarry Smith   once the matrix is destroyed and not before
520536db0b34SBarry Smith 
520636db0b34SBarry Smith   You cannot set new nonzero locations into this matrix, that will generate an error.
520736db0b34SBarry Smith 
52082ef1f0ffSBarry Smith   The `i` and `j` indices are 0 based
520936db0b34SBarry Smith 
5210a4552177SSatish Balay   The format which is used for the sparse matrix input, is equivalent to a
5211a4552177SSatish Balay   row-major ordering.. i.e for the following matrix, the input data expected is
52128eef79e4SBarry Smith   as shown
52132ef1f0ffSBarry Smith .vb
52142ef1f0ffSBarry Smith         1 0 0
52152ef1f0ffSBarry Smith         2 0 3
52162ef1f0ffSBarry Smith         4 5 6
5217a4552177SSatish Balay 
52182ef1f0ffSBarry Smith         i =  {0,1,3,6}  [size = nrow+1  = 3+1]
52192ef1f0ffSBarry Smith         j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
52202ef1f0ffSBarry Smith         v =  {1,2,3,4,5,6}  [size = 6]
52212ef1f0ffSBarry Smith .ve
5222a4552177SSatish Balay 
52231cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
522436db0b34SBarry Smith @*/
5225d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5226d71ae5a4SJacob Faibussowitsch {
5227cbcfb4deSHong Zhang   PetscInt    ii;
522836db0b34SBarry Smith   Mat_SeqAIJ *aij;
5229cbcfb4deSHong Zhang   PetscInt    jj;
523036db0b34SBarry Smith 
523136db0b34SBarry Smith   PetscFunctionBegin;
5232aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
52339566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52349566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52359566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
52369566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5238ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
52399566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
52409566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5241ab93d7beSBarry Smith 
524236db0b34SBarry Smith   aij->i       = i;
524336db0b34SBarry Smith   aij->j       = j;
524436db0b34SBarry Smith   aij->a       = a;
524536db0b34SBarry Smith   aij->nonew   = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5246e6b907acSBarry Smith   aij->free_a  = PETSC_FALSE;
5247e6b907acSBarry Smith   aij->free_ij = PETSC_FALSE;
524836db0b34SBarry Smith 
5249cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
525036db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
525176bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5252aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
52539985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
525408401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
525508401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
52569985e31cSBarry Smith       }
525736db0b34SBarry Smith     }
525876bd3646SJed Brown   }
525976bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
526036db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
526108401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5262da0802e2SStefano Zampini       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1);
526336db0b34SBarry Smith     }
526476bd3646SJed Brown   }
526536db0b34SBarry Smith 
52669566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52679566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
526936db0b34SBarry Smith }
5270cbc6b225SStefano Zampini 
5271f62e3866SBarry Smith /*@
527211a5261eSBarry Smith   MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
52738a0b0e6bSVictor Minden   provided by the user.
52748a0b0e6bSVictor Minden 
5275d083f849SBarry Smith   Collective
52768a0b0e6bSVictor Minden 
52778a0b0e6bSVictor Minden   Input Parameters:
52788a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1
52798a0b0e6bSVictor Minden . m    - number of rows
52808a0b0e6bSVictor Minden . n    - number of columns
52818a0b0e6bSVictor Minden . i    - row indices
52828a0b0e6bSVictor Minden . j    - column indices
52831230e6d1SVictor Minden . a    - matrix values
52841230e6d1SVictor Minden . nz   - number of nonzeros
52852ef1f0ffSBarry Smith - idx  - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
52868a0b0e6bSVictor Minden 
52878a0b0e6bSVictor Minden   Output Parameter:
52888a0b0e6bSVictor Minden . mat - the matrix
52898a0b0e6bSVictor Minden 
52908a0b0e6bSVictor Minden   Level: intermediate
52918a0b0e6bSVictor Minden 
5292f62e3866SBarry Smith   Example:
5293f62e3866SBarry Smith   For the following matrix, the input data expected is as shown (using 0 based indexing)
52949e99939fSJunchao Zhang .vb
52958a0b0e6bSVictor Minden         1 0 0
52968a0b0e6bSVictor Minden         2 0 3
52978a0b0e6bSVictor Minden         4 5 6
52988a0b0e6bSVictor Minden 
52998a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
53008a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
53018a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
53029e99939fSJunchao Zhang .ve
5303fe59aa6dSJacob Faibussowitsch 
53042ef1f0ffSBarry Smith   Note:
5305d7547e51SJunchao Zhang   Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5306d7547e51SJunchao Zhang   and are particularly useful in iterative applications.
53078a0b0e6bSVictor Minden 
53081cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
53098a0b0e6bSVictor Minden @*/
5310d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx)
5311d71ae5a4SJacob Faibussowitsch {
5312d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
53138a0b0e6bSVictor Minden 
53148a0b0e6bSVictor Minden   PetscFunctionBegin;
53159566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5316ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
53179566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
53189566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
53199566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
53209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
53211230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
53221230e6d1SVictor Minden     if (idx) {
53231230e6d1SVictor Minden       row = i[ii] - 1;
53241230e6d1SVictor Minden       col = j[ii] - 1;
53251230e6d1SVictor Minden     } else {
53261230e6d1SVictor Minden       row = i[ii];
53271230e6d1SVictor Minden       col = j[ii];
53288a0b0e6bSVictor Minden     }
53299566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
53308a0b0e6bSVictor Minden   }
53319566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
53329566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
53339566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
53343ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53358a0b0e6bSVictor Minden }
533636db0b34SBarry Smith 
5337d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A)
5338d71ae5a4SJacob Faibussowitsch {
5339acf2f550SJed Brown   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
5340acf2f550SJed Brown 
5341acf2f550SJed Brown   PetscFunctionBegin;
5342acf2f550SJed Brown   a->idiagvalid  = PETSC_FALSE;
5343acf2f550SJed Brown   a->ibdiagvalid = PETSC_FALSE;
53442205254eSKarl Rupp 
53459566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A));
53463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5347acf2f550SJed Brown }
5348acf2f550SJed Brown 
/*
  MatCreateMPIMatConcatenateSeqMat_SeqAIJ - SeqAIJ entry point that forwards all of its arguments, unchanged,
  to MatCreateMPIMatConcatenateSeqMat_MPIAIJ().
*/
5349d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
5350d71ae5a4SJacob Faibussowitsch {
53519c8f2541SHong Zhang   PetscFunctionBegin;
53529566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
53533ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53549c8f2541SHong Zhang }
53559c8f2541SHong Zhang 
535681824310SBarry Smith /*
535753dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
535853dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
535953dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
536053dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
536153dd7562SDmitry Karpeev  */
5362d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5363d71ae5a4SJacob Faibussowitsch {
536453dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
536553dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
536653dd7562SDmitry Karpeev   PetscBool       seqaij;
536753dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
536853dd7562SDmitry Karpeev   PetscScalar     v;
536953dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
537053dd7562SDmitry Karpeev 
537153dd7562SDmitry Karpeev   PetscFunctionBegin;
53723ba16761SJacob Faibussowitsch   if (!B) PetscFunctionReturn(PETSC_SUCCESS);
537353dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
53749566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
537528b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
537653dd7562SDmitry Karpeev   if (rowemb) {
53779566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
537808401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
537953dd7562SDmitry Karpeev   } else {
538008401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
538153dd7562SDmitry Karpeev   }
538253dd7562SDmitry Karpeev   if (colemb) {
53839566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
538408401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
538553dd7562SDmitry Karpeev   } else {
538608401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
538753dd7562SDmitry Karpeev   }
538853dd7562SDmitry Karpeev 
5389f4f49eeaSPierre Jolivet   Baij = (Mat_SeqAIJ *)B->data;
539053dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
53919566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5392ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
53939566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
53949566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
539553dd7562SDmitry Karpeev   }
539648a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
539753dd7562SDmitry Karpeev   count      = 0;
539853dd7562SDmitry Karpeev   rowindices = NULL;
539953dd7562SDmitry Karpeev   colindices = NULL;
540048a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
540148a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
540253dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
540353dd7562SDmitry Karpeev     PetscInt row;
540453dd7562SDmitry Karpeev     row = i;
540553dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
540653dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
540753dd7562SDmitry Karpeev       PetscInt col;
540853dd7562SDmitry Karpeev       col = Baij->j[count];
540953dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
541053dd7562SDmitry Karpeev       v = Baij->a[count];
54119566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
541253dd7562SDmitry Karpeev       ++count;
541353dd7562SDmitry Karpeev     }
541453dd7562SDmitry Karpeev   }
541553dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
541653dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
541753dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
541853dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
541953dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
54203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
542153dd7562SDmitry Karpeev }
542253dd7562SDmitry Karpeev 
542358c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep)
5424dec0b466SHong Zhang {
5425dec0b466SHong Zhang   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
5426dec0b466SHong Zhang   MatScalar  *aa = a->a;
5427dec0b466SHong Zhang   PetscInt    m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k;
5428dec0b466SHong Zhang   PetscInt   *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0;
5429dec0b466SHong Zhang 
5430dec0b466SHong Zhang   PetscFunctionBegin;
5431dec0b466SHong Zhang   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix");
5432dec0b466SHong Zhang   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
5433dec0b466SHong Zhang   for (i = 1; i <= m; i++) {
5434dec0b466SHong Zhang     /* move each nonzero entry back by the amount of zero slots (fshift) before it*/
5435dec0b466SHong Zhang     for (k = ai[i - 1]; k < ai[i]; k++) {
543658c11ad4SPierre Jolivet       if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++;
5437dec0b466SHong Zhang       else {
5438dec0b466SHong Zhang         if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1));
5439dec0b466SHong Zhang         aa[k - fshift] = aa[k];
5440dec0b466SHong Zhang         aj[k - fshift] = aj[k];
5441dec0b466SHong Zhang       }
5442dec0b466SHong Zhang     }
5443dec0b466SHong Zhang     ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration
5444dec0b466SHong Zhang     fshift_prev = fshift;
5445dec0b466SHong Zhang     /* reset ilen and imax for each row */
5446dec0b466SHong Zhang     ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1];
5447dec0b466SHong Zhang     a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0);
5448dec0b466SHong Zhang     rmax = PetscMax(rmax, ailen[i - 1]);
5449dec0b466SHong Zhang   }
5450312eded4SPierre Jolivet   if (fshift) {
5451dec0b466SHong Zhang     if (m) {
5452dec0b466SHong Zhang       ai[m] -= fshift;
5453dec0b466SHong Zhang       a->nz = ai[m];
5454dec0b466SHong Zhang     }
5455dec0b466SHong Zhang     PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz));
5456312eded4SPierre Jolivet     A->nonzerostate++;
5457dec0b466SHong Zhang     A->info.nz_unneeded += (PetscReal)fshift;
5458dec0b466SHong Zhang     a->rmax = rmax;
5459dec0b466SHong Zhang     if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A));
5460dec0b466SHong Zhang     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
5461dec0b466SHong Zhang     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
5462312eded4SPierre Jolivet   }
54633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5464dec0b466SHong Zhang }
5465dec0b466SHong Zhang 
54664099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
54674099cc6bSBarry Smith 
5468cc4c1da9SBarry Smith /*@
546911a5261eSBarry Smith   MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
54704099cc6bSBarry Smith 
5471c3339decSBarry Smith   Collective
54724099cc6bSBarry Smith 
54734099cc6bSBarry Smith   Input Parameters:
54744099cc6bSBarry Smith + mat    - the matrix object
54754099cc6bSBarry Smith - matype - matrix type
54764099cc6bSBarry Smith 
54774099cc6bSBarry Smith   Options Database Key:
54784e187271SRichard Tran Mills . -mat_seqaij_type  <method> - for example seqaijcrl
54794099cc6bSBarry Smith 
54804099cc6bSBarry Smith   Level: intermediate
54814099cc6bSBarry Smith 
5482fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`
54834099cc6bSBarry Smith @*/
5484d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5485d71ae5a4SJacob Faibussowitsch {
54864099cc6bSBarry Smith   PetscBool sametype;
54875f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
54884099cc6bSBarry Smith 
54894099cc6bSBarry Smith   PetscFunctionBegin;
54904099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
54919566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
54923ba16761SJacob Faibussowitsch   if (sametype) PetscFunctionReturn(PETSC_SUCCESS);
54934099cc6bSBarry Smith 
54949566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
54956adde796SStefano Zampini   PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
54969566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
54973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
54984099cc6bSBarry Smith }
54994099cc6bSBarry Smith 
55004099cc6bSBarry Smith /*@C
550111a5261eSBarry Smith   MatSeqAIJRegister -  - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices
55024099cc6bSBarry Smith 
5503cc4c1da9SBarry Smith   Not Collective, No Fortran Support
55044099cc6bSBarry Smith 
55054099cc6bSBarry Smith   Input Parameters:
5506fe59aa6dSJacob Faibussowitsch + sname    - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
55074099cc6bSBarry Smith - function - routine to convert to subtype
55084099cc6bSBarry Smith 
55092ef1f0ffSBarry Smith   Level: advanced
55102ef1f0ffSBarry Smith 
55114099cc6bSBarry Smith   Notes:
551211a5261eSBarry Smith   `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers.
55134099cc6bSBarry Smith 
55144099cc6bSBarry Smith   Then, your matrix can be chosen with the procedural interface at runtime via the option
55154099cc6bSBarry Smith $     -mat_seqaij_type my_mat
55164099cc6bSBarry Smith 
55171cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()`
55184099cc6bSBarry Smith @*/
5519d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
5520d71ae5a4SJacob Faibussowitsch {
55214099cc6bSBarry Smith   PetscFunctionBegin;
55229566063dSJacob Faibussowitsch   PetscCall(MatInitializePackage());
55239566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
55243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55254099cc6bSBarry Smith }
55264099cc6bSBarry Smith 
55274099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
55284099cc6bSBarry Smith 
55294099cc6bSBarry Smith /*@C
553011a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
55314099cc6bSBarry Smith 
55324099cc6bSBarry Smith   Not Collective
55334099cc6bSBarry Smith 
55344099cc6bSBarry Smith   Level: advanced
55354099cc6bSBarry Smith 
55362ef1f0ffSBarry Smith   Note:
55372ef1f0ffSBarry Smith   This registers the versions of `MATSEQAIJ` for GPUs
55382ef1f0ffSBarry Smith 
55391cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()`
55404099cc6bSBarry Smith @*/
5541d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5542d71ae5a4SJacob Faibussowitsch {
55434099cc6bSBarry Smith   PetscFunctionBegin;
55443ba16761SJacob Faibussowitsch   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS);
55454099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
55464099cc6bSBarry Smith 
55479566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
55489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
55499566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
55509779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
55519566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5552485f9817SRichard Tran Mills #endif
55535063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
55549566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
55555063d097SStefano Zampini #endif
5556d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
5557d5e393b6SSuyash Tandon   PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
5558d5e393b6SSuyash Tandon #endif
55595063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
55609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
55615063d097SStefano Zampini #endif
55624099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
55639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
55644099cc6bSBarry Smith #endif
55653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55664099cc6bSBarry Smith }
556753dd7562SDmitry Karpeev 
556853dd7562SDmitry Karpeev /*
556981824310SBarry Smith     Special version for direct calls from Fortran
557081824310SBarry Smith */
557181824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS)
557281824310SBarry Smith   #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
557381824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
557481824310SBarry Smith   #define matsetvaluesseqaij_ matsetvaluesseqaij
557581824310SBarry Smith #endif
557681824310SBarry Smith 
557781824310SBarry Smith /* Change these macros so can be used in void function */
557898921bdaSJacob Faibussowitsch 
557998921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */
55809566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */
55819566063dSJacob Faibussowitsch #undef PetscCall
55829371c9d4SSatish Balay #define PetscCall(...) \
55839371c9d4SSatish Balay   do { \
55845f80ce2aSJacob Faibussowitsch     PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \
558598921bdaSJacob Faibussowitsch     if (PetscUnlikely(ierr_msv_mpiaij)) { \
558698921bdaSJacob Faibussowitsch       *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \
558798921bdaSJacob Faibussowitsch       return; \
558898921bdaSJacob Faibussowitsch     } \
558998921bdaSJacob Faibussowitsch   } while (0)
559098921bdaSJacob Faibussowitsch 
559198921bdaSJacob Faibussowitsch #undef SETERRQ
55929371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \
55939371c9d4SSatish Balay   do { \
559498921bdaSJacob Faibussowitsch     *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
559598921bdaSJacob Faibussowitsch     return; \
559698921bdaSJacob Faibussowitsch   } while (0)
559781824310SBarry Smith 
5598d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5599d71ae5a4SJacob Faibussowitsch {
560081824310SBarry Smith   Mat         A = *AA;
560181824310SBarry Smith   PetscInt    m = *mm, n = *nn;
560281824310SBarry Smith   InsertMode  is = *isis;
560381824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
560481824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
560581824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
560681824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
560754f21887SBarry Smith   MatScalar  *ap, value, *aa;
5608ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5609ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
561081824310SBarry Smith 
561181824310SBarry Smith   PetscFunctionBegin;
56124994cf47SJed Brown   MatCheckPreallocated(A, 1);
561381824310SBarry Smith   imax  = a->imax;
561481824310SBarry Smith   ai    = a->i;
561581824310SBarry Smith   ailen = a->ilen;
561681824310SBarry Smith   aj    = a->j;
561781824310SBarry Smith   aa    = a->a;
561881824310SBarry Smith 
561981824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
562081824310SBarry Smith     row = im[k];
562181824310SBarry Smith     if (row < 0) continue;
56225f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
56239371c9d4SSatish Balay     rp   = aj + ai[row];
56249371c9d4SSatish Balay     ap   = aa + ai[row];
56259371c9d4SSatish Balay     rmax = imax[row];
56269371c9d4SSatish Balay     nrow = ailen[row];
562781824310SBarry Smith     low  = 0;
562881824310SBarry Smith     high = nrow;
562981824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
563081824310SBarry Smith       if (in[l] < 0) continue;
56315f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
563281824310SBarry Smith       col = in[l];
56332205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
56342205254eSKarl Rupp       else value = v[k + l * m];
56352205254eSKarl Rupp 
563681824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
563781824310SBarry Smith 
56382205254eSKarl Rupp       if (col <= lastcol) low = 0;
56392205254eSKarl Rupp       else high = nrow;
564081824310SBarry Smith       lastcol = col;
564181824310SBarry Smith       while (high - low > 5) {
564281824310SBarry Smith         t = (low + high) / 2;
564381824310SBarry Smith         if (rp[t] > col) high = t;
564481824310SBarry Smith         else low = t;
564581824310SBarry Smith       }
564681824310SBarry Smith       for (i = low; i < high; i++) {
564781824310SBarry Smith         if (rp[i] > col) break;
564881824310SBarry Smith         if (rp[i] == col) {
564981824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
565081824310SBarry Smith           else ap[i] = value;
565181824310SBarry Smith           goto noinsert;
565281824310SBarry Smith         }
565381824310SBarry Smith       }
565481824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
565581824310SBarry Smith       if (nonew == 1) goto noinsert;
56565f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5657fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
56589371c9d4SSatish Balay       N = nrow++ - 1;
56599371c9d4SSatish Balay       a->nz++;
56609371c9d4SSatish Balay       high++;
566181824310SBarry Smith       /* shift up all the later entries in this row */
566281824310SBarry Smith       for (ii = N; ii >= i; ii--) {
566381824310SBarry Smith         rp[ii + 1] = rp[ii];
566481824310SBarry Smith         ap[ii + 1] = ap[ii];
566581824310SBarry Smith       }
566681824310SBarry Smith       rp[i] = col;
566781824310SBarry Smith       ap[i] = value;
566881824310SBarry Smith     noinsert:;
566981824310SBarry Smith       low = i + 1;
567081824310SBarry Smith     }
567181824310SBarry Smith     ailen[row] = nrow;
567281824310SBarry Smith   }
567381824310SBarry Smith   PetscFunctionReturnVoid();
567481824310SBarry Smith }
567598921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No
567698921bdaSJacob Faibussowitsch  * other PETSc functions should be defined past this point, as it is impossible to recover the
567798921bdaSJacob Faibussowitsch  * original definitions */
56789566063dSJacob Faibussowitsch #undef PetscCall
567998921bdaSJacob Faibussowitsch #undef SETERRQ
5680