xref: /petsc/src/mat/impls/aij/seq/aij.c (revision 07425a8d4172ec73b7b53c5ce4d6ba1b92fe45cf)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
1126cec326SBarry Smith /* defines MatSetValues_Seq_Hash(), MatAssemblyEnd_Seq_Hash(), MatSetUp_Seq_Hash() */
1226cec326SBarry Smith #define TYPE AIJ
1326cec326SBarry Smith #define TYPE_BS
1426cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmatsetvalues.h"
1526cec326SBarry Smith #include "../src/mat/impls/aij/seq/seqhashmat.h"
1626cec326SBarry Smith #undef TYPE
1726cec326SBarry Smith #undef TYPE_BS
1826cec326SBarry Smith 
19ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
20d71ae5a4SJacob Faibussowitsch {
214099cc6bSBarry Smith   PetscBool flg;
224099cc6bSBarry Smith   char      type[256];
234099cc6bSBarry Smith 
244099cc6bSBarry Smith   PetscFunctionBegin;
25d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
269566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
279566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
28d0609cedSBarry Smith   PetscOptionsEnd();
293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
304099cc6bSBarry Smith }
314099cc6bSBarry Smith 
32ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
33d71ae5a4SJacob Faibussowitsch {
340716a85fSBarry Smith   PetscInt    i, m, n;
350716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
360716a85fSBarry Smith 
370716a85fSBarry Smith   PetscFunctionBegin;
389566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
399566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
400716a85fSBarry Smith   if (type == NORM_2) {
41ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
420716a85fSBarry Smith   } else if (type == NORM_1) {
43ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
440716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
45ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
46857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
47ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
48857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
49ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
506adde796SStefano Zampini   } else SETERRQ(PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONG, "Unknown reduction type");
510716a85fSBarry Smith 
520716a85fSBarry Smith   if (type == NORM_2) {
53a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
54857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
55a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
560716a85fSBarry Smith   }
573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
580716a85fSBarry Smith }
590716a85fSBarry Smith 
60ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
61d71ae5a4SJacob Faibussowitsch {
623a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
633a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
643a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
653a062f41SBarry Smith   PetscInt       *rows;
663a062f41SBarry Smith 
673a062f41SBarry Smith   PetscFunctionBegin;
683a062f41SBarry Smith   for (i = 0; i < m; i++) {
69ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
703a062f41SBarry Smith   }
719566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
723a062f41SBarry Smith   cnt = 0;
733a062f41SBarry Smith   for (i = 0; i < m; i++) {
743a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
753a062f41SBarry Smith       rows[cnt] = i;
763a062f41SBarry Smith       cnt++;
773a062f41SBarry Smith     }
783a062f41SBarry Smith   }
799566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
813a062f41SBarry Smith }
823a062f41SBarry Smith 
83d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
84d71ae5a4SJacob Faibussowitsch {
856ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
86fff043a9SJunchao Zhang   const MatScalar *aa;
876ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
88b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
896ce1633cSBarry Smith   PetscInt        *rows;
906ce1633cSBarry Smith 
916ce1633cSBarry Smith   PetscFunctionBegin;
929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
939566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
946ce1633cSBarry Smith   diag = a->diag;
956ce1633cSBarry Smith   for (i = 0; i < m; i++) {
96ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
976ce1633cSBarry Smith   }
989566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
996ce1633cSBarry Smith   cnt = 0;
1006ce1633cSBarry Smith   for (i = 0; i < m; i++) {
101ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
1026ce1633cSBarry Smith   }
103f1f41ecbSJed Brown   *nrows = cnt;
104f1f41ecbSJed Brown   *zrows = rows;
1059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1063ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
107f1f41ecbSJed Brown }
108f1f41ecbSJed Brown 
109ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
110d71ae5a4SJacob Faibussowitsch {
111f1f41ecbSJed Brown   PetscInt nrows, *rows;
112f1f41ecbSJed Brown 
113f1f41ecbSJed Brown   PetscFunctionBegin;
1140298fd71SBarry Smith   *zrows = NULL;
1159566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1169566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1186ce1633cSBarry Smith }
1196ce1633cSBarry Smith 
120ba38deedSJacob Faibussowitsch static PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
121d71ae5a4SJacob Faibussowitsch {
122b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
123b3a44c85SBarry Smith   const MatScalar *aa;
124b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
125b3a44c85SBarry Smith   const PetscInt  *ii;
126b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
127b3a44c85SBarry Smith 
128b3a44c85SBarry Smith   PetscFunctionBegin;
1299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
130f4259b30SLisandro Dalcin   *keptrows = NULL;
131b3a44c85SBarry Smith   ii        = a->i;
132b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
133b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
134b3a44c85SBarry Smith     if (!n) {
135b3a44c85SBarry Smith       cnt++;
136b3a44c85SBarry Smith       goto ok1;
137b3a44c85SBarry Smith     }
1382e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
139b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
140b3a44c85SBarry Smith     }
141b3a44c85SBarry Smith     cnt++;
142b3a44c85SBarry Smith   ok1:;
143b3a44c85SBarry Smith   }
1442e5835c6SStefano Zampini   if (!cnt) {
1459566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1463ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1472e5835c6SStefano Zampini   }
1489566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
149b3a44c85SBarry Smith   cnt = 0;
150b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
151b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
152b3a44c85SBarry Smith     if (!n) continue;
1532e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
154b3a44c85SBarry Smith       if (aa[j] != 0.0) {
155b3a44c85SBarry Smith         rows[cnt++] = i;
156b3a44c85SBarry Smith         break;
157b3a44c85SBarry Smith       }
158b3a44c85SBarry Smith     }
159b3a44c85SBarry Smith   }
1609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1619566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
1623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
163b3a44c85SBarry Smith }
164b3a44c85SBarry Smith 
165d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
166d71ae5a4SJacob Faibussowitsch {
16779299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)Y->data;
16899e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16999e65526SBarry Smith   const PetscInt    *diag;
1702e5835c6SStefano Zampini   MatScalar         *aa;
17199e65526SBarry Smith   const PetscScalar *v;
172ace3abfcSBarry Smith   PetscBool          missing;
17379299369SBarry Smith 
17479299369SBarry Smith   PetscFunctionBegin;
17509f38230SBarry Smith   if (Y->assembled) {
1769566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL));
17709f38230SBarry Smith     if (!missing) {
17879299369SBarry Smith       diag = aij->diag;
1799566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1809566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
18179299369SBarry Smith       if (is == INSERT_VALUES) {
182ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
18379299369SBarry Smith       } else {
184ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
18579299369SBarry Smith       }
1869566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1879566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
1883ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
18979299369SBarry Smith     }
19009f38230SBarry Smith   }
1919566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
1923ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
19309f38230SBarry Smith }
19479299369SBarry Smith 
195d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
196d71ae5a4SJacob Faibussowitsch {
197416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19897f1f81fSBarry Smith   PetscInt    i, ishift;
19917ab2063SBarry Smith 
2003a40ed3dSBarry Smith   PetscFunctionBegin;
201f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
2023ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
203bfeeae90SHong Zhang   ishift = 0;
204b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
2059566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
206bfeeae90SHong Zhang   } else if (oshift == 1) {
2071a83f524SJed Brown     PetscInt *tia;
208d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2093b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2109566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2111a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2121a83f524SJed Brown     *ia = tia;
213ecc77c7aSBarry Smith     if (ja) {
2141a83f524SJed Brown       PetscInt *tja;
2159566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2161a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2171a83f524SJed Brown       *ja = tja;
218ecc77c7aSBarry Smith     }
2196945ee14SBarry Smith   } else {
220ecc77c7aSBarry Smith     *ia = a->i;
221ecc77c7aSBarry Smith     if (ja) *ja = a->j;
222a2ce50c7SBarry Smith   }
2233ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
224a2744918SBarry Smith }
225a2744918SBarry Smith 
226d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
227d71ae5a4SJacob Faibussowitsch {
2283a40ed3dSBarry Smith   PetscFunctionBegin;
2293ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
230b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2319566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2329566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
233bcd2baecSBarry Smith   }
2343ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23517ab2063SBarry Smith }
23617ab2063SBarry Smith 
237d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
238d71ae5a4SJacob Faibussowitsch {
2393b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
240d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
24197f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2423b2fbd54SBarry Smith 
2433a40ed3dSBarry Smith   PetscFunctionBegin;
244899cda47SBarry Smith   *nn = n;
2453ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2463b2fbd54SBarry Smith   if (symmetric) {
2479566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2483b2fbd54SBarry Smith   } else {
2499566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2509566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2523b2fbd54SBarry Smith     jj = a->j;
253ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2543b2fbd54SBarry Smith     cia[0] = oshift;
255ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2569566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2573b2fbd54SBarry Smith     jj = a->j;
258a93ec695SBarry Smith     for (row = 0; row < m; row++) {
259a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
260a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
261bfeeae90SHong Zhang         col = *jj++;
2622205254eSKarl Rupp 
2633b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2643b2fbd54SBarry Smith       }
2653b2fbd54SBarry Smith     }
2669566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2679371c9d4SSatish Balay     *ia = cia;
2689371c9d4SSatish Balay     *ja = cja;
2693b2fbd54SBarry Smith   }
2703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2713b2fbd54SBarry Smith }
2723b2fbd54SBarry Smith 
273d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
274d71ae5a4SJacob Faibussowitsch {
2753a40ed3dSBarry Smith   PetscFunctionBegin;
2763ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
2773b2fbd54SBarry Smith 
2789566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2799566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2813b2fbd54SBarry Smith }
2823b2fbd54SBarry Smith 
2837cee066cSHong Zhang /*
2847cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2857cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
286040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2877cee066cSHong Zhang */
288d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
289d71ae5a4SJacob Faibussowitsch {
2907cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2917cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
292071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2937cee066cSHong Zhang   PetscInt       *cspidx;
294071fcb05SBarry Smith   const PetscInt *jj;
2957cee066cSHong Zhang 
2967cee066cSHong Zhang   PetscFunctionBegin;
2977cee066cSHong Zhang   *nn = n;
2983ba16761SJacob Faibussowitsch   if (!ia) PetscFunctionReturn(PETSC_SUCCESS);
299625f6d37SHong Zhang 
3009566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
3019566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
3029566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
3039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
3047cee066cSHong Zhang   jj = a->j;
305ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
3067cee066cSHong Zhang   cia[0] = oshift;
307ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3089566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3097cee066cSHong Zhang   jj = a->j;
3107cee066cSHong Zhang   for (row = 0; row < m; row++) {
3117cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3127cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3137cee066cSHong Zhang       col         = *jj++;
314071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
315071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
316071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3177cee066cSHong Zhang     }
3187cee066cSHong Zhang   }
3199566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
320071fcb05SBarry Smith   *ia    = cia;
321071fcb05SBarry Smith   *ja    = cja;
3227cee066cSHong Zhang   *spidx = cspidx;
3233ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3247cee066cSHong Zhang }
3257cee066cSHong Zhang 
326d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
327d71ae5a4SJacob Faibussowitsch {
3287cee066cSHong Zhang   PetscFunctionBegin;
3299566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3309566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3313ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3327cee066cSHong Zhang }
3337cee066cSHong Zhang 
334ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
335d71ae5a4SJacob Faibussowitsch {
33687d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33787d4246cSBarry Smith   PetscInt    *ai = a->i;
338fff043a9SJunchao Zhang   PetscScalar *aa;
33987d4246cSBarry Smith 
34087d4246cSBarry Smith   PetscFunctionBegin;
3419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3429566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3443ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
34587d4246cSBarry Smith }
34687d4246cSBarry Smith 
347bd04181cSBarry Smith /*
348bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
349bd04181cSBarry Smith 
350bd04181cSBarry Smith       -   a single row of values is set with each call
351bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
352bd04181cSBarry Smith       -   the values are always added to the matrix, not set
353bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
354bd04181cSBarry Smith 
3551f763a69SBarry Smith      This does NOT assume the global column indices are sorted
356bd04181cSBarry Smith 
3571f763a69SBarry Smith */
358bd04181cSBarry Smith 
359af0996ceSBarry Smith #include <petsc/private/isimpl.h>
360d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
361d71ae5a4SJacob Faibussowitsch {
362189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3631f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3641f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3651f763a69SBarry Smith   PetscInt        lastcol = -1;
366fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
367189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
368189e4007SBarry Smith 
369fff043a9SJunchao Zhang   PetscFunctionBegin;
3709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
371f38dd0b8SBarry Smith   row  = ridx[im[0]];
3721f763a69SBarry Smith   rp   = aj + ai[row];
3731f763a69SBarry Smith   ap   = aa + ai[row];
3741f763a69SBarry Smith   nrow = ailen[row];
375189e4007SBarry Smith   low  = 0;
376189e4007SBarry Smith   high = nrow;
377189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
378189e4007SBarry Smith     col   = cidx[in[l]];
379f38dd0b8SBarry Smith     value = v[l];
380189e4007SBarry Smith 
381189e4007SBarry Smith     if (col <= lastcol) low = 0;
382189e4007SBarry Smith     else high = nrow;
383189e4007SBarry Smith     lastcol = col;
384189e4007SBarry Smith     while (high - low > 5) {
385189e4007SBarry Smith       t = (low + high) / 2;
386189e4007SBarry Smith       if (rp[t] > col) high = t;
387189e4007SBarry Smith       else low = t;
388189e4007SBarry Smith     }
389189e4007SBarry Smith     for (i = low; i < high; i++) {
390189e4007SBarry Smith       if (rp[i] == col) {
3911f763a69SBarry Smith         ap[i] += value;
392189e4007SBarry Smith         low = i + 1;
3931f763a69SBarry Smith         break;
394189e4007SBarry Smith       }
395189e4007SBarry Smith     }
396189e4007SBarry Smith   }
3979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
3983ba16761SJacob Faibussowitsch   return PETSC_SUCCESS;
399189e4007SBarry Smith }
400189e4007SBarry Smith 
/*
  MatSetValues_SeqAIJ - Inserts or adds an m by n block of values into the matrix.

  Input Parameters:
+ A  - the matrix
. m  - number of rows in the block
. im - row indices; negative entries are skipped
. n  - number of columns in the block
. in - column indices; negative entries are skipped
. v  - the values, read as v[l + k * n] when a->roworiented is set and as v[k + l * m] otherwise;
       may be NULL, in which case the value 0.0 is used
- is - ADD_VALUES to add to existing entries, otherwise existing entries are overwritten

  Notes:
  A row index >= A->rmap->n or a column index >= A->cmap->n raises PETSC_ERR_ARG_OUTOFRANGE.

  When the location is not yet part of the row, the outcome depends on a->nonew: 1 drops the value
  silently, -1 raises an error, any other value inserts the entry (the reallocation macros are
  invoked first; NOTE(review): they presumably grow the storage when the row is full, and appear
  to rely on the locals ii and N declared here - confirm against their definition).

  When A->structure_only is set, no values are read from v or written to the value array.
*/
PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
{
  Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
  PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
  PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
  PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1; /* lastcol is never reset, so it carries over from one row to the next */
  MatScalar  *ap = NULL, value = 0.0, *aa;
  PetscBool   ignorezeroentries = a->ignorezeroentries;
  PetscBool   roworiented       = a->roworiented;

  PetscFunctionBegin;
  PetscCall(MatSeqAIJGetArray(A, &aa));
  for (k = 0; k < m; k++) { /* loop over added rows */
    row = im[k];
    if (row < 0) continue;
    PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
    /* rp/ap: column indices and values of this row; rmax: imax[row]; nrow: entries currently in use */
    rp = PetscSafePointerPlusOffset(aj, ai[row]);
    if (!A->structure_only) ap = PetscSafePointerPlusOffset(aa, ai[row]);
    rmax = imax[row];
    nrow = ailen[row];
    low  = 0;
    high = nrow;
    for (l = 0; l < n; l++) { /* loop over added columns */
      if (in[l] < 0) continue;
      PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
      col = in[l];
      if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
      /* adding an off-diagonal zero changes nothing, so skip it when zero entries are to be ignored */
      if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;

      /* reuse the search window of the previous column when columns arrive in increasing order */
      if (col <= lastcol) low = 0;
      else high = nrow;
      lastcol = col;
      /* bisection until the window holds at most 5 entries, then a linear scan */
      while (high - low > 5) {
        t = (low + high) / 2;
        if (rp[t] > col) high = t;
        else low = t;
      }
      for (i = low; i < high; i++) {
        if (rp[i] > col) break; /* passed the spot: i is the insertion position */
        if (rp[i] == col) {
          /* location already exists: update in place */
          if (!A->structure_only) {
            if (is == ADD_VALUES) {
              ap[i] += value;
              (void)PetscLogFlops(1.0);
            } else ap[i] = value;
          }
          low = i + 1;
          goto noinsert;
        }
      }
      /* the location is new; decide whether it may be created */
      if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
      if (nonew == 1) goto noinsert;
      PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
      if (A->structure_only) {
        MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
      } else {
        MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
      }
      /* N is the index of the last entry in use before the insertion; nrow then counts the new entry */
      N = nrow++ - 1;
      a->nz++;
      high++;
      /* shift up all the later entries in this row */
      PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
      rp[i] = col;
      if (!A->structure_only) {
        PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
        ap[i] = value;
      }
      low = i + 1;
    noinsert:;
    }
    /* publish the updated number of entries in use for this row */
    ailen[row] = nrow;
  }
  PetscCall(MatSeqAIJRestoreArray(A, &aa));
  PetscFunctionReturn(PETSC_SUCCESS);
}
47717ab2063SBarry Smith 
478ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
479d71ae5a4SJacob Faibussowitsch {
48019b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
48119b08ed1SBarry Smith   PetscInt   *rp, k, row;
48219b08ed1SBarry Smith   PetscInt   *ai = a->i;
48319b08ed1SBarry Smith   PetscInt   *aj = a->j;
484fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
48519b08ed1SBarry Smith 
48619b08ed1SBarry Smith   PetscFunctionBegin;
48728b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
48808401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
489fff043a9SJunchao Zhang 
4909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
49119b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
49219b08ed1SBarry Smith     row = im[k];
49319b08ed1SBarry Smith     rp  = aj + ai[row];
4948e3a54c0SPierre Jolivet     ap  = PetscSafePointerPlusOffset(aa, ai[row]);
49519b08ed1SBarry Smith 
4969566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
49719b08ed1SBarry Smith     if (!A->structure_only) {
49819b08ed1SBarry Smith       if (v) {
4999566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
50019b08ed1SBarry Smith         v += n;
50119b08ed1SBarry Smith       } else {
5029566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
50319b08ed1SBarry Smith       }
50419b08ed1SBarry Smith     }
50519b08ed1SBarry Smith     a->ilen[row]  = n;
50619b08ed1SBarry Smith     a->imax[row]  = n;
50719b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
50819b08ed1SBarry Smith     a->nz += n;
50919b08ed1SBarry Smith   }
5109566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51219b08ed1SBarry Smith }
51319b08ed1SBarry Smith 
51419b08ed1SBarry Smith /*@
51519b08ed1SBarry Smith   MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51619b08ed1SBarry Smith 
51719b08ed1SBarry Smith   Input Parameters:
51811a5261eSBarry Smith + A       - the `MATSEQAIJ` matrix
51919b08ed1SBarry Smith - nztotal - bound on the number of nonzeros
52019b08ed1SBarry Smith 
52119b08ed1SBarry Smith   Level: advanced
52219b08ed1SBarry Smith 
52319b08ed1SBarry Smith   Notes:
52419b08ed1SBarry Smith   This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
52511a5261eSBarry Smith   Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52619b08ed1SBarry Smith   as always with multiple matrix assemblies.
52719b08ed1SBarry Smith 
5281cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
52919b08ed1SBarry Smith @*/
530d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
531d71ae5a4SJacob Faibussowitsch {
53219b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
53319b08ed1SBarry Smith 
53419b08ed1SBarry Smith   PetscFunctionBegin;
5359566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5369566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
53719b08ed1SBarry Smith   a->maxnz = nztotal;
5383a7d0413SPierre Jolivet   if (!a->imax) PetscCall(PetscMalloc1(A->rmap->n, &a->imax));
53919b08ed1SBarry Smith   if (!a->ilen) {
5409566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
54119b08ed1SBarry Smith   } else {
5429566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
54319b08ed1SBarry Smith   }
54419b08ed1SBarry Smith 
54519b08ed1SBarry Smith   /* allocate the matrix space */
5469f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(A->rmap->n + 1, sizeof(PetscInt), (void **)&a->i));
5479f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscInt), (void **)&a->j));
5489f0612e4SBarry Smith   a->free_ij = PETSC_TRUE;
54919b08ed1SBarry Smith   if (A->structure_only) {
55019b08ed1SBarry Smith     a->free_a = PETSC_FALSE;
55119b08ed1SBarry Smith   } else {
5529f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nztotal, sizeof(PetscScalar), (void **)&a->a));
55319b08ed1SBarry Smith     a->free_a = PETSC_TRUE;
55419b08ed1SBarry Smith   }
5559f0612e4SBarry Smith   a->i[0]           = 0;
55619b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
55719b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
5583ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55919b08ed1SBarry Smith }
56019b08ed1SBarry Smith 
561ba38deedSJacob Faibussowitsch static PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
562d71ae5a4SJacob Faibussowitsch {
563071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
564071fcb05SBarry Smith   PetscInt   *rp, k, row;
565071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
566071fcb05SBarry Smith   PetscInt   *aj = a->j;
567fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
568071fcb05SBarry Smith 
569071fcb05SBarry Smith   PetscFunctionBegin;
5709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
571071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
572071fcb05SBarry Smith     row = im[k];
5736bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
574071fcb05SBarry Smith     rp = aj + ai[row];
575071fcb05SBarry Smith     ap = aa + ai[row];
57648a46eb9SPierre Jolivet     if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
577071fcb05SBarry Smith     if (!A->structure_only) {
578071fcb05SBarry Smith       if (v) {
5799566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
580071fcb05SBarry Smith         v += n;
581071fcb05SBarry Smith       } else {
5829566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
583071fcb05SBarry Smith       }
584071fcb05SBarry Smith     }
585071fcb05SBarry Smith     ailen[row] = n;
586071fcb05SBarry Smith     a->nz += n;
587071fcb05SBarry Smith   }
5889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
5893ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
590071fcb05SBarry Smith }
591071fcb05SBarry Smith 
592ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
593d71ae5a4SJacob Faibussowitsch {
5947eb43aa7SLois Curfman McInnes   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
59597f1f81fSBarry Smith   PetscInt        *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
59697f1f81fSBarry Smith   PetscInt        *ai = a->i, *ailen = a->ilen;
5974e208921SJed Brown   const MatScalar *ap, *aa;
5987eb43aa7SLois Curfman McInnes 
5993a40ed3dSBarry Smith   PetscFunctionBegin;
6004e208921SJed Brown   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
6017eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6027eb43aa7SLois Curfman McInnes     row = im[k];
6039371c9d4SSatish Balay     if (row < 0) {
6049371c9d4SSatish Balay       v += n;
6059371c9d4SSatish Balay       continue;
6069371c9d4SSatish Balay     } /* negative row */
60754c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6088e3a54c0SPierre Jolivet     rp   = PetscSafePointerPlusOffset(aj, ai[row]);
6098e3a54c0SPierre Jolivet     ap   = PetscSafePointerPlusOffset(aa, ai[row]);
6107eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6117eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6129371c9d4SSatish Balay       if (in[l] < 0) {
6139371c9d4SSatish Balay         v++;
6149371c9d4SSatish Balay         continue;
6159371c9d4SSatish Balay       } /* negative column */
61654c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
617bfeeae90SHong Zhang       col  = in[l];
6189371c9d4SSatish Balay       high = nrow;
6199371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6207eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6217eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6227eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6237eb43aa7SLois Curfman McInnes         else low = t;
6247eb43aa7SLois Curfman McInnes       }
6257eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6267eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6277eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
628b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6297eb43aa7SLois Curfman McInnes           goto finished;
6307eb43aa7SLois Curfman McInnes         }
6317eb43aa7SLois Curfman McInnes       }
63297e567efSBarry Smith       *v++ = 0.0;
6337eb43aa7SLois Curfman McInnes     finished:;
6347eb43aa7SLois Curfman McInnes     }
6357eb43aa7SLois Curfman McInnes   }
6364e208921SJed Brown   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
6373ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6387eb43aa7SLois Curfman McInnes }
6397eb43aa7SLois Curfman McInnes 
640ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
641d71ae5a4SJacob Faibussowitsch {
6423ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
643c898d852SStefano Zampini   const PetscScalar *av;
6443ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6453ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
64617ab2063SBarry Smith 
6473a40ed3dSBarry Smith   PetscFunctionBegin;
6489566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6492205254eSKarl Rupp 
6503ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6513ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6523ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6533ea6fe3dSLisandro Dalcin   nz = A->nz;
654416022c9SBarry Smith 
6553ea6fe3dSLisandro Dalcin   /* write matrix header */
6563ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6579371c9d4SSatish Balay   header[1] = M;
6589371c9d4SSatish Balay   header[2] = N;
6599371c9d4SSatish Balay   header[3] = nz;
6609566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
661416022c9SBarry Smith 
6623ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6639566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6643ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
665e457bb90SBarry Smith   if (PetscDefined(USE_DEBUG)) {
666e457bb90SBarry Smith     PetscInt mnz = 0;
667e457bb90SBarry Smith 
668e457bb90SBarry Smith     for (i = 0; i < m; i++) mnz += rowlens[i];
669e457bb90SBarry Smith     PetscCheck(nz == mnz, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row lens %" PetscInt_FMT " do not sum to nz %" PetscInt_FMT, mnz, nz);
670e457bb90SBarry Smith   }
6719566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6729566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6733ea6fe3dSLisandro Dalcin   /* store column indices */
6749566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
675416022c9SBarry Smith   /* store nonzero values */
6769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6779566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
679b37d52dbSMark F. Adams 
6803ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6819566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
68317ab2063SBarry Smith }
684416022c9SBarry Smith 
685d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
686d71ae5a4SJacob Faibussowitsch {
6877dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6887dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6897dc0baabSHong Zhang 
6907dc0baabSHong Zhang   PetscFunctionBegin;
6919566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6927dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6939566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
69448a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6959566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6967dc0baabSHong Zhang   }
6979566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
6983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
6997dc0baabSHong Zhang }
7007dc0baabSHong Zhang 
/*
  MatView_SeqAIJ_ASCII - Prints the matrix to an ASCII viewer in the layout selected by the viewer's format.

  A structure-only matrix is delegated to MatView_SeqAIJ_ASCII_structonly(). The info formats
  (FACTOR_INFO, INFO, INFO_DETAIL) print nothing here. Dedicated layouts exist for the MATLAB, COMMON,
  SYMMODU, DENSE and MATRIXMARKET formats; every other format prints one "row i: (col, value) ..."
  line per row, with a separate layout when the matrix is a factor (A->factortype is set).
  Each layout switches viewer tabbing off while it prints and back on when done; the viewer is
  flushed at the end.
*/
701ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
702d71ae5a4SJacob Faibussowitsch {
703416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
704c898d852SStefano Zampini   const PetscScalar *av;
70560e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
706e060cb09SBarry Smith   const char        *name;
707f3ef73ceSBarry Smith   PetscViewerFormat  format;
70817ab2063SBarry Smith 
7093a40ed3dSBarry Smith   PetscFunctionBegin;
7107dc0baabSHong Zhang   if (A->structure_only) {
7119566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7123ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
7137dc0baabSHong Zhang   }
71443e49210SHong Zhang 
7159566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
716bd6a2ce3SJunchao Zhang   // By petsc's rule, even PETSC_VIEWER_ASCII_INFO_DETAIL doesn't print matrix entries
7173ba16761SJacob Faibussowitsch   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(PETSC_SUCCESS);
7182e5835c6SStefano Zampini 
719c898d852SStefano Zampini   /* trigger copy to CPU if needed */
  /* the array is restored immediately; the code below reads the values through a->a directly */
7209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
72271c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
    /* MATLAB: emit "row col value" lines with 1-based indices into zzz, then build the matrix with spconvert() */
72397f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
    /* an explicit zero at (m, n) is appended when the last row is empty or the last stored entry is not in the last column */
72460e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
725c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
726d00d2cf4SBarry Smith       nofinalvalue = 1;
727d00d2cf4SBarry Smith     }
7289566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7299566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7309566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
731fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7329566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
733fbfe6fa7SJed Brown #else
7349566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
735fbfe6fa7SJed Brown #endif
7369566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
73717ab2063SBarry Smith 
73817ab2063SBarry Smith     for (i = 0; i < m; i++) {
73960e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
740aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7419566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
74217ab2063SBarry Smith #else
7439566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
74417ab2063SBarry Smith #endif
74517ab2063SBarry Smith       }
74617ab2063SBarry Smith     }
747d00d2cf4SBarry Smith     if (nofinalvalue) {
748c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7499566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
750c337ccceSJed Brown #else
7519566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
752c337ccceSJed Brown #endif
753d00d2cf4SBarry Smith     }
7549566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7559566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7569566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
757fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
    /* COMMON: one line per row; an entry is printed only when its value (its real part, for complex scalars) is nonzero */
7589566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
75944cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7609566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
76160e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
762aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
76336db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7649566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76536db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7669566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
76736db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7689566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7696831982aSBarry Smith         }
77044cd7ae7SLois Curfman McInnes #else
7719566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
77244cd7ae7SLois Curfman McInnes #endif
77344cd7ae7SLois Curfman McInnes       }
7749566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77544cd7ae7SLois Curfman McInnes     }
7769566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
777fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
    /* SYMMODU: only entries with column >= row are used; prints size and count, 1-based row offsets, column indices, then values */
77897f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7799566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7809566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
    /* sptr[i] is the 1-based position of row i's first counted entry; nzd counts nonzero-valued entries with column >= row */
781496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
782496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
78360e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
784496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
785aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78636db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
787496be53dSLois Curfman McInnes #else
788496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
789496be53dSLois Curfman McInnes #endif
790496be53dSLois Curfman McInnes         }
791496be53dSLois Curfman McInnes       }
792496be53dSLois Curfman McInnes     }
7932e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7949566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
    /* print the m + 1 offsets six per line; the chain below handles the shorter final line */
7952e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7962205254eSKarl Rupp       if (i + 4 < m) {
7979566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
7982205254eSKarl Rupp       } else if (i + 3 < m) {
7999566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
8002205254eSKarl Rupp       } else if (i + 2 < m) {
8019566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
8022205254eSKarl Rupp       } else if (i + 1 < m) {
8039566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
8042205254eSKarl Rupp       } else if (i < m) {
8059566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8062205254eSKarl Rupp       } else {
8079566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8082205254eSKarl Rupp       }
809496be53dSLois Curfman McInnes     }
8109566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8119566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
    /* NOTE(review): column indices below are printed for every entry with column >= row, while nzd and the value loop skip zero-valued entries - confirm this is intended */
812496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81360e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8149566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
815496be53dSLois Curfman McInnes       }
8169566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
817496be53dSLois Curfman McInnes     }
8189566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
819496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
82060e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
821496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
822aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
82348a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
824496be53dSLois Curfman McInnes #else
8259566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
826496be53dSLois Curfman McInnes #endif
827496be53dSLois Curfman McInnes         }
828496be53dSLois Curfman McInnes       }
8299566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
830496be53dSLois Curfman McInnes     }
8319566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
832fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
    /* DENSE: print every (row, column) location, using 0.0 where nothing is stored */
83397f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
83487828ca2SBarry Smith     PetscScalar value;
83568f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83668f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
83768f1ed48SBarry Smith 
83868f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
83968f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
84068f1ed48SBarry Smith         realonly = PETSC_FALSE;
84168f1ed48SBarry Smith         break;
84268f1ed48SBarry Smith       }
84368f1ed48SBarry Smith     }
84468f1ed48SBarry Smith #endif
84502594712SBarry Smith 
8469566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
    /* cnt walks the stored entries once across all rows; jcnt counts the entries consumed in the current row */
    /* NOTE(review): matching j against a->j[cnt] appears to assume column indices are sorted within each row - confirm */
84702594712SBarry Smith     for (i = 0; i < m; i++) {
84802594712SBarry Smith       jcnt = 0;
849d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
850e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
85102594712SBarry Smith           value = a->a[cnt++];
852e24b481bSBarry Smith           jcnt++;
85302594712SBarry Smith         } else {
85402594712SBarry Smith           value = 0.0;
85502594712SBarry Smith         }
856aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
85768f1ed48SBarry Smith         if (realonly) {
8589566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
85968f1ed48SBarry Smith         } else {
8609566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
86168f1ed48SBarry Smith         }
86202594712SBarry Smith #else
8639566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
86402594712SBarry Smith #endif
86502594712SBarry Smith       }
8669566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
86702594712SBarry Smith     }
8689566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8693c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
    /* MATRIXMARKET: banner line, "rows cols nz" line, then one coordinate line per stored entry with 1-based indices */
870150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8719566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8723c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8739566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8743c215bfdSMatthew Knepley #else
8759566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8763c215bfdSMatthew Knepley #endif
8779566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8783c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
87960e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8803c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8819566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8823c215bfdSMatthew Knepley #else
8839566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8843c215bfdSMatthew Knepley #endif
8853c215bfdSMatthew Knepley       }
8863c215bfdSMatthew Knepley     }
8879566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8883a40ed3dSBarry Smith   } else {
    /* any other format: "row i: (col, value) ..." with 0-based indices, zero values included */
8899566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
890d5f3da31SBarry Smith     if (A->factortype) {
      /* factored matrix: each row is printed as its a->i range, then the a->diag[i] entry, then the range between a->diag[i + 1] and a->diag[i] */
89116cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8929566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
89316cd7e1dSShri Abhyankar         /* L part */
89460e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89516cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
89616cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
8979566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
89816cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
8999566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
90016cd7e1dSShri Abhyankar           } else {
9019566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
90216cd7e1dSShri Abhyankar           }
90316cd7e1dSShri Abhyankar #else
9049566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90516cd7e1dSShri Abhyankar #endif
90616cd7e1dSShri Abhyankar         }
90716cd7e1dSShri Abhyankar         /* diagonal */
        /* the reciprocal of the stored value is printed; presumably the factor stores the inverted diagonal - confirm */
90816cd7e1dSShri Abhyankar         j = a->diag[i];
90916cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
91016cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
911835f2295SStefano Zampini           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)PetscImaginaryPart(1 / a->a[j])));
91216cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
913835f2295SStefano Zampini           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1 / a->a[j]), (double)(-PetscImaginaryPart(1 / a->a[j]))));
91416cd7e1dSShri Abhyankar         } else {
915835f2295SStefano Zampini           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1 / a->a[j])));
91616cd7e1dSShri Abhyankar         }
91716cd7e1dSShri Abhyankar #else
918835f2295SStefano Zampini         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1 / a->a[j])));
91916cd7e1dSShri Abhyankar #endif
92016cd7e1dSShri Abhyankar 
92116cd7e1dSShri Abhyankar         /* U part */
92260e0710aSBarry Smith         for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
92316cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
92416cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9259566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
92616cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9279566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
92816cd7e1dSShri Abhyankar           } else {
9299566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
93016cd7e1dSShri Abhyankar           }
93116cd7e1dSShri Abhyankar #else
9329566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
93316cd7e1dSShri Abhyankar #endif
93416cd7e1dSShri Abhyankar         }
9359566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
93616cd7e1dSShri Abhyankar       }
93716cd7e1dSShri Abhyankar     } else {
      /* unfactored matrix: every stored entry of each row, in storage order */
93817ab2063SBarry Smith       for (i = 0; i < m; i++) {
9399566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
94060e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
941aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
94236db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9439566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
94436db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9459566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9463a40ed3dSBarry Smith           } else {
9479566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
94817ab2063SBarry Smith           }
94917ab2063SBarry Smith #else
9509566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
95117ab2063SBarry Smith #endif
95217ab2063SBarry Smith         }
9539566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
95417ab2063SBarry Smith       }
95516cd7e1dSShri Abhyankar     }
9569566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
95717ab2063SBarry Smith   }
9589566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9593ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
960416022c9SBarry Smith }
961416022c9SBarry Smith 
9629804daf3SBarry Smith #include <petscdraw.h>
963ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
964d71ae5a4SJacob Faibussowitsch {
965480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
966416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
967383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
968383922c3SLisandro Dalcin   int                color;
969b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
970b0a32e0cSBarry Smith   PetscViewer        viewer;
971f3ef73ceSBarry Smith   PetscViewerFormat  format;
972fff043a9SJunchao Zhang   const PetscScalar *aa;
973cddf8d76SBarry Smith 
9743a40ed3dSBarry Smith   PetscFunctionBegin;
9759566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9769566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9779566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
978383922c3SLisandro Dalcin 
979416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
981fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
982d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9830513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
984b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
985416022c9SBarry Smith     for (i = 0; i < m; i++) {
9869371c9d4SSatish Balay       y_l = m - i - 1.0;
9879371c9d4SSatish Balay       y_r = y_l + 1.0;
988bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9899371c9d4SSatish Balay         x_l = a->j[j];
9909371c9d4SSatish Balay         x_r = x_l + 1.0;
991fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9929566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
993cddf8d76SBarry Smith       }
994cddf8d76SBarry Smith     }
995b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
996cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
9979371c9d4SSatish Balay       y_l = m - i - 1.0;
9989371c9d4SSatish Balay       y_r = y_l + 1.0;
999bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10009371c9d4SSatish Balay         x_l = a->j[j];
10019371c9d4SSatish Balay         x_r = x_l + 1.0;
1002fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
10039566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1004cddf8d76SBarry Smith       }
1005cddf8d76SBarry Smith     }
1006b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1007cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10089371c9d4SSatish Balay       y_l = m - i - 1.0;
10099371c9d4SSatish Balay       y_r = y_l + 1.0;
1010bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10119371c9d4SSatish Balay         x_l = a->j[j];
10129371c9d4SSatish Balay         x_r = x_l + 1.0;
1013fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10149566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1015416022c9SBarry Smith       }
1016416022c9SBarry Smith     }
1017d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10180513a670SBarry Smith   } else {
10190513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10200513a670SBarry Smith     /* first determine max of all nonzero values */
1021b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1022383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1023b0a32e0cSBarry Smith     PetscDraw popup;
10240513a670SBarry Smith 
10250513a670SBarry Smith     for (i = 0; i < nz; i++) {
1026fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10270513a670SBarry Smith     }
1028383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10299566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10309566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1031383922c3SLisandro Dalcin 
1032d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10330513a670SBarry Smith     for (i = 0; i < m; i++) {
1034383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1035383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1036bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1037383922c3SLisandro Dalcin         x_l   = a->j[j];
1038383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1039fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10409566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10410513a670SBarry Smith         count++;
10420513a670SBarry Smith       }
10430513a670SBarry Smith     }
1044d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10450513a670SBarry Smith   }
10469566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
10473ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1048480ef9eaSBarry Smith }
1049cddf8d76SBarry Smith 
10509804daf3SBarry Smith #include <petscdraw.h>
1051ba38deedSJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1052d71ae5a4SJacob Faibussowitsch {
1053b0a32e0cSBarry Smith   PetscDraw draw;
105436db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1055ace3abfcSBarry Smith   PetscBool isnull;
1056480ef9eaSBarry Smith 
1057480ef9eaSBarry Smith   PetscFunctionBegin;
10589566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10599566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
10603ba16761SJacob Faibussowitsch   if (isnull) PetscFunctionReturn(PETSC_SUCCESS);
1061480ef9eaSBarry Smith 
10629371c9d4SSatish Balay   xr = A->cmap->n;
10639371c9d4SSatish Balay   yr = A->rmap->n;
10649371c9d4SSatish Balay   h  = yr / 10.0;
10659371c9d4SSatish Balay   w  = xr / 10.0;
10669371c9d4SSatish Balay   xr += w;
10679371c9d4SSatish Balay   yr += h;
10689371c9d4SSatish Balay   xl = -w;
10699371c9d4SSatish Balay   yl = -h;
10709566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10719566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10729566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10739566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10749566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10753ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1076416022c9SBarry Smith }
1077416022c9SBarry Smith 
1078d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1079d71ae5a4SJacob Faibussowitsch {
10809f196a02SMartin Diehl   PetscBool isascii, isbinary, isdraw;
1081416022c9SBarry Smith 
10823a40ed3dSBarry Smith   PetscFunctionBegin;
10839f196a02SMartin Diehl   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &isascii));
10849566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10859566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10869f196a02SMartin Diehl   if (isascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10871baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10881baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10899566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
109117ab2063SBarry Smith }
109219bcc07fSBarry Smith 
1093d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1094d71ae5a4SJacob Faibussowitsch {
1095416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1096580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
1097*07425a8dSBarry Smith   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0;
109854f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
10993447b6efSHong Zhang   PetscReal   ratio = 0.6;
110017ab2063SBarry Smith 
11013a40ed3dSBarry Smith   PetscFunctionBegin;
11023ba16761SJacob Faibussowitsch   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(PETSC_SUCCESS);
1103b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
110455a7f34eSJunchao Zhang     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies, e.g., via MatSetOption(A, MAT_USE_INODES, val) */
110555a7f34eSJunchao Zhang     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode)); /* read the sparsity pattern */
11063ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1107b215bc84SStefano Zampini   }
110817ab2063SBarry Smith 
110943ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
111017ab2063SBarry Smith   for (i = 1; i < m; i++) {
1111416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
111217ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
111394a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111417ab2063SBarry Smith     if (fshift) {
1115bfeeae90SHong Zhang       ip = aj + ai[i];
1116bfeeae90SHong Zhang       ap = aa + ai[i];
111717ab2063SBarry Smith       N  = ailen[i];
11189566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
111948a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
112017ab2063SBarry Smith     }
112117ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
112217ab2063SBarry Smith   }
112317ab2063SBarry Smith   if (m) {
112417ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112517ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
112617ab2063SBarry Smith   }
112717ab2063SBarry Smith   /* reset ilen and imax for each row */
11287b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1129396832f4SHong Zhang   if (A->structure_only) {
11309566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11319566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1132396832f4SHong Zhang   } else { /* !A->structure_only */
113317ab2063SBarry Smith     for (i = 0; i < m; i++) {
113417ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11357b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
113617ab2063SBarry Smith     }
1137396832f4SHong Zhang   }
1138bfeeae90SHong Zhang   a->nz = ai[m];
1139aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
1140bc43efbbSJunchao Zhang   PetscCall(MatMarkDiagonal_SeqAIJ(A)); // since diagonal info is used a lot, it is helpful to set them up at the end of assembly
11419566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11429566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11439566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11442205254eSKarl Rupp 
11458e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1146dd5f02e7SSatish Balay   a->reallocs         = 0;
11476712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
114836db0b34SBarry Smith   a->rmax             = rmax;
11494e220ebcSLois Curfman McInnes 
115048a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11519566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
115317ab2063SBarry Smith }
115417ab2063SBarry Smith 
1155ba38deedSJacob Faibussowitsch static PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1156d71ae5a4SJacob Faibussowitsch {
115799cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
115899cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11592e5835c6SStefano Zampini   MatScalar  *aa;
116099cafbc1SBarry Smith 
116199cafbc1SBarry Smith   PetscFunctionBegin;
11629566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
116399cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11649566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11653ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
116699cafbc1SBarry Smith }
116799cafbc1SBarry Smith 
1168ba38deedSJacob Faibussowitsch static PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1169d71ae5a4SJacob Faibussowitsch {
117099cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
117199cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11722e5835c6SStefano Zampini   MatScalar  *aa;
117399cafbc1SBarry Smith 
117499cafbc1SBarry Smith   PetscFunctionBegin;
11759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
117699cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11783ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
117999cafbc1SBarry Smith }
118099cafbc1SBarry Smith 
1181d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1182d71ae5a4SJacob Faibussowitsch {
1183fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1184fff043a9SJunchao Zhang   MatScalar  *aa;
11853a40ed3dSBarry Smith 
11863a40ed3dSBarry Smith   PetscFunctionBegin;
11879566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
11889566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
11899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
11903ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
119117ab2063SBarry Smith }
1192416022c9SBarry Smith 
1193674b392bSAlexander static PetscErrorCode MatReset_SeqAIJ(Mat A)
1194d71ae5a4SJacob Faibussowitsch {
1195416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1196d5d45c9bSBarry Smith 
11973a40ed3dSBarry Smith   PetscFunctionBegin;
1198b4e2f619SBarry Smith   if (A->hash_active) {
1199e3c72094SPierre Jolivet     A->ops[0] = a->cops;
1200b4e2f619SBarry Smith     PetscCall(PetscHMapIJVDestroy(&a->ht));
1201b4e2f619SBarry Smith     PetscCall(PetscFree(a->dnz));
1202b4e2f619SBarry Smith     A->hash_active = PETSC_FALSE;
1203b4e2f619SBarry Smith   }
1204b4e2f619SBarry Smith 
12053ba16761SJacob Faibussowitsch   PetscCall(PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz));
12069566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12079566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12089566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12099566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12109566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12119566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12129566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12139566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12149566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12159566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12169566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12179566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
1218820d003aSStefano Zampini   a->compressedrow.use = PETSC_FALSE;
12199566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12209566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
1221674b392bSAlexander   PetscFunctionReturn(PETSC_SUCCESS);
1222674b392bSAlexander }
1223674b392bSAlexander 
1224674b392bSAlexander static PetscErrorCode MatResetHash_SeqAIJ(Mat A)
1225674b392bSAlexander {
1226674b392bSAlexander   PetscFunctionBegin;
1227674b392bSAlexander   PetscCall(MatReset_SeqAIJ(A));
1228674b392bSAlexander   PetscCall(MatCreate_SeqAIJ_Inode(A));
1229674b392bSAlexander   PetscCall(MatSetUp_Seq_Hash(A));
1230674b392bSAlexander   A->nonzerostate++;
1231674b392bSAlexander   PetscFunctionReturn(PETSC_SUCCESS);
1232674b392bSAlexander }
1233674b392bSAlexander 
1234674b392bSAlexander PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1235674b392bSAlexander {
1236674b392bSAlexander   PetscFunctionBegin;
1237674b392bSAlexander   PetscCall(MatReset_SeqAIJ(A));
12389566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1239901853e0SKris Buschelman 
12406718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12416718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12426718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12436718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12446718818eSStefano Zampini      due to different matrix sizes */
12459566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12466718818eSStefano Zampini 
12479566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12482e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12492e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12509566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12549566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12562e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12572e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12582e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12592e956fe4SStefano Zampini #endif
12604222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12619566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12629566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12639566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12644222ddf1SHong Zhang #endif
1265d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
1266d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijhipsparse_C", NULL));
1267d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", NULL));
1268d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", NULL));
1269d5e393b6SSuyash Tandon #endif
12703d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12719566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12723d0639e7SStefano Zampini #endif
12739566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1274af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1276af8000cdSHong Zhang #endif
1277d1a032dbSPierre Jolivet #if defined(PETSC_HAVE_SCALAPACK) && (defined(PETSC_USE_REAL_SINGLE) || defined(PETSC_USE_REAL_DOUBLE))
12789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1279d24d4204SJose E. Roman #endif
128063c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
128363c07aadSStefano Zampini #endif
12849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
12869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
12879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
12882e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
12899566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
12909566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
1291674b392bSAlexander   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetHash_C", NULL));
12929566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
12939566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
12949566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
12959566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
12969566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
12979566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
12989566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
12999566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
13002e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
13012e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
13022e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
13032e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
13042e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
13052e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
13062e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
13073ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
130817ab2063SBarry Smith }
130917ab2063SBarry Smith 
1310d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1311d71ae5a4SJacob Faibussowitsch {
1312416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
13133a40ed3dSBarry Smith 
13143a40ed3dSBarry Smith   PetscFunctionBegin;
1315a65d3064SKris Buschelman   switch (op) {
1316d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1317d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1318d71ae5a4SJacob Faibussowitsch     break;
1319d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1320d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1321d71ae5a4SJacob Faibussowitsch     break;
1322d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1323d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1324d71ae5a4SJacob Faibussowitsch     break;
1325d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1326d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1327d71ae5a4SJacob Faibussowitsch     break;
1328d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1329d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1330d71ae5a4SJacob Faibussowitsch     break;
1331d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1332d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1333d71ae5a4SJacob Faibussowitsch     break;
1334d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1335d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1336d71ae5a4SJacob Faibussowitsch     break;
1337d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1338d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1339d71ae5a4SJacob Faibussowitsch     break;
1340d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1341d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1342d71ae5a4SJacob Faibussowitsch     break;
1343071fcb05SBarry Smith   case MAT_SORTED_FULL:
1344071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1345071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1346071fcb05SBarry Smith     break;
1347d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1348d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1349d71ae5a4SJacob Faibussowitsch     break;
1350d71ae5a4SJacob Faibussowitsch   default:
1351888c827cSStefano Zampini     break;
1352a65d3064SKris Buschelman   }
13533ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
135417ab2063SBarry Smith }
135517ab2063SBarry Smith 
13569ee18893SBarry Smith PETSC_INTERN PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1357d71ae5a4SJacob Faibussowitsch {
1358416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1359fdc842d1SBarry Smith   PetscInt           i, j, n, *ai = a->i, *aj = a->j;
1360c898d852SStefano Zampini   PetscScalar       *x;
1361c898d852SStefano Zampini   const PetscScalar *aa;
136217ab2063SBarry Smith 
13633a40ed3dSBarry Smith   PetscFunctionBegin;
13649566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
136508401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1367d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1368d3e70bfaSHong Zhang     PetscInt *diag = a->diag;
13699566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
13702c990fa1SHong Zhang     for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13719566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13729566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13733ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
137435e7444dSHong Zhang   }
137535e7444dSHong Zhang 
13769566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
137735e7444dSHong Zhang   for (i = 0; i < n; i++) {
1378fdc842d1SBarry Smith     x[i] = 0.0;
137935e7444dSHong Zhang     for (j = ai[i]; j < ai[i + 1]; j++) {
138035e7444dSHong Zhang       if (aj[j] == i) {
138135e7444dSHong Zhang         x[i] = aa[j];
138217ab2063SBarry Smith         break;
138317ab2063SBarry Smith       }
138417ab2063SBarry Smith     }
138517ab2063SBarry Smith   }
13869566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
13879566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
138917ab2063SBarry Smith }
139017ab2063SBarry Smith 
1391c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1392d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1393d71ae5a4SJacob Faibussowitsch {
1394416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
13955f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1396d9ca1df4SBarry Smith   PetscScalar       *y;
1397d9ca1df4SBarry Smith   const PetscScalar *x;
1398d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
13995c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
14005f22a7b3SSebastian Grimberg   const MatScalar  *v;
1401a77337e4SBarry Smith   PetscScalar       alpha;
1402d9ca1df4SBarry Smith   PetscInt          n, i, j;
1403d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14043447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1405ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14065c897100SBarry Smith #endif
140717ab2063SBarry Smith 
14083a40ed3dSBarry Smith   PetscFunctionBegin;
14099566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14109566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14119566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14135c897100SBarry Smith 
14145c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1415fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14165c897100SBarry Smith #else
14173447b6efSHong Zhang   if (usecprow) {
14183447b6efSHong Zhang     m    = cprow.nrows;
14193447b6efSHong Zhang     ii   = cprow.i;
14207b2bb3b9SHong Zhang     ridx = cprow.rindex;
14213447b6efSHong Zhang   } else {
14223447b6efSHong Zhang     ii = a->i;
14233447b6efSHong Zhang   }
142417ab2063SBarry Smith   for (i = 0; i < m; i++) {
14253447b6efSHong Zhang     idx = a->j + ii[i];
1426fff043a9SJunchao Zhang     v   = aa + ii[i];
14273447b6efSHong Zhang     n   = ii[i + 1] - ii[i];
14283447b6efSHong Zhang     if (usecprow) {
14297b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14303447b6efSHong Zhang     } else {
143117ab2063SBarry Smith       alpha = x[i];
14323447b6efSHong Zhang     }
143304fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
143417ab2063SBarry Smith   }
14355c897100SBarry Smith #endif
14369566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14379566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14389566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14399566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14403ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
144117ab2063SBarry Smith }
144217ab2063SBarry Smith 
1443d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1444d71ae5a4SJacob Faibussowitsch {
14455c897100SBarry Smith   PetscFunctionBegin;
14469566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14479566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14483ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
14495c897100SBarry Smith }
14505c897100SBarry Smith 
1451c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
145278b84d54SShri Abhyankar 
1453d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1454d71ae5a4SJacob Faibussowitsch {
1455416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1456d9fead3dSBarry Smith   PetscScalar       *y;
145754f21887SBarry Smith   const PetscScalar *x;
14585914357eSBarry Smith   const MatScalar   *a_a;
1459003131ecSBarry Smith   PetscInt           m = A->rmap->n;
14605914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
1461ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
146217ab2063SBarry Smith 
1463b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
146497952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1465fee21e36SBarry Smith #endif
1466fee21e36SBarry Smith 
14673a40ed3dSBarry Smith   PetscFunctionBegin;
1468b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14699566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
14703ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1471b215bc84SStefano Zampini   }
14729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14739566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14749566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1475416022c9SBarry Smith   ii = a->i;
14764eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14779566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
147897952fefSHong Zhang     m    = a->compressedrow.nrows;
147997952fefSHong Zhang     ii   = a->compressedrow.i;
148097952fefSHong Zhang     ridx = a->compressedrow.rindex;
14815914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
14825914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
14835914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
14845914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
14855914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
14865914357eSBarry Smith       PetscScalar        sum = 0.0;
1487003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1488003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1489c9a1b032SJunchao Zhang       y[ridx[i]] = sum;
149097952fefSHong Zhang     }
149197952fefSHong Zhang   } else { /* do not use compressed row format */
1492b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
14935914357eSBarry Smith     fortranmultaij_(&m, x, ii, a->j, a_a, y);
1494b05257ddSBarry Smith #else
14955914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
14965914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
14975914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
14985914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
14995914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
15005914357eSBarry Smith       PetscScalar        sum = 0.0;
1501003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
150217ab2063SBarry Smith       y[i] = sum;
150317ab2063SBarry Smith     }
15048d195f9aSBarry Smith #endif
1505b05257ddSBarry Smith   }
15069566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15079566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15089566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15099566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
151117ab2063SBarry Smith }
151217ab2063SBarry Smith 
1513ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1514ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1515d71ae5a4SJacob Faibussowitsch {
1516b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1517b434eb95SMatthew G. Knepley   PetscScalar       *y;
1518b434eb95SMatthew G. Knepley   const PetscScalar *x;
1519fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1520b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1521b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1522b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1523b434eb95SMatthew G. Knepley   PetscScalar        sum;
1524b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1525b434eb95SMatthew G. Knepley 
1526b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1527b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1528b434eb95SMatthew G. Knepley #endif
1529b434eb95SMatthew G. Knepley 
1530b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15319566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15329566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15339566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1534b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1535b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1536b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1537b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1538b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1539b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1540b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1541fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1542b434eb95SMatthew G. Knepley       sum = 0.0;
1543b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1544b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1545b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1546b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1547b434eb95SMatthew G. Knepley     }
1548b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15493d3eaba7SBarry Smith     ii = a->i;
1550b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1551b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1552b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1553fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1554b434eb95SMatthew G. Knepley       sum = 0.0;
1555b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1556b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1557b434eb95SMatthew G. Knepley       y[i] = sum;
1558b434eb95SMatthew G. Knepley     }
1559b434eb95SMatthew G. Knepley   }
15609566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15619566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15629566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1565b434eb95SMatthew G. Knepley }
1566b434eb95SMatthew G. Knepley 
1567ba38deedSJacob Faibussowitsch // HACK!!!!! Used by src/mat/tests/ex170.c
1568ba38deedSJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1569d71ae5a4SJacob Faibussowitsch {
1570b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1571b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1572b434eb95SMatthew G. Knepley   const PetscScalar *x;
1573fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1574b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1575b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1576b434eb95SMatthew G. Knepley   PetscScalar        sum;
1577b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1578b434eb95SMatthew G. Knepley 
1579b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15809566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15819566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15829566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1583b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
158448a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1585b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1586b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1587b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1588b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1589b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1590b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1591fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1592b434eb95SMatthew G. Knepley       sum = y[*ridx];
1593b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1594b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1595b434eb95SMatthew G. Knepley     }
1596b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15973d3eaba7SBarry Smith     ii = a->i;
1598b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1599b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1600b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1601fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1602b434eb95SMatthew G. Knepley       sum = y[i];
1603b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1604b434eb95SMatthew G. Knepley       z[i] = sum;
1605b434eb95SMatthew G. Knepley     }
1606b434eb95SMatthew G. Knepley   }
16079566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16089566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16099566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16109566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1612b434eb95SMatthew G. Knepley }
1613b434eb95SMatthew G. Knepley 
1614c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1615d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1616d71ae5a4SJacob Faibussowitsch {
1617416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1618f15663dcSBarry Smith   PetscScalar       *y, *z;
1619f15663dcSBarry Smith   const PetscScalar *x;
16205914357eSBarry Smith   const MatScalar   *a_a;
16215914357eSBarry Smith   const PetscInt    *ii, *ridx = NULL;
16225914357eSBarry Smith   PetscInt           m        = A->rmap->n;
1623ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16249ea0dfa2SSatish Balay 
16253a40ed3dSBarry Smith   PetscFunctionBegin;
1626b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16279566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
16283ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1629b215bc84SStefano Zampini   }
16309566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16319566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16329566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16334eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
163448a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
163597952fefSHong Zhang     m    = a->compressedrow.nrows;
163697952fefSHong Zhang     ii   = a->compressedrow.i;
163797952fefSHong Zhang     ridx = a->compressedrow.rindex;
16385914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16395914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16405914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16415914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16425914357eSBarry Smith       PetscScalar        sum = y[*ridx];
1643f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
164497952fefSHong Zhang       z[*ridx++] = sum;
164597952fefSHong Zhang     }
164697952fefSHong Zhang   } else { /* do not use compressed row format */
16473d3eaba7SBarry Smith     ii = a->i;
1648f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
16495914357eSBarry Smith     fortranmultaddaij_(&m, x, ii, a->j, a_a, y, z);
1650f15663dcSBarry Smith #else
16515914357eSBarry Smith     PetscPragmaUseOMPKernels(parallel for)
16525914357eSBarry Smith     for (PetscInt i = 0; i < m; i++) {
16535914357eSBarry Smith       PetscInt           n   = ii[i + 1] - ii[i];
16545914357eSBarry Smith       const PetscInt    *aj  = a->j + ii[i];
16555914357eSBarry Smith       const PetscScalar *aa  = a_a + ii[i];
16565914357eSBarry Smith       PetscScalar        sum = y[i];
1657f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
165817ab2063SBarry Smith       z[i] = sum;
165917ab2063SBarry Smith     }
166002ab625aSSatish Balay #endif
1661f15663dcSBarry Smith   }
16629566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16639566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16649566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
166717ab2063SBarry Smith }
166817ab2063SBarry Smith 
166917ab2063SBarry Smith /*
1670*07425a8dSBarry Smith      Adds diagonal pointers to sparse matrix nonzero structure and determines if all diagonal entries are present
167117ab2063SBarry Smith */
1672d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
1673d71ae5a4SJacob Faibussowitsch {
1674416022c9SBarry Smith   Mat_SeqAIJ    *a = (Mat_SeqAIJ *)A->data;
1675*07425a8dSBarry Smith   const PetscInt m = A->rmap->n;
167617ab2063SBarry Smith 
16773a40ed3dSBarry Smith   PetscFunctionBegin;
1678*07425a8dSBarry Smith   if (a->diag && a->diagNonzeroState == A->nonzerostate) PetscFunctionReturn(PETSC_SUCCESS);
1679*07425a8dSBarry Smith   if (!a->diag) PetscCall(PetscMalloc1(m, &a->diag));
1680*07425a8dSBarry Smith   a->diagDense = PETSC_TRUE;
1681*07425a8dSBarry Smith 
1682*07425a8dSBarry Smith   for (PetscInt i = 0; i < A->rmap->n; i++) {
1683*07425a8dSBarry Smith     PetscBool found = PETSC_FALSE;
1684c0c07093SJunchao Zhang 
168509f38230SBarry Smith     a->diag[i] = a->i[i + 1];
1686*07425a8dSBarry Smith     for (PetscInt j = a->i[i]; j < a->i[i + 1]; j++) {
1687bfeeae90SHong Zhang       if (a->j[j] == i) {
168809f38230SBarry Smith         a->diag[i] = j;
1689*07425a8dSBarry Smith         found      = PETSC_TRUE;
169017ab2063SBarry Smith         break;
169117ab2063SBarry Smith       }
169217ab2063SBarry Smith     }
1693*07425a8dSBarry Smith     if (!found) a->diagDense = PETSC_FALSE;
169417ab2063SBarry Smith   }
1695*07425a8dSBarry Smith   a->diagNonzeroState = A->nonzerostate;
16963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
169717ab2063SBarry Smith }
169817ab2063SBarry Smith 
1699ba38deedSJacob Faibussowitsch static PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1700d71ae5a4SJacob Faibussowitsch {
170161ecd0c6SBarry Smith   Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
170261ecd0c6SBarry Smith   const PetscInt *diag = (const PetscInt *)a->diag;
170361ecd0c6SBarry Smith   const PetscInt *ii   = (const PetscInt *)a->i;
170461ecd0c6SBarry Smith 
170561ecd0c6SBarry Smith   PetscFunctionBegin;
170661ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
17079566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
17089566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
17093ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
171061ecd0c6SBarry Smith   }
171161ecd0c6SBarry Smith 
1712*07425a8dSBarry Smith   if (a->diagDense) {
17139566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
171461ecd0c6SBarry Smith   } else {
1715b6f2aa54SBarry Smith     PetscScalar       *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1716b6f2aa54SBarry Smith     PetscInt          *oldj = a->j, *oldi = a->i;
17179f0612e4SBarry Smith     PetscBool          free_a = a->free_a, free_ij = a->free_ij;
17186ea2a7edSJunchao Zhang     const PetscScalar *Aa;
1719*07425a8dSBarry Smith     PetscInt          *mdiag = NULL;
17206ea2a7edSJunchao Zhang 
1721*07425a8dSBarry Smith     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
1722*07425a8dSBarry Smith     for (PetscInt i = 0; i < A->rmap->n; i++) {
1723*07425a8dSBarry Smith       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
1724*07425a8dSBarry Smith         mdiag[i] = 1;
1725*07425a8dSBarry Smith       }
1726*07425a8dSBarry Smith     }
17276ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJGetArrayRead(A, &Aa)); // sync the host
17286ea2a7edSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayRead(A, &Aa));
172961ecd0c6SBarry Smith 
173061ecd0c6SBarry Smith     a->a = NULL;
173161ecd0c6SBarry Smith     a->j = NULL;
173261ecd0c6SBarry Smith     a->i = NULL;
173361ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
1734*07425a8dSBarry Smith     for (PetscInt i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17359566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
173661ecd0c6SBarry Smith 
173761ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
1738*07425a8dSBarry Smith     for (PetscInt i = 0; i < A->rmap->n; i++) {
17399566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
174048a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1741447d62f5SStefano Zampini     }
17429566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17439566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
17449f0612e4SBarry Smith     if (free_a) PetscCall(PetscShmgetDeallocateArray((void **)&olda));
17459f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldj));
17469f0612e4SBarry Smith     if (free_ij) PetscCall(PetscShmgetDeallocateArray((void **)&oldi));
17479566063dSJacob Faibussowitsch     PetscCall(PetscFree(mdiag));
1748*07425a8dSBarry Smith     PetscCall(MatMarkDiagonal_SeqAIJ(A));
1749*07425a8dSBarry Smith   }
17503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
175161ecd0c6SBarry Smith }
175261ecd0c6SBarry Smith 
1753be5855fcSBarry Smith /*
1754be5855fcSBarry Smith      Checks for missing diagonals
1755be5855fcSBarry Smith */
1756d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d)
1757d71ae5a4SJacob Faibussowitsch {
1758be5855fcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
17597734d3b5SMatthew G. Knepley   PetscInt   *diag, *ii = a->i, i;
1760be5855fcSBarry Smith 
1761be5855fcSBarry Smith   PetscFunctionBegin;
176209f38230SBarry Smith   *missing = PETSC_FALSE;
17637734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
176409f38230SBarry Smith     *missing = PETSC_TRUE;
176509f38230SBarry Smith     if (d) *d = 0;
17669566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
176709f38230SBarry Smith   } else {
176801445905SHong Zhang     PetscInt n;
176901445905SHong Zhang     n    = PetscMin(A->rmap->n, A->cmap->n);
1770f1e2ffcdSBarry Smith     diag = a->diag;
177101445905SHong Zhang     for (i = 0; i < n; i++) {
17727734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
177309f38230SBarry Smith         *missing = PETSC_TRUE;
177409f38230SBarry Smith         if (d) *d = i;
17759566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i));
1776358d2f5dSShri Abhyankar         break;
177709f38230SBarry Smith       }
1778be5855fcSBarry Smith     }
1779be5855fcSBarry Smith   }
17803ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
1781be5855fcSBarry Smith }
1782be5855fcSBarry Smith 
17830da83c2eSBarry Smith #include <petscblaslapack.h>
17840da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
17850da83c2eSBarry Smith 
17860da83c2eSBarry Smith /*
17870da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
17880da83c2eSBarry Smith */
1789ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1790d71ae5a4SJacob Faibussowitsch {
17910da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
17920da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
17930da83c2eSBarry Smith   const PetscReal shift = 0.0;
17940da83c2eSBarry Smith   PetscInt        ipvt[5];
17954e208921SJed Brown   PetscCount      flops = 0;
17960da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
17970da83c2eSBarry Smith 
17980da83c2eSBarry Smith   PetscFunctionBegin;
17990da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
18000da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
180108401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1802ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
18039566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
180448a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
18050da83c2eSBarry Smith   ncnt = 0;
18060da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
18070da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
18089566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
18090da83c2eSBarry Smith     switch (bsizes[i]) {
1810d71ae5a4SJacob Faibussowitsch     case 1:
1811d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1812d71ae5a4SJacob Faibussowitsch       break;
18130da83c2eSBarry Smith     case 2:
18149566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
18150da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18169566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
18170da83c2eSBarry Smith       break;
18180da83c2eSBarry Smith     case 3:
18199566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
18200da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18219566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
18220da83c2eSBarry Smith       break;
18230da83c2eSBarry Smith     case 4:
18249566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
18250da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18269566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
18270da83c2eSBarry Smith       break;
18280da83c2eSBarry Smith     case 5:
18299566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
18300da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18319566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
18320da83c2eSBarry Smith       break;
18330da83c2eSBarry Smith     case 6:
18349566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
18350da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18369566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
18370da83c2eSBarry Smith       break;
18380da83c2eSBarry Smith     case 7:
18399566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
18400da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18419566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
18420da83c2eSBarry Smith       break;
18430da83c2eSBarry Smith     default:
18449566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
18450da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18469566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
18470da83c2eSBarry Smith     }
18480da83c2eSBarry Smith     ncnt += bsizes[i];
18490da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
1850baa50dc0SBrad Aagaard     flops += 2 * PetscPowInt64(bsizes[i], 3) / 3;
18510da83c2eSBarry Smith   }
18523ba16761SJacob Faibussowitsch   PetscCall(PetscLogFlops(flops));
185348a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18549566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18553ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
18560da83c2eSBarry Smith }
18570da83c2eSBarry Smith 
1858422a814eSBarry Smith /*
1859422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1860422a814eSBarry Smith */
1861*07425a8dSBarry Smith static PetscErrorCode MatInvertDiagonalForSOR_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1862d71ae5a4SJacob Faibussowitsch {
186371f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1864d0f46423SBarry Smith   PetscInt         i, *diag, m = A->rmap->n;
18652e5835c6SStefano Zampini   const MatScalar *v;
186654f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
186771f1c65dSBarry Smith 
186871f1c65dSBarry Smith   PetscFunctionBegin;
1869*07425a8dSBarry Smith   if (a->idiagState == ((PetscObject)A)->state && a->omega == omega && a->fshift == fshift) PetscFunctionReturn(PETSC_SUCCESS);
18709566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
1871*07425a8dSBarry Smith   PetscCheck(a->diagDense, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix must have all diagonal location to invert them");
187271f1c65dSBarry Smith   diag = a->diag;
18733a7d0413SPierre Jolivet   if (!a->idiag) PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work));
18742e5835c6SStefano Zampini 
187571f1c65dSBarry Smith   mdiag = a->mdiag;
187671f1c65dSBarry Smith   idiag = a->idiag;
18779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1878422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
187971f1c65dSBarry Smith     for (i = 0; i < m; i++) {
188071f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1881899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1882966bd95aSPierre Jolivet         PetscCheck(PetscRealPart(fshift), PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
18839566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
18847b6c816cSBarry Smith         A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18857b6c816cSBarry Smith         A->factorerror_zeropivot_value = 0.0;
18867b6c816cSBarry Smith         A->factorerror_zeropivot_row   = i;
1887899639b0SHong Zhang       }
188871f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
188971f1c65dSBarry Smith     }
18909566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
189171f1c65dSBarry Smith   } else {
189271f1c65dSBarry Smith     for (i = 0; i < m; i++) {
189371f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
189471f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
189571f1c65dSBarry Smith     }
18969566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
189771f1c65dSBarry Smith   }
18989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
1899*07425a8dSBarry Smith   a->idiagState = ((PetscObject)A)->state;
1900*07425a8dSBarry Smith   a->omega      = omega;
1901*07425a8dSBarry Smith   a->fshift     = fshift;
19023ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
190371f1c65dSBarry Smith }
190471f1c65dSBarry Smith 
1905d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1906d71ae5a4SJacob Faibussowitsch {
1907416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1908e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
19092e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
191054f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
19113d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
191297f1f81fSBarry Smith   const PetscInt    *idx, *diag;
191317ab2063SBarry Smith 
19143a40ed3dSBarry Smith   PetscFunctionBegin;
1915b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
19169566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
19173ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
1918b215bc84SStefano Zampini   }
1919b965ef7fSBarry Smith   its = its * lits;
1920*07425a8dSBarry Smith   PetscCall(MatInvertDiagonalForSOR_SeqAIJ(A, omega, fshift));
192171f1c65dSBarry Smith   diag  = a->diag;
192271f1c65dSBarry Smith   t     = a->ssor_work;
1923ed480e8bSBarry Smith   idiag = a->idiag;
192471f1c65dSBarry Smith   mdiag = a->mdiag;
1925ed480e8bSBarry Smith 
19269566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
19279566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
19289566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1929ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
193017ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
193117ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1932ed480e8bSBarry Smith     bs = b;
193317ab2063SBarry Smith     for (i = 0; i < m; i++) {
193471f1c65dSBarry Smith       d   = fshift + mdiag[i];
1935416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1936ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19372e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
193817ab2063SBarry Smith       sum = b[i] * d / omega;
1939003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
194017ab2063SBarry Smith       x[i] = sum;
194117ab2063SBarry Smith     }
19429566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19439566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19449566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
19459566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
19463ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
194717ab2063SBarry Smith   }
1948c783ea89SBarry Smith 
194908401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1950f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19514c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1952887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
195317ab2063SBarry Smith 
195417ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
195517ab2063SBarry Smith 
1956887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
195717ab2063SBarry Smith     */
195817ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
195917ab2063SBarry Smith 
196017ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
196117ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1962416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1963ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19642e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
196517ab2063SBarry Smith       sum = b[i];
1966e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1967ed480e8bSBarry Smith       x[i] = sum * idiag[i];
196817ab2063SBarry Smith     }
196917ab2063SBarry Smith 
197017ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19712e5835c6SStefano Zampini     v = aa;
19722205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
197317ab2063SBarry Smith 
197417ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1975ed480e8bSBarry Smith     ts   = t;
1976416022c9SBarry Smith     diag = a->diag;
197717ab2063SBarry Smith     for (i = 0; i < m; i++) {
1978416022c9SBarry Smith       n   = diag[i] - a->i[i];
1979ed480e8bSBarry Smith       idx = a->j + a->i[i];
19802e5835c6SStefano Zampini       v   = aa + a->i[i];
198117ab2063SBarry Smith       sum = t[i];
1982003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
1983ed480e8bSBarry Smith       t[i] = sum * idiag[i];
1984733d66baSBarry Smith       /*  x = x + t */
1985733d66baSBarry Smith       x[i] += t[i];
198617ab2063SBarry Smith     }
198717ab2063SBarry Smith 
19889566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
19899566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19909566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19913ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
199217ab2063SBarry Smith   }
199317ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
199417ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
199517ab2063SBarry Smith       for (i = 0; i < m; i++) {
1996416022c9SBarry Smith         n   = diag[i] - a->i[i];
1997ed480e8bSBarry Smith         idx = a->j + a->i[i];
19982e5835c6SStefano Zampini         v   = aa + a->i[i];
199917ab2063SBarry Smith         sum = b[i];
2000e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20015c99c7daSBarry Smith         t[i] = sum;
2002ed480e8bSBarry Smith         x[i] = sum * idiag[i];
200317ab2063SBarry Smith       }
20045c99c7daSBarry Smith       xb = t;
20059566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
20063a40ed3dSBarry Smith     } else xb = b;
200717ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
200817ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2009416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
2010ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
20112e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
201217ab2063SBarry Smith         sum = xb[i];
2013e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20145c99c7daSBarry Smith         if (xb == b) {
2015ed480e8bSBarry Smith           x[i] = sum * idiag[i];
20165c99c7daSBarry Smith         } else {
2017b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
201817ab2063SBarry Smith         }
20195c99c7daSBarry Smith       }
20209566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
202117ab2063SBarry Smith     }
202217ab2063SBarry Smith     its--;
202317ab2063SBarry Smith   }
202417ab2063SBarry Smith   while (its--) {
202517ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
202617ab2063SBarry Smith       for (i = 0; i < m; i++) {
2027b19a5dc2SMark Adams         /* lower */
2028b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
2029ed480e8bSBarry Smith         idx = a->j + a->i[i];
20302e5835c6SStefano Zampini         v   = aa + a->i[i];
203117ab2063SBarry Smith         sum = b[i];
2032e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2033b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
2034b19a5dc2SMark Adams         /* upper */
2035b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
2036b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
20372e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
2038b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2039b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
204017ab2063SBarry Smith       }
2041b19a5dc2SMark Adams       xb = t;
20429566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
2043b19a5dc2SMark Adams     } else xb = b;
204417ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
204517ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2046b19a5dc2SMark Adams         sum = xb[i];
2047b19a5dc2SMark Adams         if (xb == b) {
2048b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
2049416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
2050ed480e8bSBarry Smith           idx = a->j + a->i[i];
20512e5835c6SStefano Zampini           v   = aa + a->i[i];
2052e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2053ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2054b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2055b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2056b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20572e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2058b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2059b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
206017ab2063SBarry Smith         }
2061b19a5dc2SMark Adams       }
2062b19a5dc2SMark Adams       if (xb == b) {
20639566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2064b19a5dc2SMark Adams       } else {
20659566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2066b19a5dc2SMark Adams       }
206717ab2063SBarry Smith     }
206817ab2063SBarry Smith   }
20699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20709566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20719566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
20723ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
207317ab2063SBarry Smith }
207417ab2063SBarry Smith 
2075ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2076d71ae5a4SJacob Faibussowitsch {
2077416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
20784e220ebcSLois Curfman McInnes 
20793a40ed3dSBarry Smith   PetscFunctionBegin;
20804e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
20813966268fSBarry Smith   info->nz_allocated = a->maxnz;
20823966268fSBarry Smith   info->nz_used      = a->nz;
20833966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
20843966268fSBarry Smith   info->assemblies   = A->num_ass;
20853966268fSBarry Smith   info->mallocs      = A->info.mallocs;
20864dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2087d5f3da31SBarry Smith   if (A->factortype) {
20884e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
20894e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
20904e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
20914e220ebcSLois Curfman McInnes   } else {
20924e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
20934e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
20944e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
20954e220ebcSLois Curfman McInnes   }
20963ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
209717ab2063SBarry Smith }
209817ab2063SBarry Smith 
2099ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2100d71ae5a4SJacob Faibussowitsch {
2101416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2102c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
210397b48c8fSBarry Smith   const PetscScalar *xx;
21042e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2105c7da8527SEric Chamberland   PetscInt           d = 0;
210617ab2063SBarry Smith 
21073a40ed3dSBarry Smith   PetscFunctionBegin;
210897b48c8fSBarry Smith   if (x && b) {
21099566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21109566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
211197b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2112aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2113447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
211497b48c8fSBarry Smith       bb[rows[i]] = diag * xx[rows[i]];
211597b48c8fSBarry Smith     }
21169566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21179566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
211897b48c8fSBarry Smith   }
211997b48c8fSBarry Smith 
21209566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2121a9817697SBarry Smith   if (a->keepnonzeropattern) {
2122f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2123aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21249566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2125f1e2ffcdSBarry Smith     }
2126f4df32b1SMatthew Knepley     if (diag != 0.0) {
2127c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2128c7da8527SEric Chamberland         d = rows[i];
2129447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
213008401ef6SPierre Jolivet         PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
2131c7da8527SEric Chamberland       }
2132f1e2ffcdSBarry Smith       for (i = 0; i < N; i++) {
2133447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
21342e5835c6SStefano Zampini         aa[a->diag[rows[i]]] = diag;
2135f1e2ffcdSBarry Smith       }
2136f1e2ffcdSBarry Smith     }
2137f1e2ffcdSBarry Smith   } else {
2138f4df32b1SMatthew Knepley     if (diag != 0.0) {
213917ab2063SBarry Smith       for (i = 0; i < N; i++) {
2140aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21417ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2142447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2143447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2144447d62f5SStefano Zampini           } else {
2145416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
21462e5835c6SStefano Zampini             aa[a->i[rows[i]]]   = diag;
2147bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2148447d62f5SStefano Zampini           }
2149447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
21509566063dSJacob Faibussowitsch           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
215117ab2063SBarry Smith         }
215217ab2063SBarry Smith       }
21533a40ed3dSBarry Smith     } else {
215417ab2063SBarry Smith       for (i = 0; i < N; i++) {
2155aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2156416022c9SBarry Smith         a->ilen[rows[i]] = 0;
215717ab2063SBarry Smith       }
215817ab2063SBarry Smith     }
2159e56f5c9eSBarry Smith     A->nonzerostate++;
2160f1e2ffcdSBarry Smith   }
21619566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2162dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21633ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
216417ab2063SBarry Smith }
216517ab2063SBarry Smith 
2166ba38deedSJacob Faibussowitsch static PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2167d71ae5a4SJacob Faibussowitsch {
21686e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21696e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
21702b40b63fSBarry Smith   PetscBool          missing, *zeroed, vecs = PETSC_FALSE;
21716e169961SBarry Smith   const PetscScalar *xx;
21722e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
21736e169961SBarry Smith 
21746e169961SBarry Smith   PetscFunctionBegin;
21753ba16761SJacob Faibussowitsch   if (!N) PetscFunctionReturn(PETSC_SUCCESS);
21769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
21776e169961SBarry Smith   if (x && b) {
21789566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21799566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
21802b40b63fSBarry Smith     vecs = PETSC_TRUE;
21816e169961SBarry Smith   }
21829566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
21836e169961SBarry Smith   for (i = 0; i < N; i++) {
2184aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21858e3a54c0SPierre Jolivet     PetscCall(PetscArrayzero(PetscSafePointerPlusOffset(aa, a->i[rows[i]]), a->ilen[rows[i]]));
21862205254eSKarl Rupp 
21876e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
21886e169961SBarry Smith   }
21896e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
21906e169961SBarry Smith     if (!zeroed[i]) {
21916e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
21924cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
21932e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
21942e5835c6SStefano Zampini           aa[j] = 0.0;
21956e169961SBarry Smith         }
21966e169961SBarry Smith       }
21974cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i];
21986e169961SBarry Smith   }
21996e169961SBarry Smith   if (x && b) {
22009566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
22019566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
22026e169961SBarry Smith   }
22039566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
22046e169961SBarry Smith   if (diag != 0.0) {
22059566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d));
22061d5a398dSstefano_zampini     if (missing) {
22071d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
22084cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2209aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
22109566063dSJacob Faibussowitsch         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
22111d5a398dSstefano_zampini       }
22121d5a398dSstefano_zampini     } else {
2213ad540459SPierre Jolivet       for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag;
22146e169961SBarry Smith     }
22151d5a398dSstefano_zampini   }
22169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2217dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
22183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
22196e169961SBarry Smith }
22206e169961SBarry Smith 
2221d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2222d71ae5a4SJacob Faibussowitsch {
2223fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2224fff043a9SJunchao Zhang   const PetscScalar *aa;
222517ab2063SBarry Smith 
22263a40ed3dSBarry Smith   PetscFunctionBegin;
22279566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2228416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
22298e3a54c0SPierre Jolivet   if (v) *v = PetscSafePointerPlusOffset((PetscScalar *)aa, a->i[row]);
223017ab2063SBarry Smith   if (idx) {
22315c0db29aSPierre Jolivet     if (*nz && a->j) *idx = a->j + a->i[row];
2232f4259b30SLisandro Dalcin     else *idx = NULL;
223317ab2063SBarry Smith   }
22349566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
22353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
223617ab2063SBarry Smith }
223717ab2063SBarry Smith 
2238d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2239d71ae5a4SJacob Faibussowitsch {
22403a40ed3dSBarry Smith   PetscFunctionBegin;
22413ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
224217ab2063SBarry Smith }
224317ab2063SBarry Smith 
2244ba38deedSJacob Faibussowitsch static PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2245d71ae5a4SJacob Faibussowitsch {
2246416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
22472e5835c6SStefano Zampini   const MatScalar *v;
224836db0b34SBarry Smith   PetscReal        sum = 0.0;
224997f1f81fSBarry Smith   PetscInt         i, j;
225017ab2063SBarry Smith 
22513a40ed3dSBarry Smith   PetscFunctionBegin;
22529566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
225317ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2254570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2255570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2256792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2257570b7f6dSBarry Smith #else
2258416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22599371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22609371c9d4SSatish Balay       v++;
226117ab2063SBarry Smith     }
22628f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2263570b7f6dSBarry Smith #endif
22649566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22653a40ed3dSBarry Smith   } else if (type == NORM_1) {
226636db0b34SBarry Smith     PetscReal *tmp;
226797f1f81fSBarry Smith     PetscInt  *jj = a->j;
22689566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp));
2269064f8208SBarry Smith     *nrm = 0.0;
2270416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22719371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22729371c9d4SSatish Balay       v++;
227317ab2063SBarry Smith     }
2274d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2275064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
227617ab2063SBarry Smith     }
22779566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
22789566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
22793a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2280064f8208SBarry Smith     *nrm = 0.0;
2281d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
22828e3a54c0SPierre Jolivet       const PetscScalar *v2 = PetscSafePointerPlusOffset(v, a->i[j]);
228317ab2063SBarry Smith       sum                   = 0.0;
2284416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
22859371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
22869371c9d4SSatish Balay         v2++;
228717ab2063SBarry Smith       }
2288064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
228917ab2063SBarry Smith     }
22909566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
2291f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
22929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
22933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
229417ab2063SBarry Smith }
229517ab2063SBarry Smith 
2296ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2297d71ae5a4SJacob Faibussowitsch {
22983d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
229954f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
23002e5835c6SStefano Zampini   const MatScalar *va, *vb;
230197f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2302cd0d46ebSvictorle 
2303cd0d46ebSvictorle   PetscFunctionBegin;
23049566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23059566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23065485867bSBarry Smith   if (ma != nb || na != mb) {
23075485867bSBarry Smith     *f = PETSC_FALSE;
23083ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23095485867bSBarry Smith   }
23109566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
23119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
23129371c9d4SSatish Balay   aii = aij->i;
23139371c9d4SSatish Balay   bii = bij->i;
23149371c9d4SSatish Balay   adx = aij->j;
23159371c9d4SSatish Balay   bdx = bij->j;
23169566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23179566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2318cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2319cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2320cd0d46ebSvictorle 
2321cd0d46ebSvictorle   *f = PETSC_TRUE;
2322cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2323cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
232497f1f81fSBarry Smith       PetscInt    idc, idr;
23255485867bSBarry Smith       PetscScalar vc, vr;
2326cd0d46ebSvictorle       /* column/row index/value */
23275485867bSBarry Smith       idc = adx[aptr[i]];
23285485867bSBarry Smith       idr = bdx[bptr[idc]];
23295485867bSBarry Smith       vc  = va[aptr[i]];
23305485867bSBarry Smith       vr  = vb[bptr[idc]];
23315485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
23325485867bSBarry Smith         *f = PETSC_FALSE;
23335485867bSBarry Smith         goto done;
2334cd0d46ebSvictorle       } else {
23355485867bSBarry Smith         aptr[i]++;
23365485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2337cd0d46ebSvictorle       }
2338cd0d46ebSvictorle     }
2339cd0d46ebSvictorle   }
2340cd0d46ebSvictorle done:
23419566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23429566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
23449566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
23453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2346cd0d46ebSvictorle }
2347cd0d46ebSvictorle 
2348ba38deedSJacob Faibussowitsch static PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2349d71ae5a4SJacob Faibussowitsch {
23503d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
235154f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
235254f21887SBarry Smith   MatScalar  *va, *vb;
23531cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23541cbb95d3SBarry Smith 
23551cbb95d3SBarry Smith   PetscFunctionBegin;
23569566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23579566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23581cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23591cbb95d3SBarry Smith     *f = PETSC_FALSE;
23603ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
23611cbb95d3SBarry Smith   }
23629371c9d4SSatish Balay   aii = aij->i;
23639371c9d4SSatish Balay   bii = bij->i;
23649371c9d4SSatish Balay   adx = aij->j;
23659371c9d4SSatish Balay   bdx = bij->j;
23669371c9d4SSatish Balay   va  = aij->a;
23679371c9d4SSatish Balay   vb  = bij->a;
23689566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23699566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23701cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23711cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23721cbb95d3SBarry Smith 
23731cbb95d3SBarry Smith   *f = PETSC_TRUE;
23741cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
23751cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
23761cbb95d3SBarry Smith       PetscInt    idc, idr;
23771cbb95d3SBarry Smith       PetscScalar vc, vr;
23781cbb95d3SBarry Smith       /* column/row index/value */
23791cbb95d3SBarry Smith       idc = adx[aptr[i]];
23801cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
23811cbb95d3SBarry Smith       vc  = va[aptr[i]];
23821cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
23831cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
23841cbb95d3SBarry Smith         *f = PETSC_FALSE;
23851cbb95d3SBarry Smith         goto done;
23861cbb95d3SBarry Smith       } else {
23871cbb95d3SBarry Smith         aptr[i]++;
23881cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
23891cbb95d3SBarry Smith       }
23901cbb95d3SBarry Smith     }
23911cbb95d3SBarry Smith   }
23921cbb95d3SBarry Smith done:
23939566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23949566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23953ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
23961cbb95d3SBarry Smith }
23971cbb95d3SBarry Smith 
2398d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2399d71ae5a4SJacob Faibussowitsch {
2400416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2401fff8e43fSBarry Smith   const PetscScalar *l, *r;
2402fff8e43fSBarry Smith   PetscScalar        x;
240354f21887SBarry Smith   MatScalar         *v;
2404fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2405fff8e43fSBarry Smith   const PetscInt    *jj;
240617ab2063SBarry Smith 
24073a40ed3dSBarry Smith   PetscFunctionBegin;
240817ab2063SBarry Smith   if (ll) {
24093ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
24103ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
24119566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
241208401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
24139566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
24149566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
241517ab2063SBarry Smith     for (i = 0; i < m; i++) {
241617ab2063SBarry Smith       x = l[i];
2417416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
24182205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
241917ab2063SBarry Smith     }
24209566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
24219566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
24229566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
242317ab2063SBarry Smith   }
242417ab2063SBarry Smith   if (rr) {
24259566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
242608401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
24279566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
24289566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
24292e5835c6SStefano Zampini     jj = a->j;
24302205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
24319566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
24329566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
24339566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
243417ab2063SBarry Smith   }
24353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
243617ab2063SBarry Smith }
243717ab2063SBarry Smith 
2438d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2439d71ae5a4SJacob Faibussowitsch {
2440db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2441d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
244297f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
24435d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
24442e5835c6SStefano Zampini   const PetscScalar *aa;
24455d0c19d7SBarry Smith   PetscInt           nrows, ncols;
244697f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
2447fb3c7e2dSJunchao Zhang   MatScalar         *a_new, *mat_a, *c_a;
2448416022c9SBarry Smith   Mat                C;
2449cdc6f3adSToby Isaac   PetscBool          stride;
245017ab2063SBarry Smith 
24513a40ed3dSBarry Smith   PetscFunctionBegin;
24529566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24539566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24549566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
245517ab2063SBarry Smith 
24569566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2457ff718158SBarry Smith   if (stride) {
24589566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2459ff718158SBarry Smith   } else {
2460ff718158SBarry Smith     first = 0;
2461ff718158SBarry Smith     step  = 0;
2462ff718158SBarry Smith   }
2463fee21e36SBarry Smith   if (stride && step == 1) {
246402834360SBarry Smith     /* special case of contiguous rows */
24659566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
246602834360SBarry Smith     /* loop over new rows determining lens and starting points */
246702834360SBarry Smith     for (i = 0; i < nrows; i++) {
2468bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2469a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2470a91a9bebSLisandro Dalcin       starts[i] = kstart;
247102834360SBarry Smith       for (k = kstart; k < kend; k++) {
2472bfeeae90SHong Zhang         if (aj[k] >= first) {
247302834360SBarry Smith           starts[i] = k;
247402834360SBarry Smith           break;
247502834360SBarry Smith         }
247602834360SBarry Smith       }
2477a2744918SBarry Smith       sum = 0;
247802834360SBarry Smith       while (k < kend) {
2479bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2480a2744918SBarry Smith         sum++;
248102834360SBarry Smith       }
2482a2744918SBarry Smith       lens[i] = sum;
248302834360SBarry Smith     }
248402834360SBarry Smith     /* create submatrix */
2485cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
248697f1f81fSBarry Smith       PetscInt n_cols, n_rows;
24879566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2488aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
24899566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
249008480c60SBarry Smith       C = *B;
24913a40ed3dSBarry Smith     } else {
24923bef6203SJed Brown       PetscInt rbs, cbs;
24939566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
24949566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
24959566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
24969566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
24979566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
24989566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
24999566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
250008480c60SBarry Smith     }
2501db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2502db02288aSLois Curfman McInnes 
250302834360SBarry Smith     /* loop over rows inserting into submatrix */
2504fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &a_new)); // Not 'a_new = c->a-new', since that raw usage ignores offload state of C
2505db02288aSLois Curfman McInnes     j_new = c->j;
2506db02288aSLois Curfman McInnes     i_new = c->i;
25079566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
250802834360SBarry Smith     for (i = 0; i < nrows; i++) {
2509a2744918SBarry Smith       ii    = starts[i];
2510a2744918SBarry Smith       lensi = lens[i];
2511810441c8SPierre Jolivet       if (lensi) {
2512ad540459SPierre Jolivet         for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
25139566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2514a2744918SBarry Smith         a_new += lensi;
2515810441c8SPierre Jolivet       }
2516a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2517a2744918SBarry Smith       c->ilen[i]   = lensi;
251802834360SBarry Smith     }
2519fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &a_new)); // Set C's offload state properly
25209566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
25219566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
25223a40ed3dSBarry Smith   } else {
25239566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
25249566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
25259566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
25264dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
25276bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
25284dcab191SBarry Smith       smap[icol[i]] = i + 1;
25294dcab191SBarry Smith     }
25304dcab191SBarry Smith 
253102834360SBarry Smith     /* determine lens of each row */
253202834360SBarry Smith     for (i = 0; i < nrows; i++) {
2533bfeeae90SHong Zhang       kstart  = ai[irow[i]];
253402834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
253502834360SBarry Smith       lens[i] = 0;
253602834360SBarry Smith       for (k = kstart; k < kend; k++) {
2537ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
253802834360SBarry Smith       }
253902834360SBarry Smith     }
254017ab2063SBarry Smith     /* Create and fill new matrix */
2541a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2542ace3abfcSBarry Smith       PetscBool equal;
25430f5bd95cSBarry Smith 
254499141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2545aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
25469566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
2547fdfbdca6SPierre Jolivet       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong number of nonzeros");
25489566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
254908480c60SBarry Smith       C = *B;
25503a40ed3dSBarry Smith     } else {
25513bef6203SJed Brown       PetscInt rbs, cbs;
25529566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25539566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25549566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25559566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
255637a5e0faSPierre Jolivet       if (rbs > 1 || cbs > 1) PetscCall(MatSetBlockSizes(C, rbs, cbs));
25579566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25589566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
255908480c60SBarry Smith     }
25609566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2561fb3c7e2dSJunchao Zhang 
2562f4f49eeaSPierre Jolivet     c = (Mat_SeqAIJ *)C->data;
2563fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(C, &c_a)); // Not 'c->a', since that raw usage ignores offload state of C
256417ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
256599141d43SSatish Balay       row      = irow[i];
2566bfeeae90SHong Zhang       kstart   = ai[row];
256799141d43SSatish Balay       kend     = kstart + a->ilen[row];
2568bfeeae90SHong Zhang       mat_i    = c->i[i];
25698e3a54c0SPierre Jolivet       mat_j    = PetscSafePointerPlusOffset(c->j, mat_i);
25708e3a54c0SPierre Jolivet       mat_a    = PetscSafePointerPlusOffset(c_a, mat_i);
257199141d43SSatish Balay       mat_ilen = c->ilen + i;
257217ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2573bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2574ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
25752e5835c6SStefano Zampini           *mat_a++ = aa[k];
257699141d43SSatish Balay           (*mat_ilen)++;
257717ab2063SBarry Smith         }
257817ab2063SBarry Smith       }
257917ab2063SBarry Smith     }
25809566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
258102834360SBarry Smith     /* Free work space */
25829566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
25839566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
25849566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2585cdc6f3adSToby Isaac     /* sort */
2586cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2587cdc6f3adSToby Isaac       PetscInt ilen;
2588cdc6f3adSToby Isaac 
2589cdc6f3adSToby Isaac       mat_i = c->i[i];
25908e3a54c0SPierre Jolivet       mat_j = PetscSafePointerPlusOffset(c->j, mat_i);
25918e3a54c0SPierre Jolivet       mat_a = PetscSafePointerPlusOffset(c_a, mat_i);
2592cdc6f3adSToby Isaac       ilen  = c->ilen[i];
25939566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2594cdc6f3adSToby Isaac     }
2595fb3c7e2dSJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(C, &c_a));
259602834360SBarry Smith   }
25978c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
25989566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2599305c6ccfSStefano Zampini #endif
26009566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
26019566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
260217ab2063SBarry Smith 
26039566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2604416022c9SBarry Smith   *B = C;
26053ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
260617ab2063SBarry Smith }
260717ab2063SBarry Smith 
2608ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2609d71ae5a4SJacob Faibussowitsch {
261082d44351SHong Zhang   Mat B;
261182d44351SHong Zhang 
261282d44351SHong Zhang   PetscFunctionBegin;
2613c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
26149566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
26159566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
26169566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
26179566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
26189566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
261982d44351SHong Zhang     *subMat = B;
2620c2d650bdSHong Zhang   } else {
26219566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2622c2d650bdSHong Zhang   }
26233ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
262482d44351SHong Zhang }
262582d44351SHong Zhang 
2626ba38deedSJacob Faibussowitsch static PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2627d71ae5a4SJacob Faibussowitsch {
262863b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
262963b91edcSBarry Smith   Mat         outA;
2630ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
263163b91edcSBarry Smith 
26323a40ed3dSBarry Smith   PetscFunctionBegin;
263308401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
26341df811f5SHong Zhang 
26359566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
26369566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2637a871dcd8SBarry Smith 
263863b91edcSBarry Smith   outA             = inA;
2639d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26409566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
26419566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
26422205254eSKarl Rupp 
26439566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
26449566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
26452205254eSKarl Rupp 
2646c3122656SLisandro Dalcin   a->row = row;
26472205254eSKarl Rupp 
26489566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
26499566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
26502205254eSKarl Rupp 
2651c3122656SLisandro Dalcin   a->col = col;
265263b91edcSBarry Smith 
265336db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26549566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26559566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2656f0ec6fceSSatish Balay 
265794a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
265884648c2dSPierre Jolivet     PetscCall(PetscMalloc1(inA->rmap->n, &a->solve_work));
265994a9d846SBarry Smith   }
266063b91edcSBarry Smith 
26619566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(inA));
2662137fb511SHong Zhang   if (row_identity && col_identity) {
26639566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2664137fb511SHong Zhang   } else {
26659566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2666137fb511SHong Zhang   }
26673ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2668a871dcd8SBarry Smith }
2669a871dcd8SBarry Smith 
2670d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2671d71ae5a4SJacob Faibussowitsch {
2672f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2673dfa0f9e5SStefano Zampini   PetscScalar *v;
2674c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
26753a40ed3dSBarry Smith 
26763a40ed3dSBarry Smith   PetscFunctionBegin;
26779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
26789566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2679792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
26809566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
26819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
26823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2683f0b747eeSBarry Smith }
2684f0b747eeSBarry Smith 
2685d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2686d71ae5a4SJacob Faibussowitsch {
268716b64355SHong Zhang   PetscInt i;
268816b64355SHong Zhang 
268916b64355SHong Zhang   PetscFunctionBegin;
269016b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
26919566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
269216b64355SHong Zhang 
269348a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
26949566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
269516b64355SHong Zhang 
269616b64355SHong Zhang     if (submatj->rbuf1) {
26979566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
26989566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
269916b64355SHong Zhang     }
270016b64355SHong Zhang 
270148a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
27029566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
27039566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
270416b64355SHong Zhang   }
270516b64355SHong Zhang 
270616b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2707eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&submatj->rmap));
27089566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
27099566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
271016b64355SHong Zhang #else
27119566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
271216b64355SHong Zhang #endif
271316b64355SHong Zhang 
271416b64355SHong Zhang   if (!submatj->allcolumns) {
271516b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
2716835f2295SStefano Zampini     PetscCall(PetscHMapIDestroy(&submatj->cmap));
271716b64355SHong Zhang #else
27189566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
271916b64355SHong Zhang #endif
272016b64355SHong Zhang   }
27219566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
272216b64355SHong Zhang 
27239566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
27243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
272516b64355SHong Zhang }
272616b64355SHong Zhang 
2727d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2728d71ae5a4SJacob Faibussowitsch {
272916b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
27305c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
273116b64355SHong Zhang 
273216b64355SHong Zhang   PetscFunctionBegin;
27339566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
27349566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
27353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
273616b64355SHong Zhang }
273716b64355SHong Zhang 
273889a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
2739ba38deedSJacob Faibussowitsch static PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2740d71ae5a4SJacob Faibussowitsch {
27412d033e1fSHong Zhang   PetscInt     i;
27420fb991dcSHong Zhang   Mat          C;
27430fb991dcSHong Zhang   Mat_SeqAIJ  *c;
27440fb991dcSHong Zhang   Mat_SubSppt *submatj;
27452d033e1fSHong Zhang 
27462d033e1fSHong Zhang   PetscFunctionBegin;
27472d033e1fSHong Zhang   for (i = 0; i < n; i++) {
27480fb991dcSHong Zhang     C       = (*mat)[i];
27490fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
27500fb991dcSHong Zhang     submatj = c->submatis1;
27512d033e1fSHong Zhang     if (submatj) {
2752682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
275326cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27549566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27559566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27569566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27573faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27589566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27599566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27609566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2761682e4c99SStefano Zampini       }
27622d033e1fSHong Zhang     } else {
27639566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
27642d033e1fSHong Zhang     }
27652d033e1fSHong Zhang   }
276686e85357SHong Zhang 
276763a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
27689566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
276963a75b2aSHong Zhang 
27709566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
27713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
27722d033e1fSHong Zhang }
27732d033e1fSHong Zhang 
2774ba38deedSJacob Faibussowitsch static PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2775d71ae5a4SJacob Faibussowitsch {
277697f1f81fSBarry Smith   PetscInt i;
2777cddf8d76SBarry Smith 
27783a40ed3dSBarry Smith   PetscFunctionBegin;
277948a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2780cddf8d76SBarry Smith 
278148a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
27823ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2783cddf8d76SBarry Smith }
2784cddf8d76SBarry Smith 
2785ba38deedSJacob Faibussowitsch static PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2786d71ae5a4SJacob Faibussowitsch {
2787e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
27889a88ca10SBarry Smith   PetscInt        row, i, j, k, l, ll, m, n, *nidx, isz, val;
27895d0c19d7SBarry Smith   const PetscInt *idx;
279058b7e2c1SStefano Zampini   PetscInt        start, end, *ai, *aj, bs = A->rmap->bs == A->cmap->bs ? A->rmap->bs : 1;
2791f1af5d2fSBarry Smith   PetscBT         table;
2792bbd702dbSSatish Balay 
27933a40ed3dSBarry Smith   PetscFunctionBegin;
27949a88ca10SBarry Smith   m  = A->rmap->n / bs;
2795e4d965acSSatish Balay   ai = a->i;
2796bfeeae90SHong Zhang   aj = a->j;
27978a047759SSatish Balay 
279808401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
279906763907SSatish Balay 
28009566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
28019566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
280206763907SSatish Balay 
2803e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2804b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2805e4d965acSSatish Balay     isz = 0;
28069566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2807e4d965acSSatish Balay 
2808e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28099566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
28109566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2811e4d965acSSatish Balay 
28129a88ca10SBarry Smith     if (bs > 1) {
28139a88ca10SBarry Smith       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
28149a88ca10SBarry Smith       for (j = 0; j < n; ++j) {
28159a88ca10SBarry Smith         if (!PetscBTLookupSet(table, idx[j] / bs)) nidx[isz++] = idx[j] / bs;
28169a88ca10SBarry Smith       }
28179a88ca10SBarry Smith       PetscCall(ISRestoreIndices(is[i], &idx));
28189a88ca10SBarry Smith       PetscCall(ISDestroy(&is[i]));
28199a88ca10SBarry Smith 
28209a88ca10SBarry Smith       k = 0;
28219a88ca10SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
28229a88ca10SBarry Smith         n = isz;
28239a88ca10SBarry Smith         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
28249a88ca10SBarry Smith           for (ll = 0; ll < bs; ll++) {
28259a88ca10SBarry Smith             row   = bs * nidx[k] + ll;
28269a88ca10SBarry Smith             start = ai[row];
28279a88ca10SBarry Smith             end   = ai[row + 1];
28289a88ca10SBarry Smith             for (l = start; l < end; l++) {
28299a88ca10SBarry Smith               val = aj[l] / bs;
28309a88ca10SBarry Smith               if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
28319a88ca10SBarry Smith             }
28329a88ca10SBarry Smith           }
28339a88ca10SBarry Smith         }
28349a88ca10SBarry Smith       }
283557508eceSPierre Jolivet       PetscCall(ISCreateBlock(PETSC_COMM_SELF, bs, isz, nidx, PETSC_COPY_VALUES, is + i));
28369a88ca10SBarry Smith     } else {
2837dd097bc3SLois Curfman McInnes       /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2838e4d965acSSatish Balay       for (j = 0; j < n; ++j) {
28392205254eSKarl Rupp         if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
28404dcbc457SBarry Smith       }
28419566063dSJacob Faibussowitsch       PetscCall(ISRestoreIndices(is[i], &idx));
28429566063dSJacob Faibussowitsch       PetscCall(ISDestroy(&is[i]));
2843e4d965acSSatish Balay 
284404a348a9SBarry Smith       k = 0;
284504a348a9SBarry Smith       for (j = 0; j < ov; j++) { /* for each overlap */
284604a348a9SBarry Smith         n = isz;
284706763907SSatish Balay         for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2848e4d965acSSatish Balay           row   = nidx[k];
2849e4d965acSSatish Balay           start = ai[row];
2850e4d965acSSatish Balay           end   = ai[row + 1];
285104a348a9SBarry Smith           for (l = start; l < end; l++) {
2852efb16452SHong Zhang             val = aj[l];
28532205254eSKarl Rupp             if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2854e4d965acSSatish Balay           }
2855e4d965acSSatish Balay         }
2856e4d965acSSatish Balay       }
285757508eceSPierre Jolivet       PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, is + i));
2858e4d965acSSatish Balay     }
28599a88ca10SBarry Smith   }
28609566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
28619566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
28623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
28634dcbc457SBarry Smith }
286417ab2063SBarry Smith 
2865ba38deedSJacob Faibussowitsch static PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2866d71ae5a4SJacob Faibussowitsch {
28670513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28683b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
28695d0c19d7SBarry Smith   const PetscInt *row, *col;
28705d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
287156cd22aeSBarry Smith   IS              icolp, irowp;
28720298fd71SBarry Smith   PetscInt       *cwork = NULL;
28730298fd71SBarry Smith   PetscScalar    *vwork = NULL;
28740513a670SBarry Smith 
28753a40ed3dSBarry Smith   PetscFunctionBegin;
28769566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
28779566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
28789566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
28799566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
28800513a670SBarry Smith 
28810513a670SBarry Smith   /* determine lengths of permuted rows */
28829566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
28832205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
28849566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
28859566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
28869566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
28879566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
28889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
28899566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
28900513a670SBarry Smith 
28919566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
28920513a670SBarry Smith   for (i = 0; i < m; i++) {
28939566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
28942205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
28959566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
28969566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
28970513a670SBarry Smith   }
28989566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
28992205254eSKarl Rupp 
29003c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
29012205254eSKarl Rupp 
29028c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
29039566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
29049fe5e383SStefano Zampini #endif
29059566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
29069566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
29079566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
29089566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
29099566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
29109566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
291148a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
29123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29130513a670SBarry Smith }
29140513a670SBarry Smith 
2915d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2916d71ae5a4SJacob Faibussowitsch {
2917cb5b572fSBarry Smith   PetscFunctionBegin;
291833f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
291933f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2920be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2921be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
29222e5835c6SStefano Zampini     const PetscScalar *aa;
29233ac85a22SJunchao Zhang     PetscScalar       *bb;
2924be6bf707SBarry Smith 
29259566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
29263ac85a22SJunchao Zhang     PetscCall(MatSeqAIJGetArrayWrite(B, &bb));
29273ac85a22SJunchao Zhang 
292808401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
29293ac85a22SJunchao Zhang     PetscCall(PetscArraycpy(bb, aa, a->i[A->rmap->n]));
29309566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
29319566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
29323ac85a22SJunchao Zhang     PetscCall(MatSeqAIJRestoreArrayWrite(B, &bb));
2933cb5b572fSBarry Smith   } else {
29349566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2935cb5b572fSBarry Smith   }
29363ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2937cb5b572fSBarry Smith }
2938cb5b572fSBarry Smith 
2939d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2940d71ae5a4SJacob Faibussowitsch {
29416c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
29426e111a19SKarl Rupp 
29436c0721eeSBarry Smith   PetscFunctionBegin;
29446c0721eeSBarry Smith   *array = a->a;
29453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29466c0721eeSBarry Smith }
29476c0721eeSBarry Smith 
2948d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2949d71ae5a4SJacob Faibussowitsch {
29506c0721eeSBarry Smith   PetscFunctionBegin;
2951f38c1e66SStefano Zampini   *array = NULL;
29523ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
29536c0721eeSBarry Smith }
2954273d9f13SBarry Smith 
29558229c054SShri Abhyankar /*
29568229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29578229c054SShri Abhyankar    have different nonzero structure.
29588229c054SShri Abhyankar */
2959d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2960d71ae5a4SJacob Faibussowitsch {
2961b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2962ec7775f6SShri Abhyankar 
2963ec7775f6SShri Abhyankar   PetscFunctionBegin;
2964ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2965ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
29668e3a54c0SPierre Jolivet     const PetscInt *xjj = PetscSafePointerPlusOffset(xj, xi[i]), *yjj = PetscSafePointerPlusOffset(yj, yi[i]);
2967b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
2968b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
29698af7cee1SJed Brown     nnz[i] = 0;
29708af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
2971b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
2972b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
29738af7cee1SJed Brown       nnz[i]++;
29748af7cee1SJed Brown     }
29758af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
2976ec7775f6SShri Abhyankar   }
29773ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2978ec7775f6SShri Abhyankar }
2979ec7775f6SShri Abhyankar 
2980d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
2981d71ae5a4SJacob Faibussowitsch {
2982b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
2983b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
2984b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
2985b264fe52SHong Zhang 
2986b264fe52SHong Zhang   PetscFunctionBegin;
2987b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
29889566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
29893ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
2990b264fe52SHong Zhang }
2991b264fe52SHong Zhang 
2992d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
2993d71ae5a4SJacob Faibussowitsch {
2994ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
2995ac90fabeSBarry Smith 
2996ac90fabeSBarry Smith   PetscFunctionBegin;
2997134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
2998134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
2999134adf20SPierre Jolivet     if (e) {
30009566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
300181fa06acSBarry Smith       if (e) {
30029566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
3003134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
300481fa06acSBarry Smith       }
300581fa06acSBarry Smith     }
300654c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
300781fa06acSBarry Smith   }
3008ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
30092e5835c6SStefano Zampini     const PetscScalar *xa;
30102e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
301181fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
301281fa06acSBarry Smith 
30139566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
30149566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
30159566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
3016792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
30179566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
30189566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
30199566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
30209566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
3021ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
30229566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
3023ac90fabeSBarry Smith   } else {
30248229c054SShri Abhyankar     Mat       B;
30258229c054SShri Abhyankar     PetscInt *nnz;
30269566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
30279566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
30289566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
30299566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
30309566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
30319566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
30329566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
30339566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
30349566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
30359bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
30369566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
3037ac90fabeSBarry Smith   }
30383ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3039ac90fabeSBarry Smith }
3040ac90fabeSBarry Smith 
3041d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
3042d71ae5a4SJacob Faibussowitsch {
3043354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3044354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
3045354c94deSBarry Smith   PetscInt     i, nz;
3046354c94deSBarry Smith   PetscScalar *a;
3047354c94deSBarry Smith 
3048354c94deSBarry Smith   PetscFunctionBegin;
3049354c94deSBarry Smith   nz = aij->nz;
30509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
30512205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
30529566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
3053354c94deSBarry Smith #else
3054354c94deSBarry Smith   PetscFunctionBegin;
3055354c94deSBarry Smith #endif
30563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3057354c94deSBarry Smith }
3058354c94deSBarry Smith 
3059ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3060d71ae5a4SJacob Faibussowitsch {
3061e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3062d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3063e34fafa9SBarry Smith   PetscReal        atmp;
3064985db425SBarry Smith   PetscScalar     *x;
3065ce496241SStefano Zampini   const MatScalar *aa, *av;
3066e34fafa9SBarry Smith 
3067e34fafa9SBarry Smith   PetscFunctionBegin;
306828b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
30699566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3070ce496241SStefano Zampini   aa = av;
3071e34fafa9SBarry Smith   ai = a->i;
3072e34fafa9SBarry Smith   aj = a->j;
3073e34fafa9SBarry Smith 
30749566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
30759566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
307608401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3077e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
30789371c9d4SSatish Balay     ncols = ai[1] - ai[0];
30799371c9d4SSatish Balay     ai++;
308062e5df07SMark Adams     x[i] = 0;
3081e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3082985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
30839371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
30849371c9d4SSatish Balay         x[i] = atmp;
30859371c9d4SSatish Balay         if (idx) idx[i] = *aj;
30869371c9d4SSatish Balay       }
30879371c9d4SSatish Balay       aa++;
30889371c9d4SSatish Balay       aj++;
3089985db425SBarry Smith     }
3090985db425SBarry Smith   }
30919566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
30929566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
30933ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3094985db425SBarry Smith }
3095985db425SBarry Smith 
3096eede4a3fSMark Adams static PetscErrorCode MatGetRowSumAbs_SeqAIJ(Mat A, Vec v)
3097eede4a3fSMark Adams {
3098eede4a3fSMark Adams   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3099eede4a3fSMark Adams   PetscInt         i, j, m = A->rmap->n, *ai, ncols, n;
3100eede4a3fSMark Adams   PetscScalar     *x;
3101eede4a3fSMark Adams   const MatScalar *aa, *av;
3102eede4a3fSMark Adams 
3103eede4a3fSMark Adams   PetscFunctionBegin;
3104eede4a3fSMark Adams   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3105eede4a3fSMark Adams   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3106eede4a3fSMark Adams   aa = av;
3107eede4a3fSMark Adams   ai = a->i;
3108eede4a3fSMark Adams 
3109eede4a3fSMark Adams   PetscCall(VecGetArrayWrite(v, &x));
3110eede4a3fSMark Adams   PetscCall(VecGetLocalSize(v, &n));
3111eede4a3fSMark Adams   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3112eede4a3fSMark Adams   for (i = 0; i < m; i++) {
3113eede4a3fSMark Adams     ncols = ai[1] - ai[0];
3114eede4a3fSMark Adams     ai++;
311562e5df07SMark Adams     x[i] = 0;
3116eede4a3fSMark Adams     for (j = 0; j < ncols; j++) {
3117eede4a3fSMark Adams       x[i] += PetscAbsScalar(*aa);
3118eede4a3fSMark Adams       aa++;
3119eede4a3fSMark Adams     }
3120eede4a3fSMark Adams   }
3121eede4a3fSMark Adams   PetscCall(VecRestoreArrayWrite(v, &x));
3122eede4a3fSMark Adams   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3123eede4a3fSMark Adams   PetscFunctionReturn(PETSC_SUCCESS);
3124eede4a3fSMark Adams }
3125eede4a3fSMark Adams 
3126ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3127d71ae5a4SJacob Faibussowitsch {
3128985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3129d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3130985db425SBarry Smith   PetscScalar     *x;
3131ce496241SStefano Zampini   const MatScalar *aa, *av;
3132985db425SBarry Smith 
3133985db425SBarry Smith   PetscFunctionBegin;
313428b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3136ce496241SStefano Zampini   aa = av;
3137985db425SBarry Smith   ai = a->i;
3138985db425SBarry Smith   aj = a->j;
3139985db425SBarry Smith 
31409566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31419566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
314208401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3143985db425SBarry Smith   for (i = 0; i < m; i++) {
31449371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31459371c9d4SSatish Balay     ai++;
3146d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31479371c9d4SSatish Balay       x[i] = *aa;
31489371c9d4SSatish Balay       if (idx) idx[i] = 0;
3149985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3150985db425SBarry Smith       x[i] = 0.0;
3151985db425SBarry Smith       if (idx) {
3152985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3153985db425SBarry Smith           if (aj[j] > j) {
3154985db425SBarry Smith             idx[i] = j;
3155985db425SBarry Smith             break;
3156985db425SBarry Smith           }
3157985db425SBarry Smith         }
31581a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31591a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3160985db425SBarry Smith       }
3161985db425SBarry Smith     }
3162985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31639371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31649371c9d4SSatish Balay         x[i] = *aa;
31659371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31669371c9d4SSatish Balay       }
31679371c9d4SSatish Balay       aa++;
31689371c9d4SSatish Balay       aj++;
3169985db425SBarry Smith     }
3170985db425SBarry Smith   }
31719566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
31733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3174985db425SBarry Smith }
3175985db425SBarry Smith 
3176ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3177d71ae5a4SJacob Faibussowitsch {
3178c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3179c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3180ce496241SStefano Zampini   PetscScalar     *x;
3181ce496241SStefano Zampini   const MatScalar *aa, *av;
3182c87e5d42SMatthew Knepley 
3183c87e5d42SMatthew Knepley   PetscFunctionBegin;
31849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3185ce496241SStefano Zampini   aa = av;
3186c87e5d42SMatthew Knepley   ai = a->i;
3187c87e5d42SMatthew Knepley   aj = a->j;
3188c87e5d42SMatthew Knepley 
31899566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31909566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
319108401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3192c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
31939371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31949371c9d4SSatish Balay     ai++;
3195f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
31969371c9d4SSatish Balay       x[i] = *aa;
31979371c9d4SSatish Balay       if (idx) idx[i] = 0;
3198f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3199f07e67edSHong Zhang       x[i] = 0.0;
3200f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3201289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3202f07e67edSHong Zhang           if (aj[j] > j) {
3203f07e67edSHong Zhang             idx[i] = j;
32042205254eSKarl Rupp             break;
32052205254eSKarl Rupp           }
3206289a08f5SMatthew Knepley         }
3207f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3208f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3209f07e67edSHong Zhang       }
3210289a08f5SMatthew Knepley     }
3211c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
32129371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
32139371c9d4SSatish Balay         x[i] = *aa;
32149371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32159371c9d4SSatish Balay       }
32169371c9d4SSatish Balay       aa++;
32179371c9d4SSatish Balay       aj++;
3218c87e5d42SMatthew Knepley     }
3219c87e5d42SMatthew Knepley   }
32209566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32223ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3223c87e5d42SMatthew Knepley }
3224c87e5d42SMatthew Knepley 
3225ba38deedSJacob Faibussowitsch static PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3226d71ae5a4SJacob Faibussowitsch {
3227985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3228d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3229d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3230985db425SBarry Smith   PetscScalar     *x;
3231ce496241SStefano Zampini   const MatScalar *aa, *av;
3232985db425SBarry Smith 
3233985db425SBarry Smith   PetscFunctionBegin;
323428b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
32359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3236ce496241SStefano Zampini   aa = av;
3237985db425SBarry Smith   ai = a->i;
3238985db425SBarry Smith   aj = a->j;
3239985db425SBarry Smith 
32409566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32419566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
324208401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3243985db425SBarry Smith   for (i = 0; i < m; i++) {
32449371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32459371c9d4SSatish Balay     ai++;
3246d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
32479371c9d4SSatish Balay       x[i] = *aa;
32489371c9d4SSatish Balay       if (idx) idx[i] = 0;
3249985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3250985db425SBarry Smith       x[i] = 0.0;
3251985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3252985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3253985db425SBarry Smith           if (aj[j] > j) {
3254985db425SBarry Smith             idx[i] = j;
3255985db425SBarry Smith             break;
3256985db425SBarry Smith           }
3257985db425SBarry Smith         }
3258fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3259fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3260985db425SBarry Smith       }
3261985db425SBarry Smith     }
3262985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32639371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32649371c9d4SSatish Balay         x[i] = *aa;
32659371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32669371c9d4SSatish Balay       }
32679371c9d4SSatish Balay       aa++;
32689371c9d4SSatish Balay       aj++;
3269e34fafa9SBarry Smith     }
3270e34fafa9SBarry Smith   }
32719566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
32733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3274e34fafa9SBarry Smith }
3275bbead8a2SBarry Smith 
3276ba38deedSJacob Faibussowitsch static PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3277d71ae5a4SJacob Faibussowitsch {
3278bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
327958b7e2c1SStefano Zampini   PetscInt        i, bs = A->rmap->bs, mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3280bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
32810da83c2eSBarry Smith   const PetscReal shift = 0.0;
32821a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3283bbead8a2SBarry Smith 
3284bbead8a2SBarry Smith   PetscFunctionBegin;
3285a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
32864a0d0026SBarry Smith   if (a->ibdiagvalid) {
32874a0d0026SBarry Smith     if (values) *values = a->ibdiag;
32883ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
32894a0d0026SBarry Smith   }
32909566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
32913a7d0413SPierre Jolivet   if (!a->ibdiag) PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag));
3292bbead8a2SBarry Smith   diag = a->ibdiag;
3293bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3294bbead8a2SBarry Smith   /* factor and invert each block */
3295bbead8a2SBarry Smith   switch (bs) {
3296bbead8a2SBarry Smith   case 1:
3297bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
32989566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3299ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3300966bd95aSPierre Jolivet         PetscCheck(allowzeropivot, PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
33017b6c816cSBarry Smith         A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33027b6c816cSBarry Smith         A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
33037b6c816cSBarry Smith         A->factorerror_zeropivot_row   = i;
33049566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
3305ec1892c8SHong Zhang       }
3306bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3307bbead8a2SBarry Smith     }
3308bbead8a2SBarry Smith     break;
3309bbead8a2SBarry Smith   case 2:
3310bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33119371c9d4SSatish Balay       ij[0] = 2 * i;
33129371c9d4SSatish Balay       ij[1] = 2 * i + 1;
33139566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
33149566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
33157b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33169566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3317bbead8a2SBarry Smith       diag += 4;
3318bbead8a2SBarry Smith     }
3319bbead8a2SBarry Smith     break;
3320bbead8a2SBarry Smith   case 3:
3321bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33229371c9d4SSatish Balay       ij[0] = 3 * i;
33239371c9d4SSatish Balay       ij[1] = 3 * i + 1;
33249371c9d4SSatish Balay       ij[2] = 3 * i + 2;
33259566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
33269566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
33277b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33289566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3329bbead8a2SBarry Smith       diag += 9;
3330bbead8a2SBarry Smith     }
3331bbead8a2SBarry Smith     break;
3332bbead8a2SBarry Smith   case 4:
3333bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33349371c9d4SSatish Balay       ij[0] = 4 * i;
33359371c9d4SSatish Balay       ij[1] = 4 * i + 1;
33369371c9d4SSatish Balay       ij[2] = 4 * i + 2;
33379371c9d4SSatish Balay       ij[3] = 4 * i + 3;
33389566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
33399566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
33407b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33419566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3342bbead8a2SBarry Smith       diag += 16;
3343bbead8a2SBarry Smith     }
3344bbead8a2SBarry Smith     break;
3345bbead8a2SBarry Smith   case 5:
3346bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33479371c9d4SSatish Balay       ij[0] = 5 * i;
33489371c9d4SSatish Balay       ij[1] = 5 * i + 1;
33499371c9d4SSatish Balay       ij[2] = 5 * i + 2;
33509371c9d4SSatish Balay       ij[3] = 5 * i + 3;
33519371c9d4SSatish Balay       ij[4] = 5 * i + 4;
33529566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
33539566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
33547b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33559566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3356bbead8a2SBarry Smith       diag += 25;
3357bbead8a2SBarry Smith     }
3358bbead8a2SBarry Smith     break;
3359bbead8a2SBarry Smith   case 6:
3360bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33619371c9d4SSatish Balay       ij[0] = 6 * i;
33629371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33639371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33649371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33659371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33669371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33679566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33689566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33697b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33709566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3371bbead8a2SBarry Smith       diag += 36;
3372bbead8a2SBarry Smith     }
3373bbead8a2SBarry Smith     break;
3374bbead8a2SBarry Smith   case 7:
3375bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33769371c9d4SSatish Balay       ij[0] = 7 * i;
33779371c9d4SSatish Balay       ij[1] = 7 * i + 1;
33789371c9d4SSatish Balay       ij[2] = 7 * i + 2;
33799371c9d4SSatish Balay       ij[3] = 7 * i + 3;
33809371c9d4SSatish Balay       ij[4] = 7 * i + 4;
33819371c9d4SSatish Balay       ij[5] = 7 * i + 5;
3382cdd8bf47SJunchao Zhang       ij[6] = 7 * i + 6;
33839566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
33849566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
33857b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33869566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3387bbead8a2SBarry Smith       diag += 49;
3388bbead8a2SBarry Smith     }
3389bbead8a2SBarry Smith     break;
3390bbead8a2SBarry Smith   default:
33919566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3392bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3393ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
33949566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
33959566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
33967b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33979566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3398bbead8a2SBarry Smith       diag += bs2;
3399bbead8a2SBarry Smith     }
34009566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3401bbead8a2SBarry Smith   }
3402bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
34033ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3404bbead8a2SBarry Smith }
3405bbead8a2SBarry Smith 
3406d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3407d71ae5a4SJacob Faibussowitsch {
340873a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3409fff043a9SJunchao Zhang   PetscScalar a, *aa;
341073a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
341173a71a0fSBarry Smith 
341273a71a0fSBarry Smith   PetscFunctionBegin;
341373a71a0fSBarry Smith   if (!x->assembled) {
34149566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
341573a71a0fSBarry Smith     for (i = 0; i < m; i++) {
341673a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
34179566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
341873a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
34199566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
342073a71a0fSBarry Smith       }
342173a71a0fSBarry Smith     }
3422e2ce353bSJunchao Zhang   } else {
34239566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
34249566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
34259566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3426e2ce353bSJunchao Zhang   }
34279566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34289566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34293ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
343073a71a0fSBarry Smith }
343173a71a0fSBarry Smith 
3432679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3433d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3434d71ae5a4SJacob Faibussowitsch {
3435679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3436679944adSJunchao Zhang   PetscScalar a;
3437679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3438679944adSJunchao Zhang 
3439679944adSJunchao Zhang   PetscFunctionBegin;
3440679944adSJunchao Zhang   nskip = high - low;
34419566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3442679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3443679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3444679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
34459566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3446679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3447679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
34489566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3449679944adSJunchao Zhang     }
3450e2ce353bSJunchao Zhang   }
34519566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34529566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
34533ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3454679944adSJunchao Zhang }
3455679944adSJunchao Zhang 
34560a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3457cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3458cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3459cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
346097304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34617c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34627c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3463f4259b30SLisandro Dalcin                                        NULL,
3464f4259b30SLisandro Dalcin                                        NULL,
3465f4259b30SLisandro Dalcin                                        NULL,
3466f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3467cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3468f4259b30SLisandro Dalcin                                        NULL,
346941f059aeSBarry Smith                                        MatSOR_SeqAIJ,
347091e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
347197304618SKris Buschelman                                        /* 15*/ MatGetInfo_SeqAIJ,
3472cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3473cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3474cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3475cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3476f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3477cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3478cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3479cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3480d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3481f4259b30SLisandro Dalcin                                        NULL,
3482f4259b30SLisandro Dalcin                                        NULL,
3483f4259b30SLisandro Dalcin                                        NULL,
3484f4259b30SLisandro Dalcin                                        NULL,
348526cec326SBarry Smith                                        /* 29*/ MatSetUp_Seq_Hash,
3486f4259b30SLisandro Dalcin                                        NULL,
3487f4259b30SLisandro Dalcin                                        NULL,
3488f4259b30SLisandro Dalcin                                        NULL,
3489f4259b30SLisandro Dalcin                                        NULL,
3490d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3491f4259b30SLisandro Dalcin                                        NULL,
3492f4259b30SLisandro Dalcin                                        NULL,
3493cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3494f4259b30SLisandro Dalcin                                        NULL,
3495d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
34967dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3497cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3498cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3499cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3500d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3501cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
35027d68702bSBarry Smith                                        MatShift_SeqAIJ,
350379299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
35046e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
350573a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
35063b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
35073b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
35083b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3509a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
351093dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3511f4259b30SLisandro Dalcin                                        NULL,
3512f4259b30SLisandro Dalcin                                        NULL,
3513cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3514f4259b30SLisandro Dalcin                                        NULL,
3515f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3516b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3517b9b97703SBarry Smith                                        MatView_SeqAIJ,
3518f4259b30SLisandro Dalcin                                        NULL,
3519f4259b30SLisandro Dalcin                                        NULL,
35208bb0f5c6SPierre Jolivet                                        /* 64*/ MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3521f4259b30SLisandro Dalcin                                        NULL,
3522f4259b30SLisandro Dalcin                                        NULL,
3523f4259b30SLisandro Dalcin                                        NULL,
35248bb0f5c6SPierre Jolivet                                        MatGetRowMaxAbs_SeqAIJ,
35258bb0f5c6SPierre Jolivet                                        /* 69*/ MatGetRowMinAbs_SeqAIJ,
3526f4259b30SLisandro Dalcin                                        NULL,
3527f4259b30SLisandro Dalcin                                        NULL,
35283acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3529f4259b30SLisandro Dalcin                                        NULL,
35308bb0f5c6SPierre Jolivet                                        /* 74*/ MatFindZeroDiagonals_SeqAIJ,
3531f4259b30SLisandro Dalcin                                        NULL,
3532f4259b30SLisandro Dalcin                                        NULL,
3533f4259b30SLisandro Dalcin                                        NULL,
3534bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
35358bb0f5c6SPierre Jolivet                                        /* 79*/ NULL,
35368bb0f5c6SPierre Jolivet                                        NULL,
35378bb0f5c6SPierre Jolivet                                        NULL,
35388bb0f5c6SPierre Jolivet                                        NULL,
35398bb0f5c6SPierre Jolivet                                        NULL,
35406cff0a6bSPierre Jolivet                                        /* 84*/ NULL,
354126be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
35428bb0f5c6SPierre Jolivet                                        MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3543f4259b30SLisandro Dalcin                                        NULL,
35446fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
35458bb0f5c6SPierre Jolivet                                        /* 90*/ NULL,
35468bb0f5c6SPierre Jolivet                                        MatProductSetFromOptions_SeqAIJ,
3547f4259b30SLisandro Dalcin                                        NULL,
3548f4259b30SLisandro Dalcin                                        NULL,
354987d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
35508bb0f5c6SPierre Jolivet                                        /* 94*/ NULL,
35518bb0f5c6SPierre Jolivet                                        MatSetValuesRow_SeqAIJ,
355299cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3553f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3554f4259b30SLisandro Dalcin                                        NULL,
35558bb0f5c6SPierre Jolivet                                        /* 99*/ NULL,
35568bb0f5c6SPierre Jolivet                                        MatMatSolve_SeqAIJ,
3557f4259b30SLisandro Dalcin                                        NULL,
35582af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3559f4259b30SLisandro Dalcin                                        NULL,
35608bb0f5c6SPierre Jolivet                                        /*104*/ MatMissingDiagonal_SeqAIJ,
3561f4259b30SLisandro Dalcin                                        NULL,
3562f4259b30SLisandro Dalcin                                        NULL,
3563f4259b30SLisandro Dalcin                                        NULL,
3564f4259b30SLisandro Dalcin                                        NULL,
35658bb0f5c6SPierre Jolivet                                        /*109*/ NULL,
3566f4259b30SLisandro Dalcin                                        NULL,
3567f4259b30SLisandro Dalcin                                        NULL,
3568f4259b30SLisandro Dalcin                                        NULL,
35698bb0f5c6SPierre Jolivet                                        NULL,
35708bb0f5c6SPierre Jolivet                                        /*114*/ MatGetMultiProcBlock_SeqAIJ,
35718bb0f5c6SPierre Jolivet                                        MatFindNonzeroRows_SeqAIJ,
3572a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
357337868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
35740da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
35758bb0f5c6SPierre Jolivet                                        /*119*/ NULL,
3576f4259b30SLisandro Dalcin                                        NULL,
3577f4259b30SLisandro Dalcin                                        NULL,
357875648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3579b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
35808bb0f5c6SPierre Jolivet                                        /*124*/ MatTransColoringApplySpToDen_SeqAIJ,
35812b8ad9a3SHong Zhang                                        MatTransColoringApplyDenToSp_SeqAIJ,
35823964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
35838bb0f5c6SPierre Jolivet                                        NULL,
35848bb0f5c6SPierre Jolivet                                        NULL,
35858bb0f5c6SPierre Jolivet                                        /*129*/ MatFDColoringSetUp_SeqXAIJ,
35868bb0f5c6SPierre Jolivet                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
35878bb0f5c6SPierre Jolivet                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
35888bb0f5c6SPierre Jolivet                                        MatDestroySubMatrices_SeqAIJ,
35898bb0f5c6SPierre Jolivet                                        NULL,
35908bb0f5c6SPierre Jolivet                                        /*134*/ NULL,
35918bb0f5c6SPierre Jolivet                                        MatCreateGraph_Simple_AIJ,
35928bb0f5c6SPierre Jolivet                                        MatTransposeSymbolic_SeqAIJ,
35938bb0f5c6SPierre Jolivet                                        MatEliminateZeros_SeqAIJ,
35948bb0f5c6SPierre Jolivet                                        MatGetRowSumAbs_SeqAIJ,
3595f4259b30SLisandro Dalcin                                        /*139*/ NULL,
3596f4259b30SLisandro Dalcin                                        NULL,
3597f4259b30SLisandro Dalcin                                        NULL,
359803db1824SAlex Lindsay                                        MatCopyHashToXAIJ_Seq_Hash,
3599c2be7ffeSStefano Zampini                                        NULL,
360003db1824SAlex Lindsay                                        NULL};
360117ab2063SBarry Smith 
3602ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3603d71ae5a4SJacob Faibussowitsch {
3604bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
360597f1f81fSBarry Smith   PetscInt    i, nz, n;
3606bef8e0ddSBarry Smith 
3607bef8e0ddSBarry Smith   PetscFunctionBegin;
3608bef8e0ddSBarry Smith   nz = aij->maxnz;
3609d0f46423SBarry Smith   n  = mat->rmap->n;
3610ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3611bef8e0ddSBarry Smith   aij->nz = nz;
3612ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
36133ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3614bef8e0ddSBarry Smith }
3615bef8e0ddSBarry Smith 
3616a3bb6f32SFande Kong /*
3617ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3618ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3619ddea5d60SJunchao Zhang  */
3620d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3621d71ae5a4SJacob Faibussowitsch {
3622a3bb6f32SFande Kong   Mat_SeqAIJ   *aij = (Mat_SeqAIJ *)mat->data;
3623eec179cfSJacob Faibussowitsch   PetscHMapI    gid1_lid1;
3624eec179cfSJacob Faibussowitsch   PetscHashIter tpos;
362525b670f0SStefano Zampini   PetscInt      gid, lid, i, ec, nz = aij->nz;
362625b670f0SStefano Zampini   PetscInt     *garray, *jj = aij->j;
3627a3bb6f32SFande Kong 
3628a3bb6f32SFande Kong   PetscFunctionBegin;
3629a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
36304f572ea9SToby Isaac   PetscAssertPointer(mapping, 2);
3631a3bb6f32SFande Kong   /* use a table */
3632eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapICreateWithSize(mat->rmap->n, &gid1_lid1));
3633a3bb6f32SFande Kong   ec = 0;
363425b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
363525b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
3636eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &data));
3637a3bb6f32SFande Kong     if (!data) {
3638a3bb6f32SFande Kong       /* one based table */
3639c76ffc5fSJacob Faibussowitsch       PetscCall(PetscHMapISet(gid1_lid1, gid1, ++ec));
3640a3bb6f32SFande Kong     }
3641a3bb6f32SFande Kong   }
3642a3bb6f32SFande Kong   /* form array of columns we need */
36439566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
3644eec179cfSJacob Faibussowitsch   PetscHashIterBegin(gid1_lid1, tpos);
3645eec179cfSJacob Faibussowitsch   while (!PetscHashIterAtEnd(gid1_lid1, tpos)) {
3646eec179cfSJacob Faibussowitsch     PetscHashIterGetKey(gid1_lid1, tpos, gid);
3647eec179cfSJacob Faibussowitsch     PetscHashIterGetVal(gid1_lid1, tpos, lid);
3648eec179cfSJacob Faibussowitsch     PetscHashIterNext(gid1_lid1, tpos);
3649a3bb6f32SFande Kong     gid--;
3650a3bb6f32SFande Kong     lid--;
3651a3bb6f32SFande Kong     garray[lid] = gid;
3652a3bb6f32SFande Kong   }
36539566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
3654eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIClear(gid1_lid1));
3655c76ffc5fSJacob Faibussowitsch   for (i = 0; i < ec; i++) PetscCall(PetscHMapISet(gid1_lid1, garray[i] + 1, i + 1));
3656a3bb6f32SFande Kong   /* compact out the extra columns in B */
365725b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
365825b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
3659eec179cfSJacob Faibussowitsch     PetscCall(PetscHMapIGetWithDefault(gid1_lid1, gid1, 0, &lid));
3660a3bb6f32SFande Kong     lid--;
366125b670f0SStefano Zampini     jj[i] = lid;
3662a3bb6f32SFande Kong   }
36639566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
3664eec179cfSJacob Faibussowitsch   PetscCall(PetscHMapIDestroy(&gid1_lid1));
36659566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
36669566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
36679566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
36683ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3669a3bb6f32SFande Kong }
3670a3bb6f32SFande Kong 
3671bef8e0ddSBarry Smith /*@
3672bef8e0ddSBarry Smith   MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3673bef8e0ddSBarry Smith   in the matrix.
3674bef8e0ddSBarry Smith 
3675bef8e0ddSBarry Smith   Input Parameters:
367611a5261eSBarry Smith + mat     - the `MATSEQAIJ` matrix
3677bef8e0ddSBarry Smith - indices - the column indices
3678bef8e0ddSBarry Smith 
367915091d37SBarry Smith   Level: advanced
368015091d37SBarry Smith 
3681bef8e0ddSBarry Smith   Notes:
3682bef8e0ddSBarry Smith   This can be called if you have precomputed the nonzero structure of the
3683bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
368411a5261eSBarry Smith   of the `MatSetValues()` operation.
3685bef8e0ddSBarry Smith 
3686bef8e0ddSBarry Smith   You MUST have set the correct numbers of nonzeros per row in the call to
368711a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the columns indices MUST be sorted.
3688bef8e0ddSBarry Smith 
368911a5261eSBarry Smith   MUST be called before any calls to `MatSetValues()`
3690bef8e0ddSBarry Smith 
3691b9617806SBarry Smith   The indices should start with zero, not one.
3692b9617806SBarry Smith 
36931cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MATSEQAIJ`
3694bef8e0ddSBarry Smith @*/
3695d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3696d71ae5a4SJacob Faibussowitsch {
3697bef8e0ddSBarry Smith   PetscFunctionBegin;
36980700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
36994f572ea9SToby Isaac   PetscAssertPointer(indices, 2);
3700cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
37013ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3702bef8e0ddSBarry Smith }
3703bef8e0ddSBarry Smith 
3704ba38deedSJacob Faibussowitsch static PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3705d71ae5a4SJacob Faibussowitsch {
3706be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3707d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3708be6bf707SBarry Smith 
3709be6bf707SBarry Smith   PetscFunctionBegin;
371028b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3711be6bf707SBarry Smith 
3712be6bf707SBarry Smith   /* allocate space for values if not already there */
37133a7d0413SPierre Jolivet   if (!aij->saved_values) PetscCall(PetscMalloc1(nz + 1, &aij->saved_values));
3714be6bf707SBarry Smith 
3715be6bf707SBarry Smith   /* copy values over */
37169566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
37173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3718be6bf707SBarry Smith }
3719be6bf707SBarry Smith 
3720be6bf707SBarry Smith /*@
372120f4b53cSBarry Smith   MatStoreValues - Stashes a copy of the matrix values; this allows reusing of the linear part of a Jacobian, while recomputing only the
3722be6bf707SBarry Smith   nonlinear portion.
3723be6bf707SBarry Smith 
3724c3339decSBarry Smith   Logically Collect
3725be6bf707SBarry Smith 
372627430b45SBarry Smith   Input Parameter:
372711a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3728be6bf707SBarry Smith 
372915091d37SBarry Smith   Level: advanced
373015091d37SBarry Smith 
37312920cce0SJacob Faibussowitsch   Example Usage:
373227430b45SBarry Smith .vb
37332ef1f0ffSBarry Smith     Using SNES
373427430b45SBarry Smith     Create Jacobian matrix
373527430b45SBarry Smith     Set linear terms into matrix
373627430b45SBarry Smith     Apply boundary conditions to matrix, at this time matrix must have
373727430b45SBarry Smith       final nonzero structure (i.e. setting the nonlinear terms and applying
373827430b45SBarry Smith       boundary conditions again will not change the nonzero structure
373927430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
374027430b45SBarry Smith     MatStoreValues(mat);
374127430b45SBarry Smith     Call SNESSetJacobian() with matrix
374227430b45SBarry Smith     In your Jacobian routine
374327430b45SBarry Smith       MatRetrieveValues(mat);
374427430b45SBarry Smith       Set nonlinear terms in matrix
3745be6bf707SBarry Smith 
374627430b45SBarry Smith     Without `SNESSolve()`, i.e. when you handle nonlinear solve yourself:
374727430b45SBarry Smith     // build linear portion of Jacobian
374827430b45SBarry Smith     MatSetOption(mat, MAT_NEW_NONZERO_LOCATIONS, PETSC_FALSE);
374927430b45SBarry Smith     MatStoreValues(mat);
375027430b45SBarry Smith     loop over nonlinear iterations
375127430b45SBarry Smith        MatRetrieveValues(mat);
375227430b45SBarry Smith        // call MatSetValues(mat,...) to set nonliner portion of Jacobian
375327430b45SBarry Smith        // call MatAssemblyBegin/End() on matrix
375427430b45SBarry Smith        Solve linear system with Jacobian
375527430b45SBarry Smith     endloop
375627430b45SBarry Smith .ve
3757be6bf707SBarry Smith 
3758be6bf707SBarry Smith   Notes:
3759da81f932SPierre Jolivet   Matrix must already be assembled before calling this routine
376011a5261eSBarry Smith   Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3761be6bf707SBarry Smith   calling this routine.
3762be6bf707SBarry Smith 
37630c468ba9SBarry Smith   When this is called multiple times it overwrites the previous set of stored values
37640c468ba9SBarry Smith   and does not allocated additional space.
37650c468ba9SBarry Smith 
3766fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatRetrieveValues()`
3767be6bf707SBarry Smith @*/
3768d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3769d71ae5a4SJacob Faibussowitsch {
3770be6bf707SBarry Smith   PetscFunctionBegin;
37710700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
377228b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
377328b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3774cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
37753ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3776be6bf707SBarry Smith }
3777be6bf707SBarry Smith 
3778ba38deedSJacob Faibussowitsch static PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3779d71ae5a4SJacob Faibussowitsch {
3780be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3781d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3782be6bf707SBarry Smith 
3783be6bf707SBarry Smith   PetscFunctionBegin;
378428b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
378528b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3786be6bf707SBarry Smith   /* copy values over */
37879566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
37883ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3789be6bf707SBarry Smith }
3790be6bf707SBarry Smith 
3791be6bf707SBarry Smith /*@
379220f4b53cSBarry Smith   MatRetrieveValues - Retrieves the copy of the matrix values that was stored with `MatStoreValues()`
3793be6bf707SBarry Smith 
3794c3339decSBarry Smith   Logically Collect
3795be6bf707SBarry Smith 
37962fe279fdSBarry Smith   Input Parameter:
379711a5261eSBarry Smith . mat - the matrix (currently only `MATAIJ` matrices support this option)
3798be6bf707SBarry Smith 
379915091d37SBarry Smith   Level: advanced
380015091d37SBarry Smith 
38011cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatStoreValues()`
3802be6bf707SBarry Smith @*/
3803d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3804d71ae5a4SJacob Faibussowitsch {
3805be6bf707SBarry Smith   PetscFunctionBegin;
38060700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
380728b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
380828b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3809cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
38103ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3811be6bf707SBarry Smith }
3812be6bf707SBarry Smith 
38135d83a8b1SBarry Smith /*@
381411a5261eSBarry Smith   MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
38150d15e28bSLois Curfman McInnes   (the default parallel PETSc format).  For good matrix assembly performance
381620f4b53cSBarry Smith   the user should preallocate the matrix storage by setting the parameter `nz`
381720f4b53cSBarry Smith   (or the array `nnz`).
381817ab2063SBarry Smith 
3819d083f849SBarry Smith   Collective
3820db81eaa0SLois Curfman McInnes 
382117ab2063SBarry Smith   Input Parameters:
382211a5261eSBarry Smith + comm - MPI communicator, set to `PETSC_COMM_SELF`
382317ab2063SBarry Smith . m    - number of rows
382417ab2063SBarry Smith . n    - number of columns
382517ab2063SBarry Smith . nz   - number of nonzeros per row (same for all rows)
382651c19458SBarry Smith - nnz  - array containing the number of nonzeros in the various rows
38270298fd71SBarry Smith          (possibly different for each row) or NULL
382817ab2063SBarry Smith 
382917ab2063SBarry Smith   Output Parameter:
3830416022c9SBarry Smith . A - the matrix
383117ab2063SBarry Smith 
38322ef1f0ffSBarry Smith   Options Database Keys:
38332ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
38342ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38352ef1f0ffSBarry Smith 
38362ef1f0ffSBarry Smith   Level: intermediate
3837175b88e8SBarry Smith 
3838b259b22eSLois Curfman McInnes   Notes:
383977433607SBarry Smith   It is recommend to use `MatCreateFromOptions()` instead of this routine
384077433607SBarry Smith 
38412ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
384249a6f317SBarry Smith 
38432ef1f0ffSBarry Smith   The `MATSEQAIJ` format, also called
38442ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
38450002213bSLois Curfman McInnes   storage.  That is, the stored row and column indices can begin at
38462ef1f0ffSBarry Smith   either one (as in Fortran) or zero.
384717ab2063SBarry Smith 
384820f4b53cSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
38492ef1f0ffSBarry Smith   Set `nz` = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
385020f4b53cSBarry Smith   allocation.
385117ab2063SBarry Smith 
3852682d7d0cSBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
38534fca80b9SLois Curfman McInnes   improve numerical efficiency of matrix-vector products and solves. We
3854682d7d0cSBarry Smith   search for consecutive rows with the same nonzero structure, thereby
38556c7ebb05SLois Curfman McInnes   reusing matrix information to achieve increased efficiency.
38566c7ebb05SLois Curfman McInnes 
38571cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
385817ab2063SBarry Smith @*/
3859d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3860d71ae5a4SJacob Faibussowitsch {
38613a40ed3dSBarry Smith   PetscFunctionBegin;
38629566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
38639566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
38649566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
38659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
38663ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3867273d9f13SBarry Smith }
3868273d9f13SBarry Smith 
38695d83a8b1SBarry Smith /*@
3870273d9f13SBarry Smith   MatSeqAIJSetPreallocation - For good matrix assembly performance
3871273d9f13SBarry Smith   the user should preallocate the matrix storage by setting the parameter nz
3872273d9f13SBarry Smith   (or the array nnz).  By setting these parameters accurately, performance
3873273d9f13SBarry Smith   during matrix assembly can be increased by more than a factor of 50.
3874273d9f13SBarry Smith 
3875d083f849SBarry Smith   Collective
3876273d9f13SBarry Smith 
3877273d9f13SBarry Smith   Input Parameters:
38781c4f3114SJed Brown + B   - The matrix
3879273d9f13SBarry Smith . nz  - number of nonzeros per row (same for all rows)
3880273d9f13SBarry Smith - nnz - array containing the number of nonzeros in the various rows
38810298fd71SBarry Smith          (possibly different for each row) or NULL
3882273d9f13SBarry Smith 
38832ef1f0ffSBarry Smith   Options Database Keys:
38842ef1f0ffSBarry Smith + -mat_no_inode            - Do not use inodes
38852ef1f0ffSBarry Smith - -mat_inode_limit <limit> - Sets inode limit (max limit=5)
38862ef1f0ffSBarry Smith 
38872ef1f0ffSBarry Smith   Level: intermediate
38882ef1f0ffSBarry Smith 
3889273d9f13SBarry Smith   Notes:
38902ef1f0ffSBarry Smith   If `nnz` is given then `nz` is ignored
389149a6f317SBarry Smith 
389211a5261eSBarry Smith   The `MATSEQAIJ` format also called
38932ef1f0ffSBarry Smith   compressed row storage, is fully compatible with standard Fortran
3894273d9f13SBarry Smith   storage.  That is, the stored row and column indices can begin at
3895273d9f13SBarry Smith   either one (as in Fortran) or zero.  See the users' manual for details.
3896273d9f13SBarry Smith 
38972ef1f0ffSBarry Smith   Specify the preallocated storage with either `nz` or `nnz` (not both).
38982ef1f0ffSBarry Smith   Set nz = `PETSC_DEFAULT` and `nnz` = `NULL` for PETSc to control dynamic memory
38992ef1f0ffSBarry Smith   allocation.
3900273d9f13SBarry Smith 
390111a5261eSBarry Smith   You can call `MatGetInfo()` to get information on how effective the preallocation was;
3902aa95bbe8SBarry Smith   for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3903aa95bbe8SBarry Smith   You can also run with the option -info and look for messages with the string
3904aa95bbe8SBarry Smith   malloc in them to see if additional memory allocation was needed.
3905aa95bbe8SBarry Smith 
390611a5261eSBarry Smith   Developer Notes:
390711a5261eSBarry Smith   Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3908a96a251dSBarry Smith   entries or columns indices
3909a96a251dSBarry Smith 
3910273d9f13SBarry Smith   By default, this format uses inodes (identical nodes) when possible, to
3911273d9f13SBarry Smith   improve numerical efficiency of matrix-vector products and solves. We
3912273d9f13SBarry Smith   search for consecutive rows with the same nonzero structure, thereby
3913273d9f13SBarry Smith   reusing matrix information to achieve increased efficiency.
3914273d9f13SBarry Smith 
39151cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3916db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3917273d9f13SBarry Smith @*/
3918d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3919d71ae5a4SJacob Faibussowitsch {
3920a23d5eceSKris Buschelman   PetscFunctionBegin;
39216ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
39226ba663aaSJed Brown   PetscValidType(B, 1);
3923cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
39243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
3925a23d5eceSKris Buschelman }
3926a23d5eceSKris Buschelman 
3927d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3928d71ae5a4SJacob Faibussowitsch {
3929ad79cf63SBarry Smith   Mat_SeqAIJ *b              = (Mat_SeqAIJ *)B->data;
39302576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
393197f1f81fSBarry Smith   PetscInt    i;
3932273d9f13SBarry Smith 
3933273d9f13SBarry Smith   PetscFunctionBegin;
3934ad79cf63SBarry Smith   if (B->hash_active) {
3935aea10558SJacob Faibussowitsch     B->ops[0] = b->cops;
3936ad79cf63SBarry Smith     PetscCall(PetscHMapIJVDestroy(&b->ht));
3937ad79cf63SBarry Smith     PetscCall(PetscFree(b->dnz));
3938ad79cf63SBarry Smith     B->hash_active = PETSC_FALSE;
3939ad79cf63SBarry Smith   }
39402576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3941a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3942c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3943c461c341SBarry Smith     nz             = 0;
3944c461c341SBarry Smith   }
39459566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
39469566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3947899cda47SBarry Smith 
3948435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
394908401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
39509f0612e4SBarry Smith   if (nnz) {
3951d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
395208401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
395308401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3954b73539f3SBarry Smith     }
3955b73539f3SBarry Smith   }
3956b73539f3SBarry Smith 
3957273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
3958ab93d7beSBarry Smith   if (!skipallocation) {
39593a7d0413SPierre Jolivet     if (!b->imax) PetscCall(PetscMalloc1(B->rmap->n, &b->imax));
3960071fcb05SBarry Smith     if (!b->ilen) {
3961071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
39629566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
3963071fcb05SBarry Smith     } else {
39649566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
39652ee49352SLisandro Dalcin     }
3966aa624791SPierre Jolivet     if (!b->ipre) PetscCall(PetscMalloc1(B->rmap->n, &b->ipre));
3967273d9f13SBarry Smith     if (!nnz) {
3968435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
3969c62bd62aSJed Brown       else if (nz < 0) nz = 1;
39705d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
3971d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
3972c43c4a61SBarry Smith       PetscCall(PetscIntMultError(nz, B->rmap->n, &nz));
3973273d9f13SBarry Smith     } else {
3974c73702f5SBarry Smith       PetscInt64 nz64 = 0;
39759371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
39769371c9d4SSatish Balay         b->imax[i] = nnz[i];
39779371c9d4SSatish Balay         nz64 += nnz[i];
39789371c9d4SSatish Balay       }
39799566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
3980273d9f13SBarry Smith     }
3981ab93d7beSBarry Smith 
3982273d9f13SBarry Smith     /* allocate the matrix space */
39839566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
39849f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscInt), (void **)&b->j));
39859f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(B->rmap->n + 1, sizeof(PetscInt), (void **)&b->i));
39869f0612e4SBarry Smith     b->free_ij = PETSC_TRUE;
3987396832f4SHong Zhang     if (B->structure_only) {
39889f0612e4SBarry Smith       b->free_a = PETSC_FALSE;
3989396832f4SHong Zhang     } else {
39909f0612e4SBarry Smith       PetscCall(PetscShmgetAllocateArray(nz, sizeof(PetscScalar), (void **)&b->a));
39919f0612e4SBarry Smith       b->free_a = PETSC_TRUE;
3992396832f4SHong Zhang     }
3993bfeeae90SHong Zhang     b->i[0] = 0;
3994ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
3995c461c341SBarry Smith   } else {
3996e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
3997e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
3998c461c341SBarry Smith   }
3999273d9f13SBarry Smith 
4000846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
4001846b4da1SFande Kong     /* reserve user-requested sparsity */
40029566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
4003846b4da1SFande Kong   }
4004846b4da1SFande Kong 
4005273d9f13SBarry Smith   b->nz               = 0;
4006273d9f13SBarry Smith   b->maxnz            = nz;
4007273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
40081baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
4009cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
4010cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
40115519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
40125519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
40135519a089SJose E. Roman   */
40145519a089SJose E. Roman   B->nonzerostate++;
40153ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4016273d9f13SBarry Smith }
4017273d9f13SBarry Smith 
40184c51d546SAlexander PetscErrorCode MatResetPreallocation_SeqAIJ_Private(Mat A, PetscBool *memoryreset)
4019d71ae5a4SJacob Faibussowitsch {
4020846b4da1SFande Kong   Mat_SeqAIJ *a;
4021a5bbaf83SFande Kong   PetscInt    i;
40221f14be2bSBarry Smith   PetscBool   skipreset;
4023846b4da1SFande Kong 
4024846b4da1SFande Kong   PetscFunctionBegin;
4025846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
402614d0e64fSAlex Lindsay 
40274c51d546SAlexander   PetscCheck(A->insertmode == NOT_SET_VALUES, PETSC_COMM_SELF, PETSC_ERR_SUP, "Cannot reset preallocation after setting some values but not yet calling MatAssemblyBegin()/MatAssemblyEnd()");
40284c51d546SAlexander   if (A->num_ass == 0) PetscFunctionReturn(PETSC_SUCCESS);
40294c51d546SAlexander 
403014d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
40313ba16761SJacob Faibussowitsch   if (!A->rmap->n) PetscFunctionReturn(PETSC_SUCCESS);
403214d0e64fSAlex Lindsay 
4033846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
40342c814fdeSFande Kong   /* if no saved info, we error out */
403528b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
40362c814fdeSFande Kong 
40371f14be2bSBarry Smith   PetscCheck(a->i && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and cannot reset preallocation ");
40382c814fdeSFande Kong 
40391f14be2bSBarry Smith   PetscCall(PetscArraycmp(a->ipre, a->ilen, A->rmap->n, &skipreset));
40404c51d546SAlexander   if (skipreset) PetscCall(MatZeroEntries(A));
40414c51d546SAlexander   else {
40429566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
40439566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
4044846b4da1SFande Kong     a->i[0] = 0;
4045ad540459SPierre Jolivet     for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
4046846b4da1SFande Kong     A->preallocated     = PETSC_TRUE;
4047846b4da1SFande Kong     a->nz               = 0;
4048846b4da1SFande Kong     a->maxnz            = a->i[A->rmap->n];
4049846b4da1SFande Kong     A->info.nz_unneeded = (double)a->maxnz;
4050846b4da1SFande Kong     A->was_assembled    = PETSC_FALSE;
4051846b4da1SFande Kong     A->assembled        = PETSC_FALSE;
4052b3a35320SAlex Lindsay     A->nonzerostate++;
4053b3a35320SAlex Lindsay     /* Log that the state of this object has changed; this will help guarantee that preconditioners get re-setup */
4054b3a35320SAlex Lindsay     PetscCall(PetscObjectStateIncrease((PetscObject)A));
40551f14be2bSBarry Smith   }
40564c51d546SAlexander   if (memoryreset) *memoryreset = (PetscBool)!skipreset;
40574c51d546SAlexander   PetscFunctionReturn(PETSC_SUCCESS);
40584c51d546SAlexander }
40594c51d546SAlexander 
40604c51d546SAlexander static PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
40614c51d546SAlexander {
40624c51d546SAlexander   PetscFunctionBegin;
40634c51d546SAlexander   PetscCall(MatResetPreallocation_SeqAIJ_Private(A, NULL));
40643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4065846b4da1SFande Kong }
4066846b4da1SFande Kong 
406758d36128SBarry Smith /*@
406811a5261eSBarry Smith   MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4069a1661176SMatthew Knepley 
4070a1661176SMatthew Knepley   Input Parameters:
4071a1661176SMatthew Knepley + B - the matrix
4072d8a51d2aSBarry Smith . i - the indices into `j` for the start of each row (indices start with zero)
4073d8a51d2aSBarry Smith . j - the column indices for each row (indices start with zero) these must be sorted for each row
4074d8a51d2aSBarry Smith - v - optional values in the matrix, use `NULL` if not provided
4075a1661176SMatthew Knepley 
4076a1661176SMatthew Knepley   Level: developer
4077a1661176SMatthew Knepley 
40786a9b8d82SBarry Smith   Notes:
40792ef1f0ffSBarry Smith   The `i`,`j`,`v` values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
408058d36128SBarry Smith 
40816a9b8d82SBarry Smith   This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
40826a9b8d82SBarry Smith   structure will be the union of all the previous nonzero structures.
40836a9b8d82SBarry Smith 
40846a9b8d82SBarry Smith   Developer Notes:
40852ef1f0ffSBarry Smith   An optimization could be added to the implementation where it checks if the `i`, and `j` are identical to the current `i` and `j` and
40862ef1f0ffSBarry Smith   then just copies the `v` values directly with `PetscMemcpy()`.
40876a9b8d82SBarry Smith 
408811a5261eSBarry Smith   This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
40896a9b8d82SBarry Smith 
4090fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MATSEQAIJ`, `MatResetPreallocation()`
4091a1661176SMatthew Knepley @*/
4092d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4093d71ae5a4SJacob Faibussowitsch {
4094a1661176SMatthew Knepley   PetscFunctionBegin;
40950700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
40966ba663aaSJed Brown   PetscValidType(B, 1);
4097cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
40983ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4099a1661176SMatthew Knepley }
4100a1661176SMatthew Knepley 
4101ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4102d71ae5a4SJacob Faibussowitsch {
4103a1661176SMatthew Knepley   PetscInt  i;
4104a1661176SMatthew Knepley   PetscInt  m, n;
4105a1661176SMatthew Knepley   PetscInt  nz;
41066a9b8d82SBarry Smith   PetscInt *nnz;
4107a1661176SMatthew Knepley 
4108a1661176SMatthew Knepley   PetscFunctionBegin;
4109aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4110779a8d59SSatish Balay 
41119566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
41129566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4113779a8d59SSatish Balay 
41149566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
41159566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4116a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4117b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
411808401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4119a1661176SMatthew Knepley     nnz[i] = nz;
4120a1661176SMatthew Knepley   }
41219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
41229566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4123a1661176SMatthew Knepley 
41248e3a54c0SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], PetscSafePointerPlusOffset(v, Ii[i]), INSERT_VALUES));
4125a1661176SMatthew Knepley 
41269566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
41279566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4128a1661176SMatthew Knepley 
41299566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
41303ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4131a1661176SMatthew Knepley }
4132a1661176SMatthew Knepley 
4133ad7e164aSPierre Jolivet /*@
41342ef1f0ffSBarry Smith   MatSeqAIJKron - Computes `C`, the Kronecker product of `A` and `B`.
4135ad7e164aSPierre Jolivet 
4136ad7e164aSPierre Jolivet   Input Parameters:
4137ad7e164aSPierre Jolivet + A     - left-hand side matrix
4138ad7e164aSPierre Jolivet . B     - right-hand side matrix
413911a5261eSBarry Smith - reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4140ad7e164aSPierre Jolivet 
4141ad7e164aSPierre Jolivet   Output Parameter:
41422ef1f0ffSBarry Smith . C - Kronecker product of `A` and `B`
4143ad7e164aSPierre Jolivet 
4144ad7e164aSPierre Jolivet   Level: intermediate
4145ad7e164aSPierre Jolivet 
414611a5261eSBarry Smith   Note:
414711a5261eSBarry Smith   `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed from that last call to `MatSeqAIJKron()`.
4148ad7e164aSPierre Jolivet 
41491cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4150ad7e164aSPierre Jolivet @*/
4151d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4152d71ae5a4SJacob Faibussowitsch {
4153ad7e164aSPierre Jolivet   PetscFunctionBegin;
4154ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4155ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4156ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4157ad7e164aSPierre Jolivet   PetscValidType(B, 2);
41584f572ea9SToby Isaac   PetscAssertPointer(C, 4);
4159ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4160ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4161ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4162ad7e164aSPierre Jolivet   }
4163cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
41643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4165ad7e164aSPierre Jolivet }
4166ad7e164aSPierre Jolivet 
4167ba38deedSJacob Faibussowitsch static PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4168d71ae5a4SJacob Faibussowitsch {
4169ad7e164aSPierre Jolivet   Mat                newmat;
4170ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4171ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4172ad7e164aSPierre Jolivet   PetscScalar       *v;
4173fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4174ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4175ad7e164aSPierre Jolivet   PetscBool          flg;
4176ad7e164aSPierre Jolivet 
4177ad7e164aSPierre Jolivet   PetscFunctionBegin;
417828b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
417928b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
418028b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
418128b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
41829566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
418328b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4184aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4185ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
41869566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
41879566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
41889566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
41899566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4190ad7e164aSPierre Jolivet     i[0] = 0;
4191ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4192ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4193ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4194ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4195ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4196ad7e164aSPierre Jolivet         }
4197ad7e164aSPierre Jolivet       }
4198ad7e164aSPierre Jolivet     }
41999566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4200ad7e164aSPierre Jolivet     *C = newmat;
42019566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4202ad7e164aSPierre Jolivet     nnz = 0;
4203ad7e164aSPierre Jolivet   }
42049566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
42059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
42069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4207ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4208ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4209ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4210ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4211ad7e164aSPierre Jolivet       }
4212ad7e164aSPierre Jolivet     }
4213ad7e164aSPierre Jolivet   }
42149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
42159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
42169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
42173ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4218ad7e164aSPierre Jolivet }
4219ad7e164aSPierre Jolivet 
4220c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4221af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4222170fe5c8SBarry Smith 
4223170fe5c8SBarry Smith /*
4224170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4225170fe5c8SBarry Smith 
4226170fe5c8SBarry Smith                n                       p                          p
42272da392ccSBarry Smith         [             ]       [             ]         [                 ]
42282da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
42292da392ccSBarry Smith         [             ]       [             ]         [                 ]
4230170fe5c8SBarry Smith 
4231170fe5c8SBarry Smith */
4232d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4233d71ae5a4SJacob Faibussowitsch {
4234170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4235170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4236170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
423786214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4238170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4239170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4240170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
424186214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
424286214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4243170fe5c8SBarry Smith 
4244170fe5c8SBarry Smith   PetscFunctionBegin;
4245d0f46423SBarry Smith   m = A->rmap->n;
4246d0f46423SBarry Smith   n = A->cmap->n;
4247d0f46423SBarry Smith   p = B->cmap->n;
4248170fe5c8SBarry Smith   a = sub_a->v;
4249170fe5c8SBarry Smith   b = sub_b->a;
4250170fe5c8SBarry Smith   c = sub_c->v;
425186214ceeSStefano Zampini   if (clda == m) {
42529566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
425386214ceeSStefano Zampini   } else {
425486214ceeSStefano Zampini     for (j = 0; j < p; j++)
42559371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
425686214ceeSStefano Zampini   }
4257170fe5c8SBarry Smith   ii  = sub_b->i;
4258170fe5c8SBarry Smith   idx = sub_b->j;
4259170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4260170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4261170fe5c8SBarry Smith     while (q-- > 0) {
426286214ceeSStefano Zampini       c_q = c + clda * (*idx);
426386214ceeSStefano Zampini       a_q = a + alda * i;
4264854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4265170fe5c8SBarry Smith       idx++;
4266170fe5c8SBarry Smith       b++;
4267170fe5c8SBarry Smith     }
4268170fe5c8SBarry Smith   }
42693ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4270170fe5c8SBarry Smith }
4271170fe5c8SBarry Smith 
4272d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4273d71ae5a4SJacob Faibussowitsch {
4274d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
427586214ceeSStefano Zampini   PetscBool cisdense;
4276170fe5c8SBarry Smith 
4277170fe5c8SBarry Smith   PetscFunctionBegin;
427808401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
42799566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
42809566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
4281d5e393b6SSuyash Tandon   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, MATSEQDENSEHIP, ""));
428248a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
42839566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4284d73949e8SHong Zhang 
42854222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
42863ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4287170fe5c8SBarry Smith }
4288170fe5c8SBarry Smith 
/*MC
   MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
   based on compressed sparse row format.

   Options Database Key:
. -mat_type seqaij - sets the matrix type to "seqaij" during a call to `MatSetFromOptions()`

   Level: beginner

   Notes:
    `MatSetValues()` may be called for this matrix type with a `NULL` argument for the numerical values,
    in this case the values associated with the rows and columns one passes in are set to zero
    in the matrix

    `MatSetOption`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this case no
    space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored

  Developer Note:
    It would be nice if all matrix formats supported passing `NULL` in for the numerical values

.seealso: [](ch_matrices), `Mat`, `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/
43110bad9183SKris Buschelman 
/*MC
   MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.

   This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
   and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Key:
. -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`

  Level: beginner

   Note:
   Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`. This matrix type also
   automatically switches over to use inodes when enough exist.

.seealso: [](ch_matrices), `Mat`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
M*/
4332ccd284c7SBarry Smith 
/*MC
   MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.

   Options Database Key:
. -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`

  Level: beginner

   Note:
   This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
   and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
   `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

.seealso: [](ch_matrices), `Mat`, `MatCreateMPIAIJCRL()`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
M*/
4350ccd284c7SBarry Smith 
43517906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
43527906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
43537906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
43547906f579SHong Zhang #endif
4355d1a032dbSPierre Jolivet #if defined(PETSC_HAVE_SCALAPACK) && (defined(PETSC_USE_REAL_SINGLE) || defined(PETSC_USE_REAL_DOUBLE))
4356d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4357d24d4204SJose E. Roman #endif
43587906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
43597906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
43607906f579SHong Zhang #endif
43617906f579SHong Zhang 
4362d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4363c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
43644222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
43657906f579SHong Zhang 
43668c778c55SBarry Smith /*@C
436711a5261eSBarry Smith   MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
43688c778c55SBarry Smith 
43698c778c55SBarry Smith   Not Collective
43708c778c55SBarry Smith 
43718c778c55SBarry Smith   Input Parameter:
4372fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
43738c778c55SBarry Smith 
43748c778c55SBarry Smith   Output Parameter:
43758c778c55SBarry Smith . array - pointer to the data
43768c778c55SBarry Smith 
43778c778c55SBarry Smith   Level: intermediate
43788c778c55SBarry Smith 
4379ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`
43808c778c55SBarry Smith @*/
43815d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar *array[])
4382d71ae5a4SJacob Faibussowitsch {
4383d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
43848c778c55SBarry Smith 
43858c778c55SBarry Smith   PetscFunctionBegin;
4386d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
43879566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4388d67d9f35SJunchao Zhang   } else {
4389d67d9f35SJunchao Zhang     *array = aij->a;
4390d67d9f35SJunchao Zhang   }
43913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4392d67d9f35SJunchao Zhang }
4393d67d9f35SJunchao Zhang 
4394d67d9f35SJunchao Zhang /*@C
439511a5261eSBarry Smith   MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4396d67d9f35SJunchao Zhang 
4397d67d9f35SJunchao Zhang   Not Collective
4398d67d9f35SJunchao Zhang 
4399d67d9f35SJunchao Zhang   Input Parameters:
4400fe59aa6dSJacob Faibussowitsch + A     - a `MATSEQAIJ` matrix
4401d67d9f35SJunchao Zhang - array - pointer to the data
4402d67d9f35SJunchao Zhang 
4403d67d9f35SJunchao Zhang   Level: intermediate
4404d67d9f35SJunchao Zhang 
4405ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`
4406d67d9f35SJunchao Zhang @*/
44075d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar *array[])
4408d71ae5a4SJacob Faibussowitsch {
4409d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4410d67d9f35SJunchao Zhang 
4411d67d9f35SJunchao Zhang   PetscFunctionBegin;
4412d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
44139566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4414d67d9f35SJunchao Zhang   } else {
4415d67d9f35SJunchao Zhang     *array = NULL;
4416d67d9f35SJunchao Zhang   }
44179566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
44183ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44198c778c55SBarry Smith }
44208c778c55SBarry Smith 
442121e72a00SBarry Smith /*@C
442211a5261eSBarry Smith   MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
44238f1ea47aSStefano Zampini 
44240ab4885dSBarry Smith   Not Collective; No Fortran Support
44258f1ea47aSStefano Zampini 
44268f1ea47aSStefano Zampini   Input Parameter:
4427fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44288f1ea47aSStefano Zampini 
44298f1ea47aSStefano Zampini   Output Parameter:
44308f1ea47aSStefano Zampini . array - pointer to the data
44318f1ea47aSStefano Zampini 
44328f1ea47aSStefano Zampini   Level: intermediate
44338f1ea47aSStefano Zampini 
44341cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
44358f1ea47aSStefano Zampini @*/
44365d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar *array[])
4437d71ae5a4SJacob Faibussowitsch {
4438d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44398f1ea47aSStefano Zampini 
44408f1ea47aSStefano Zampini   PetscFunctionBegin;
4441d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
44429566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4443d67d9f35SJunchao Zhang   } else {
4444d67d9f35SJunchao Zhang     *array = aij->a;
4445d67d9f35SJunchao Zhang   }
44463ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
44478f1ea47aSStefano Zampini }
44488f1ea47aSStefano Zampini 
44498f1ea47aSStefano Zampini /*@C
445011a5261eSBarry Smith   MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
44518f1ea47aSStefano Zampini 
44520ab4885dSBarry Smith   Not Collective; No Fortran Support
44538f1ea47aSStefano Zampini 
44548f1ea47aSStefano Zampini   Input Parameter:
4455fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
44568f1ea47aSStefano Zampini 
44578f1ea47aSStefano Zampini   Output Parameter:
44588f1ea47aSStefano Zampini . array - pointer to the data
44598f1ea47aSStefano Zampini 
44608f1ea47aSStefano Zampini   Level: intermediate
44618f1ea47aSStefano Zampini 
44621cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
44638f1ea47aSStefano Zampini @*/
44645d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar *array[])
4465d71ae5a4SJacob Faibussowitsch {
4466d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44678f1ea47aSStefano Zampini 
44688f1ea47aSStefano Zampini   PetscFunctionBegin;
4469d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
44709566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4471d67d9f35SJunchao Zhang   } else {
4472d67d9f35SJunchao Zhang     *array = NULL;
4473d67d9f35SJunchao Zhang   }
44743ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4475d67d9f35SJunchao Zhang }
4476d67d9f35SJunchao Zhang 
4477d67d9f35SJunchao Zhang /*@C
447811a5261eSBarry Smith   MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4479d67d9f35SJunchao Zhang 
44800ab4885dSBarry Smith   Not Collective; No Fortran Support
4481d67d9f35SJunchao Zhang 
4482d67d9f35SJunchao Zhang   Input Parameter:
4483fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
4484d67d9f35SJunchao Zhang 
4485d67d9f35SJunchao Zhang   Output Parameter:
4486d67d9f35SJunchao Zhang . array - pointer to the data
4487d67d9f35SJunchao Zhang 
4488d67d9f35SJunchao Zhang   Level: intermediate
4489d67d9f35SJunchao Zhang 
44901cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
4491d67d9f35SJunchao Zhang @*/
44925d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar *array[])
4493d71ae5a4SJacob Faibussowitsch {
4494d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4495d67d9f35SJunchao Zhang 
4496d67d9f35SJunchao Zhang   PetscFunctionBegin;
4497d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
44989566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4499d67d9f35SJunchao Zhang   } else {
4500d67d9f35SJunchao Zhang     *array = aij->a;
4501d67d9f35SJunchao Zhang   }
45029566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
45033ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4504d67d9f35SJunchao Zhang }
4505d67d9f35SJunchao Zhang 
4506d67d9f35SJunchao Zhang /*@C
4507d67d9f35SJunchao Zhang   MatSeqAIJRestoreArrayWrite - restore the read-only access array obtained from MatSeqAIJGetArrayRead
4508d67d9f35SJunchao Zhang 
45090ab4885dSBarry Smith   Not Collective; No Fortran Support
4510d67d9f35SJunchao Zhang 
4511d67d9f35SJunchao Zhang   Input Parameter:
4512fe59aa6dSJacob Faibussowitsch . A - a MATSEQAIJ matrix
4513d67d9f35SJunchao Zhang 
4514d67d9f35SJunchao Zhang   Output Parameter:
4515d67d9f35SJunchao Zhang . array - pointer to the data
4516d67d9f35SJunchao Zhang 
4517d67d9f35SJunchao Zhang   Level: intermediate
4518d67d9f35SJunchao Zhang 
45191cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
4520d67d9f35SJunchao Zhang @*/
45215d83a8b1SBarry Smith PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar *array[])
4522d71ae5a4SJacob Faibussowitsch {
4523d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4524d67d9f35SJunchao Zhang 
4525d67d9f35SJunchao Zhang   PetscFunctionBegin;
4526d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
45279566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4528d67d9f35SJunchao Zhang   } else {
4529d67d9f35SJunchao Zhang     *array = NULL;
4530d67d9f35SJunchao Zhang   }
45313ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45328f1ea47aSStefano Zampini }
45338f1ea47aSStefano Zampini 
45348f1ea47aSStefano Zampini /*@C
453511a5261eSBarry Smith   MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
45367ee59b9bSJunchao Zhang 
45370ab4885dSBarry Smith   Not Collective; No Fortran Support
45387ee59b9bSJunchao Zhang 
45397ee59b9bSJunchao Zhang   Input Parameter:
454011a5261eSBarry Smith . mat - a matrix of type `MATSEQAIJ` or its subclasses
45417ee59b9bSJunchao Zhang 
45427ee59b9bSJunchao Zhang   Output Parameters:
45437ee59b9bSJunchao Zhang + i     - row map array of the matrix
45447ee59b9bSJunchao Zhang . j     - column index array of the matrix
45457ee59b9bSJunchao Zhang . a     - data array of the matrix
4546fe59aa6dSJacob Faibussowitsch - mtype - memory type of the arrays
45477ee59b9bSJunchao Zhang 
4548fe59aa6dSJacob Faibussowitsch   Level: developer
45492ef1f0ffSBarry Smith 
45507ee59b9bSJunchao Zhang   Notes:
45512ef1f0ffSBarry Smith   Any of the output parameters can be `NULL`, in which case the corresponding value is not returned.
45527ee59b9bSJunchao Zhang   If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
45537ee59b9bSJunchao Zhang 
45547ee59b9bSJunchao Zhang   One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
45552ef1f0ffSBarry Smith   If the matrix is assembled, the data array `a` is guaranteed to have the latest values of the matrix.
45567ee59b9bSJunchao Zhang 
45571cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45587ee59b9bSJunchao Zhang @*/
45595d83a8b1SBarry Smith PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt *i[], const PetscInt *j[], PetscScalar *a[], PetscMemType *mtype)
4560d71ae5a4SJacob Faibussowitsch {
45617ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
45627ee59b9bSJunchao Zhang 
45637ee59b9bSJunchao Zhang   PetscFunctionBegin;
45647ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
45657ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
45667ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
45677ee59b9bSJunchao Zhang   } else {
45687ee59b9bSJunchao Zhang     if (i) *i = aij->i;
45697ee59b9bSJunchao Zhang     if (j) *j = aij->j;
45707ee59b9bSJunchao Zhang     if (a) *a = aij->a;
45717ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
45727ee59b9bSJunchao Zhang   }
45733ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45747ee59b9bSJunchao Zhang }
45757ee59b9bSJunchao Zhang 
4576cc4c1da9SBarry Smith /*@
457721e72a00SBarry Smith   MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
457821e72a00SBarry Smith 
457921e72a00SBarry Smith   Not Collective
458021e72a00SBarry Smith 
458121e72a00SBarry Smith   Input Parameter:
4582fe59aa6dSJacob Faibussowitsch . A - a `MATSEQAIJ` matrix
458321e72a00SBarry Smith 
458421e72a00SBarry Smith   Output Parameter:
458521e72a00SBarry Smith . nz - the maximum number of nonzeros in any row
458621e72a00SBarry Smith 
458721e72a00SBarry Smith   Level: intermediate
458821e72a00SBarry Smith 
4589ce78bad3SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRestoreArray()`
459021e72a00SBarry Smith @*/
4591d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4592d71ae5a4SJacob Faibussowitsch {
459321e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
459421e72a00SBarry Smith 
459521e72a00SBarry Smith   PetscFunctionBegin;
459621e72a00SBarry Smith   *nz = aij->rmax;
45973ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
459821e72a00SBarry Smith }
459921e72a00SBarry Smith 
460049abdd8aSBarry Smith static PetscErrorCode MatCOOStructDestroy_SeqAIJ(void **data)
46012c4ab24aSJunchao Zhang {
460249abdd8aSBarry Smith   MatCOOStruct_SeqAIJ *coo = (MatCOOStruct_SeqAIJ *)*data;
46034d86920dSPierre Jolivet 
46042c4ab24aSJunchao Zhang   PetscFunctionBegin;
46052c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->perm));
46062c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo->jmap));
46072c4ab24aSJunchao Zhang   PetscCall(PetscFree(coo));
46082c4ab24aSJunchao Zhang   PetscFunctionReturn(PETSC_SUCCESS);
46092c4ab24aSJunchao Zhang }
46102c4ab24aSJunchao Zhang 
4611d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4612d71ae5a4SJacob Faibussowitsch {
4613394ed5ebSJunchao Zhang   MPI_Comm             comm;
4614394ed5ebSJunchao Zhang   PetscInt            *i, *j;
46150d88f7f4SJunchao Zhang   PetscInt             M, N, row, iprev;
4616394ed5ebSJunchao Zhang   PetscCount           k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4617394ed5ebSJunchao Zhang   PetscInt            *Ai;                             /* Change to PetscCount once we use it for row pointers */
4618394ed5ebSJunchao Zhang   PetscInt            *Aj;
4619394ed5ebSJunchao Zhang   PetscScalar         *Aa;
4620f4f49eeaSPierre Jolivet   Mat_SeqAIJ          *seqaij = (Mat_SeqAIJ *)mat->data;
4621cbc6b225SStefano Zampini   MatType              rtype;
4622394ed5ebSJunchao Zhang   PetscCount          *perm, *jmap;
46232c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
46240d88f7f4SJunchao Zhang   PetscBool            isorted;
46259f0612e4SBarry Smith   PetscBool            hypre;
4626394ed5ebSJunchao Zhang 
4627394ed5ebSJunchao Zhang   PetscFunctionBegin;
46289566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
46299566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4630e8729f6fSJunchao Zhang   i = coo_i;
4631e8729f6fSJunchao Zhang   j = coo_j;
46329566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
46330d88f7f4SJunchao Zhang 
46340d88f7f4SJunchao Zhang   /* Ignore entries with negative row or col indices; at the same time, check if i[] is already sorted (e.g., MatConvert_AlJ_HYPRE results in this case) */
46350d88f7f4SJunchao Zhang   isorted = PETSC_TRUE;
46360d88f7f4SJunchao Zhang   iprev   = PETSC_INT_MIN;
46370d88f7f4SJunchao Zhang   for (k = 0; k < coo_n; k++) {
4638394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
46390d88f7f4SJunchao Zhang     if (isorted) {
46400d88f7f4SJunchao Zhang       if (i[k] < iprev) isorted = PETSC_FALSE;
46410d88f7f4SJunchao Zhang       else iprev = i[k];
46420d88f7f4SJunchao Zhang     }
4643394ed5ebSJunchao Zhang     perm[k] = k;
4644394ed5ebSJunchao Zhang   }
4645394ed5ebSJunchao Zhang 
46460d88f7f4SJunchao Zhang   /* Sort by row if not already */
46470d88f7f4SJunchao Zhang   if (!isorted) PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
46482b35a777SBarry Smith   PetscCheck(coo_n == 0 || i[coo_n - 1] < M, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "COO row index %" PetscInt_FMT " is >= the matrix row size %" PetscInt_FMT, i[coo_n - 1], M);
4649651b1cf9SStefano Zampini 
4650651b1cf9SStefano Zampini   /* Advance k to the first row with a non-negative index */
4651651b1cf9SStefano Zampini   for (k = 0; k < coo_n; k++)
46529371c9d4SSatish Balay     if (i[k] >= 0) break;
4653394ed5ebSJunchao Zhang   nneg = k;
46549566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4655394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
465635cb6cd3SPierre Jolivet   jmap++;                                           /* Inc jmap by 1 for convenience */
4657394ed5ebSJunchao Zhang 
46589f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(M + 1, sizeof(PetscInt), (void **)&Ai)); /* CSR of A */
46599f0612e4SBarry Smith   PetscCall(PetscArrayzero(Ai, M + 1));
46609f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(coo_n - nneg, sizeof(PetscInt), (void **)&Aj)); /* We have at most coo_n-nneg unique nonzeros */
4661394ed5ebSJunchao Zhang 
466221fb621cSStefano Zampini   PetscCall(PetscStrcmp("_internal_COO_mat_for_hypre", ((PetscObject)mat)->name, &hypre));
4663651b1cf9SStefano Zampini 
4664394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
466535cb6cd3SPierre Jolivet   Ai++;  /* Inc by 1 for convenience */
4666394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4667394ed5ebSJunchao Zhang   while (k < coo_n) {
46680d88f7f4SJunchao Zhang     PetscBool strictly_sorted; // this row is strictly sorted?
46690d88f7f4SJunchao Zhang     PetscInt  jprev;
46700d88f7f4SJunchao Zhang 
46710d88f7f4SJunchao Zhang     /* get [start,end) indices for this row; also check if cols in this row are strictly sorted */
4672394ed5ebSJunchao Zhang     row             = i[k];
46730d88f7f4SJunchao Zhang     start           = k;
46740d88f7f4SJunchao Zhang     jprev           = PETSC_INT_MIN;
46750d88f7f4SJunchao Zhang     strictly_sorted = PETSC_TRUE;
46760d88f7f4SJunchao Zhang     while (k < coo_n && i[k] == row) {
46770d88f7f4SJunchao Zhang       if (strictly_sorted) {
46780d88f7f4SJunchao Zhang         if (j[k] <= jprev) strictly_sorted = PETSC_FALSE;
46790d88f7f4SJunchao Zhang         else jprev = j[k];
46800d88f7f4SJunchao Zhang       }
46810d88f7f4SJunchao Zhang       k++;
46820d88f7f4SJunchao Zhang     }
4683394ed5ebSJunchao Zhang     end = k;
46840d88f7f4SJunchao Zhang 
4685651b1cf9SStefano Zampini     /* hack for HYPRE: swap min column to diag so that diagonal values will go first */
4686651b1cf9SStefano Zampini     if (hypre) {
46871690c2aeSBarry Smith       PetscInt  minj    = PETSC_INT_MAX;
4688651b1cf9SStefano Zampini       PetscBool hasdiag = PETSC_FALSE;
46890d88f7f4SJunchao Zhang 
46900d88f7f4SJunchao Zhang       if (strictly_sorted) { // fast path to swap the first and the diag
46910d88f7f4SJunchao Zhang         PetscCount tmp;
46920d88f7f4SJunchao Zhang         for (p = start; p < end; p++) {
46930d88f7f4SJunchao Zhang           if (j[p] == row && p != start) {
46941c265611SJunchao Zhang             j[p]        = j[start]; // swap j[], so that the diagonal value will go first (manipulated by perm[])
46950d88f7f4SJunchao Zhang             j[start]    = row;
46960d88f7f4SJunchao Zhang             tmp         = perm[start];
46971c265611SJunchao Zhang             perm[start] = perm[p]; // also swap perm[] so we can save the call to PetscSortIntWithCountArray() below
46980d88f7f4SJunchao Zhang             perm[p]     = tmp;
46990d88f7f4SJunchao Zhang             break;
47000d88f7f4SJunchao Zhang           }
47010d88f7f4SJunchao Zhang         }
47020d88f7f4SJunchao Zhang       } else {
4703651b1cf9SStefano Zampini         for (p = start; p < end; p++) {
4704651b1cf9SStefano Zampini           hasdiag = (PetscBool)(hasdiag || (j[p] == row));
4705651b1cf9SStefano Zampini           minj    = PetscMin(minj, j[p]);
4706651b1cf9SStefano Zampini         }
47070d88f7f4SJunchao Zhang 
4708651b1cf9SStefano Zampini         if (hasdiag) {
4709651b1cf9SStefano Zampini           for (p = start; p < end; p++) {
4710651b1cf9SStefano Zampini             if (j[p] == minj) j[p] = row;
4711651b1cf9SStefano Zampini             else if (j[p] == row) j[p] = minj;
4712651b1cf9SStefano Zampini           }
4713651b1cf9SStefano Zampini         }
4714651b1cf9SStefano Zampini       }
47150d88f7f4SJunchao Zhang     }
47161c265611SJunchao Zhang     // sort by columns in a row. perm[] indicates their original order
47170d88f7f4SJunchao Zhang     if (!strictly_sorted) PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
47188551dd9cSJunchao Zhang     PetscCheck(end == start || j[end - 1] < N, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "COO column index %" PetscInt_FMT " is >= the matrix column size %" PetscInt_FMT, j[end - 1], N);
4719651b1cf9SStefano Zampini 
47200d88f7f4SJunchao Zhang     if (strictly_sorted) { // fast path to set Aj[], jmap[], Ai[], nnz, q
47210d88f7f4SJunchao Zhang       for (p = start; p < end; p++, q++) {
47220d88f7f4SJunchao Zhang         Aj[q]   = j[p];
47230d88f7f4SJunchao Zhang         jmap[q] = 1;
47240d88f7f4SJunchao Zhang       }
47256497c311SBarry Smith       PetscCall(PetscIntCast(end - start, Ai + row));
47260d88f7f4SJunchao Zhang       nnz += Ai[row]; // q is already advanced
47270d88f7f4SJunchao Zhang     } else {
4728394ed5ebSJunchao Zhang       /* Find number of unique col entries in this row */
4729394ed5ebSJunchao Zhang       Aj[q]   = j[start]; /* Log the first nonzero in this row */
4730651b1cf9SStefano Zampini       jmap[q] = 1;        /* Number of repeats of this nonzero entry */
4731394ed5ebSJunchao Zhang       Ai[row] = 1;
4732394ed5ebSJunchao Zhang       nnz++;
4733394ed5ebSJunchao Zhang 
4734394ed5ebSJunchao Zhang       for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4735394ed5ebSJunchao Zhang         if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4736394ed5ebSJunchao Zhang           q++;
4737394ed5ebSJunchao Zhang           jmap[q] = 1;
4738394ed5ebSJunchao Zhang           Aj[q]   = j[p];
4739394ed5ebSJunchao Zhang           Ai[row]++;
4740394ed5ebSJunchao Zhang           nnz++;
4741394ed5ebSJunchao Zhang         } else {
4742394ed5ebSJunchao Zhang           jmap[q]++;
4743394ed5ebSJunchao Zhang         }
4744394ed5ebSJunchao Zhang       }
4745394ed5ebSJunchao Zhang       q++; /* Move to next row and thus next unique nonzero */
4746394ed5ebSJunchao Zhang     }
47470d88f7f4SJunchao Zhang   }
47480d88f7f4SJunchao Zhang 
4749394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4750394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
47510d88f7f4SJunchao Zhang   jmap--; // Back to the beginning of jmap[]
4752394ed5ebSJunchao Zhang   jmap[0] = 0;
4753394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
47540d88f7f4SJunchao Zhang 
47559f0612e4SBarry Smith   if (nnz < coo_n - nneg) { /* Reallocate with actual number of unique nonzeros */
4756394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4757394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4758394ed5ebSJunchao Zhang 
47599566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
47609566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
47619566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4762394ed5ebSJunchao Zhang     jmap = jmap_new;
4763394ed5ebSJunchao Zhang 
47649f0612e4SBarry Smith     PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscInt), (void **)&Aj_new));
47659566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
47669f0612e4SBarry Smith     PetscCall(PetscShmgetDeallocateArray((void **)&Aj));
4767394ed5ebSJunchao Zhang     Aj = Aj_new;
4768394ed5ebSJunchao Zhang   }
4769394ed5ebSJunchao Zhang 
4770394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4771394ed5ebSJunchao Zhang     PetscCount *perm_new;
4772cbc6b225SStefano Zampini 
47739566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
47749566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
47759566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4776394ed5ebSJunchao Zhang     perm = perm_new;
4777394ed5ebSJunchao Zhang   }
4778394ed5ebSJunchao Zhang 
47799566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
47809f0612e4SBarry Smith   PetscCall(PetscShmgetAllocateArray(nnz, sizeof(PetscScalar), (void **)&Aa));
47819f0612e4SBarry Smith   PetscCall(PetscArrayzero(Aa, nnz));
47829566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4783394ed5ebSJunchao Zhang 
4784394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
47852c4ab24aSJunchao Zhang 
47862c4ab24aSJunchao Zhang   // Put the COO struct in a container and then attach that to the matrix
47872c4ab24aSJunchao Zhang   PetscCall(PetscMalloc1(1, &coo));
47886497c311SBarry Smith   PetscCall(PetscIntCast(nnz, &coo->nz));
47892c4ab24aSJunchao Zhang   coo->n    = coo_n;
47902c4ab24aSJunchao Zhang   coo->Atot = coo_n - nneg; // Annz is seqaij->nz, so no need to record that again
47912c4ab24aSJunchao Zhang   coo->jmap = jmap;         // of length nnz+1
47922c4ab24aSJunchao Zhang   coo->perm = perm;
479303e76207SPierre Jolivet   PetscCall(PetscObjectContainerCompose((PetscObject)mat, "__PETSc_MatCOOStruct_Host", coo, MatCOOStructDestroy_SeqAIJ));
47943ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4795394ed5ebSJunchao Zhang }
4796394ed5ebSJunchao Zhang 
4797d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4798d71ae5a4SJacob Faibussowitsch {
4799394ed5ebSJunchao Zhang   Mat_SeqAIJ          *aseq = (Mat_SeqAIJ *)A->data;
4800394ed5ebSJunchao Zhang   PetscCount           i, j, Annz = aseq->nz;
48012c4ab24aSJunchao Zhang   PetscCount          *perm, *jmap;
4802394ed5ebSJunchao Zhang   PetscScalar         *Aa;
48032c4ab24aSJunchao Zhang   PetscContainer       container;
48042c4ab24aSJunchao Zhang   MatCOOStruct_SeqAIJ *coo;
4805394ed5ebSJunchao Zhang 
4806394ed5ebSJunchao Zhang   PetscFunctionBegin;
48072c4ab24aSJunchao Zhang   PetscCall(PetscObjectQuery((PetscObject)A, "__PETSc_MatCOOStruct_Host", (PetscObject *)&container));
48082c4ab24aSJunchao Zhang   PetscCheck(container, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Not found MatCOOStruct on this matrix");
48092c4ab24aSJunchao Zhang   PetscCall(PetscContainerGetPointer(container, (void **)&coo));
48102c4ab24aSJunchao Zhang   perm = coo->perm;
48112c4ab24aSJunchao Zhang   jmap = coo->jmap;
48129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4813394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4814b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4815b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4816b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4817394ed5ebSJunchao Zhang   }
48189566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
48193ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
4820394ed5ebSJunchao Zhang }
4821394ed5ebSJunchao Zhang 
/* Prototypes of the conversion routines to device matrix types; each is declared only when PETSc is configured
   with the corresponding package. They are registered on the matrix in MatCreate_SeqAIJ(). */
#if defined(PETSC_HAVE_CUDA)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_HIP)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJHIPSPARSE(Mat, MatType, MatReuse, Mat *);
#endif
#if defined(PETSC_HAVE_KOKKOS_KERNELS)
PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *);
#endif
483102fe1965SBarry Smith 
4832d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4833d71ae5a4SJacob Faibussowitsch {
4834273d9f13SBarry Smith   Mat_SeqAIJ *b;
483538baddfdSBarry Smith   PetscMPIInt size;
4836273d9f13SBarry Smith 
4837273d9f13SBarry Smith   PetscFunctionBegin;
48389566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
483908401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4840273d9f13SBarry Smith 
48414dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
48422205254eSKarl Rupp 
4843b0a32e0cSBarry Smith   B->data   = (void *)b;
4844aea10558SJacob Faibussowitsch   B->ops[0] = MatOps_Values;
4845071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
48462205254eSKarl Rupp 
4847f4259b30SLisandro Dalcin   b->row                = NULL;
4848f4259b30SLisandro Dalcin   b->col                = NULL;
4849f4259b30SLisandro Dalcin   b->icol               = NULL;
4850b810aeb4SBarry Smith   b->reallocs           = 0;
485136db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4852f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4853416022c9SBarry Smith   b->nonew              = 0;
4854f4259b30SLisandro Dalcin   b->diag               = NULL;
4855f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4856f4259b30SLisandro Dalcin   B->spptr              = NULL;
4857f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4858f4259b30SLisandro Dalcin   b->idiag              = NULL;
4859f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4860f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
486171f1c65dSBarry Smith   b->omega              = 1.0;
486271f1c65dSBarry Smith   b->fshift             = 0.0;
4863bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4864a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
486517ab2063SBarry Smith 
48669566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4867d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
48689566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
48699566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4870b3866ffcSBarry Smith #endif
48719566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
48729566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
48739566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
48749566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
48759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
48769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
48779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
48789779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
48799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4880191b95cbSRichard Tran Mills #endif
488134b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
48829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
48839566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
48849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
488502fe1965SBarry Smith #endif
4886d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
4887d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijhipsparse_C", MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
4888d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijhipsparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
4889d5e393b6SSuyash Tandon   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijhipsparse_C", MatProductSetFromOptions_SeqAIJ));
4890d5e393b6SSuyash Tandon #endif
48913d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
48929566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
48933d0639e7SStefano Zampini #endif
48949566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4895af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
48969566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4897af8000cdSHong Zhang #endif
4898d1a032dbSPierre Jolivet #if defined(PETSC_HAVE_SCALAPACK) && (defined(PETSC_USE_REAL_SINGLE) || defined(PETSC_USE_REAL_DOUBLE))
48999566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4900d24d4204SJose E. Roman #endif
490163c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
49029566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
49039566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
490463c07aadSStefano Zampini #endif
49059566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
49069566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
49079566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
49089566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
490914e4dea2SJose E. Roman   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsHermitianTranspose_SeqAIJ));
49109566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
49119566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
4912674b392bSAlexander   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetHash_C", MatResetHash_SeqAIJ));
49139566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
49149566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
49159566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
49169566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
49179566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
49189566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
49199566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
49209566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
49219566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
49229566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
49239566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
49243ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
492517ab2063SBarry Smith }
492617ab2063SBarry Smith 
4927b24902e0SBarry Smith /*
49283893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4929b24902e0SBarry Smith */
4930d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4931d71ae5a4SJacob Faibussowitsch {
49322a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4933071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
493417ab2063SBarry Smith 
49353a40ed3dSBarry Smith   PetscFunctionBegin;
4936aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4937273d9f13SBarry Smith 
4938d5f3da31SBarry Smith   C->factortype = A->factortype;
4939f4259b30SLisandro Dalcin   c->row        = NULL;
4940f4259b30SLisandro Dalcin   c->col        = NULL;
4941f4259b30SLisandro Dalcin   c->icol       = NULL;
49426ad4291fSHong Zhang   c->reallocs   = 0;
4943*07425a8dSBarry Smith   c->diagDense  = a->diagDense;
494417ab2063SBarry Smith 
494569272f91SPierre Jolivet   C->assembled = A->assembled;
494617ab2063SBarry Smith 
494769272f91SPierre Jolivet   if (A->preallocated) {
49489566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
49499566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4950eec197d1SBarry Smith 
495131fe6a7dSBarry Smith     if (!A->hash_active) {
49529566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->imax));
49539566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
49549566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m, &c->ilen));
49559566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));
495617ab2063SBarry Smith 
495717ab2063SBarry Smith       /* allocate the matrix space */
4958f77e22a1SHong Zhang       if (mallocmatspace) {
49599f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscScalar), (void **)&c->a));
49609f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(a->i[m], sizeof(PetscInt), (void **)&c->j));
49619f0612e4SBarry Smith         PetscCall(PetscShmgetAllocateArray(m + 1, sizeof(PetscInt), (void **)&c->i));
49629566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->i, a->i, m + 1));
49639f0612e4SBarry Smith         c->free_a  = PETSC_TRUE;
49649f0612e4SBarry Smith         c->free_ij = PETSC_TRUE;
496517ab2063SBarry Smith         if (m > 0) {
49669566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
4967be6bf707SBarry Smith           if (cpvalues == MAT_COPY_VALUES) {
49682e5835c6SStefano Zampini             const PetscScalar *aa;
49692e5835c6SStefano Zampini 
49709566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
49719566063dSJacob Faibussowitsch             PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
49729566063dSJacob Faibussowitsch             PetscCall(MatSeqAIJGetArrayRead(A, &aa));
4973be6bf707SBarry Smith           } else {
49749566063dSJacob Faibussowitsch             PetscCall(PetscArrayzero(c->a, a->i[m]));
497517ab2063SBarry Smith           }
497608480c60SBarry Smith         }
4977f77e22a1SHong Zhang       }
497831fe6a7dSBarry Smith       C->preallocated = PETSC_TRUE;
497931fe6a7dSBarry Smith     } else {
498031fe6a7dSBarry Smith       PetscCheck(mallocmatspace, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_WRONGSTATE, "Cannot malloc matrix memory from a non-preallocated matrix");
498131fe6a7dSBarry Smith       PetscCall(MatSetUp(C));
498231fe6a7dSBarry Smith     }
498317ab2063SBarry Smith 
49846ad4291fSHong Zhang     c->ignorezeroentries = a->ignorezeroentries;
4985416022c9SBarry Smith     c->roworiented       = a->roworiented;
4986416022c9SBarry Smith     c->nonew             = a->nonew;
4987416022c9SBarry Smith     if (a->diag) {
49889566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &c->diag));
49899566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt)));
4990071fcb05SBarry Smith     } else c->diag = NULL;
49912205254eSKarl Rupp 
4992f4259b30SLisandro Dalcin     c->solve_work         = NULL;
4993f4259b30SLisandro Dalcin     c->saved_values       = NULL;
4994f4259b30SLisandro Dalcin     c->idiag              = NULL;
4995f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
4996a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
49976ad4291fSHong Zhang 
4998893ad86cSHong Zhang     c->rmax  = a->rmax;
4999416022c9SBarry Smith     c->nz    = a->nz;
50008ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
5001754ec7b1SSatish Balay 
50026ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
50036ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
5004cd6b891eSBarry Smith     if (a->compressedrow.use) {
50056ad4291fSHong Zhang       i = a->compressedrow.nrows;
50069566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
50079566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
50089566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
500927ea64f8SHong Zhang     } else {
501027ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
50110298fd71SBarry Smith       c->compressedrow.i      = NULL;
50120298fd71SBarry Smith       c->compressedrow.rindex = NULL;
50136ad4291fSHong Zhang     }
5014ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
5015e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
50164846f1f5SKris Buschelman 
50179566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
501869272f91SPierre Jolivet   }
50199566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
50203ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
502117ab2063SBarry Smith }
502217ab2063SBarry Smith 
5023d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
5024d71ae5a4SJacob Faibussowitsch {
5025b24902e0SBarry Smith   PetscFunctionBegin;
50269566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
50279566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
502848a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
50299566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
50309566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
50313ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5032b24902e0SBarry Smith }
5033b24902e0SBarry Smith 
5034d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
5035d71ae5a4SJacob Faibussowitsch {
503652f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
503752f91c60SVaclav Hapla 
503852f91c60SVaclav Hapla   PetscFunctionBegin;
503952f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
504052f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
5041c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
50429566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
50439566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
50449566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
504552f91c60SVaclav Hapla   if (isbinary) {
50469566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
504752f91c60SVaclav Hapla   } else if (ishdf5) {
504852f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
50499566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
505052f91c60SVaclav Hapla #else
505152f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
505252f91c60SVaclav Hapla #endif
505352f91c60SVaclav Hapla   } else {
505498921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
505552f91c60SVaclav Hapla   }
50563ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
505752f91c60SVaclav Hapla }
505852f91c60SVaclav Hapla 
5059d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
5060d71ae5a4SJacob Faibussowitsch {
50613ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
50623ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
5063fbdbba38SShri Abhyankar 
5064fbdbba38SShri Abhyankar   PetscFunctionBegin;
50659566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
5066bbead8a2SBarry Smith 
50673ea6fe3dSLisandro Dalcin   /* read in matrix header */
50689566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
506908401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
50709371c9d4SSatish Balay   M  = header[1];
50719371c9d4SSatish Balay   N  = header[2];
50729371c9d4SSatish Balay   nz = header[3];
507308401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
507408401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
507508401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
5076fbdbba38SShri Abhyankar 
50773ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
50789566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
50793ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
50803ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
50813ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
50823ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
50833ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
50849566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
50859566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
50863ea6fe3dSLisandro Dalcin 
50873ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
50889566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5089aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
50903ea6fe3dSLisandro Dalcin 
5091fbdbba38SShri Abhyankar   /* read in row lengths */
50929566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
50939566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
50943ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
50959371c9d4SSatish Balay   sum = 0;
50969371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
509708401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
50983ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
50999566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
51009566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
5101aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
51023ea6fe3dSLisandro Dalcin   /* store row lengths */
51039566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
51049566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
5105fbdbba38SShri Abhyankar 
51063ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
51079371c9d4SSatish Balay   a->i[0] = 0;
51089371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
51093ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
51109566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
51113ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
51129566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
5113fbdbba38SShri Abhyankar 
51149566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
51159566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
51163ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5117fbdbba38SShri Abhyankar }
5118fbdbba38SShri Abhyankar 
5119d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
5120d71ae5a4SJacob Faibussowitsch {
51217264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
5122fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
5123eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5124eeffb40dSHong Zhang   PetscInt k;
5125eeffb40dSHong Zhang #endif
51267264ac53SSatish Balay 
51273a40ed3dSBarry Smith   PetscFunctionBegin;
5128bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
5129d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
5130ca44d042SBarry Smith     *flg = PETSC_FALSE;
51313ba16761SJacob Faibussowitsch     PetscFunctionReturn(PETSC_SUCCESS);
5132bcd2baecSBarry Smith   }
51337264ac53SSatish Balay 
51347264ac53SSatish Balay   /* if the a->i are the same */
51359566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
51363ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
51377264ac53SSatish Balay 
51387264ac53SSatish Balay   /* if a->j are the same */
51399566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
51403ba16761SJacob Faibussowitsch   if (!*flg) PetscFunctionReturn(PETSC_SUCCESS);
5141bcd2baecSBarry Smith 
51429566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
51439566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5144bcd2baecSBarry Smith   /* if a->a are the same */
5145eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5146eeffb40dSHong Zhang   for (k = 0; k < a->nz; k++) {
5147fff043a9SJunchao Zhang     if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) {
5148eeffb40dSHong Zhang       *flg = PETSC_FALSE;
51493ba16761SJacob Faibussowitsch       PetscFunctionReturn(PETSC_SUCCESS);
5150eeffb40dSHong Zhang     }
5151eeffb40dSHong Zhang   }
5152eeffb40dSHong Zhang #else
51539566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
5154eeffb40dSHong Zhang #endif
51559566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
51569566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
51573ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
51587264ac53SSatish Balay }
515936db0b34SBarry Smith 
516005869f15SSatish Balay /*@
  MatCreateSeqAIJWithArrays - Creates a sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
516236db0b34SBarry Smith   provided by the user.
516336db0b34SBarry Smith 
5164d083f849SBarry Smith   Collective
516536db0b34SBarry Smith 
516636db0b34SBarry Smith   Input Parameters:
516736db0b34SBarry Smith + comm - must be an MPI communicator of size 1
516836db0b34SBarry Smith . m    - number of rows
516936db0b34SBarry Smith . n    - number of columns
5170483a2f95SBarry Smith . i    - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
517136db0b34SBarry Smith . j    - column indices
517236db0b34SBarry Smith - a    - matrix values
517336db0b34SBarry Smith 
517436db0b34SBarry Smith   Output Parameter:
517536db0b34SBarry Smith . mat - the matrix
517636db0b34SBarry Smith 
517736db0b34SBarry Smith   Level: intermediate
517836db0b34SBarry Smith 
517936db0b34SBarry Smith   Notes:
51802ef1f0ffSBarry Smith   The `i`, `j`, and `a` arrays are not copied by this routine, the user must free these arrays
5181292fb18eSBarry Smith   once the matrix is destroyed and not before
518236db0b34SBarry Smith 
518336db0b34SBarry Smith   You cannot set new nonzero locations into this matrix, that will generate an error.
518436db0b34SBarry Smith 
51852ef1f0ffSBarry Smith   The `i` and `j` indices are 0 based
518636db0b34SBarry Smith 
  The format which is used for the sparse matrix input is equivalent to a
  row-major ordering, i.e., for the following matrix, the input data expected is
  as shown
51902ef1f0ffSBarry Smith .vb
51912ef1f0ffSBarry Smith         1 0 0
51922ef1f0ffSBarry Smith         2 0 3
51932ef1f0ffSBarry Smith         4 5 6
5194a4552177SSatish Balay 
51952ef1f0ffSBarry Smith         i =  {0,1,3,6}  [size = nrow+1  = 3+1]
51962ef1f0ffSBarry Smith         j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
51972ef1f0ffSBarry Smith         v =  {1,2,3,4,5,6}  [size = 6]
51982ef1f0ffSBarry Smith .ve
5199a4552177SSatish Balay 
52001cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
520136db0b34SBarry Smith @*/
5202d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5203d71ae5a4SJacob Faibussowitsch {
5204cbcfb4deSHong Zhang   PetscInt    ii;
520536db0b34SBarry Smith   Mat_SeqAIJ *aij;
5206cbcfb4deSHong Zhang   PetscInt    jj;
520736db0b34SBarry Smith 
520836db0b34SBarry Smith   PetscFunctionBegin;
5209aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
52109566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52119566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52129566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
52139566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5215ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
52169566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
52179566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5218ab93d7beSBarry Smith 
521936db0b34SBarry Smith   aij->i       = i;
522036db0b34SBarry Smith   aij->j       = j;
522136db0b34SBarry Smith   aij->a       = a;
522236db0b34SBarry Smith   aij->nonew   = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5223e6b907acSBarry Smith   aij->free_a  = PETSC_FALSE;
5224e6b907acSBarry Smith   aij->free_ij = PETSC_FALSE;
522536db0b34SBarry Smith 
5226cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
522736db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
522876bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5229aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
52309985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
523108401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
523208401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
52339985e31cSBarry Smith       }
523436db0b34SBarry Smith     }
523576bd3646SJed Brown   }
523676bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
523736db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
523808401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5239da0802e2SStefano Zampini       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT " last column = %" PetscInt_FMT, ii, j[ii], n - 1);
524036db0b34SBarry Smith     }
524176bd3646SJed Brown   }
524236db0b34SBarry Smith 
52439566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
52449566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
52453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
524636db0b34SBarry Smith }
5247cbc6b225SStefano Zampini 
5248f62e3866SBarry Smith /*@
  MatCreateSeqAIJFromTriple - Creates a sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
52508a0b0e6bSVictor Minden   provided by the user.
52518a0b0e6bSVictor Minden 
5252d083f849SBarry Smith   Collective
52538a0b0e6bSVictor Minden 
52548a0b0e6bSVictor Minden   Input Parameters:
52558a0b0e6bSVictor Minden + comm - must be an MPI communicator of size 1
52568a0b0e6bSVictor Minden . m    - number of rows
52578a0b0e6bSVictor Minden . n    - number of columns
52588a0b0e6bSVictor Minden . i    - row indices
52598a0b0e6bSVictor Minden . j    - column indices
52601230e6d1SVictor Minden . a    - matrix values
52611230e6d1SVictor Minden . nz   - number of nonzeros
52622ef1f0ffSBarry Smith - idx  - if the `i` and `j` indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
52638a0b0e6bSVictor Minden 
52648a0b0e6bSVictor Minden   Output Parameter:
52658a0b0e6bSVictor Minden . mat - the matrix
52668a0b0e6bSVictor Minden 
52678a0b0e6bSVictor Minden   Level: intermediate
52688a0b0e6bSVictor Minden 
5269f62e3866SBarry Smith   Example:
5270f62e3866SBarry Smith   For the following matrix, the input data expected is as shown (using 0 based indexing)
52719e99939fSJunchao Zhang .vb
52728a0b0e6bSVictor Minden         1 0 0
52738a0b0e6bSVictor Minden         2 0 3
52748a0b0e6bSVictor Minden         4 5 6
52758a0b0e6bSVictor Minden 
52768a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
52778a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
52788a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
52799e99939fSJunchao Zhang .ve
5280fe59aa6dSJacob Faibussowitsch 
52812ef1f0ffSBarry Smith   Note:
5282d7547e51SJunchao Zhang   Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5283d7547e51SJunchao Zhang   and are particularly useful in iterative applications.
52848a0b0e6bSVictor Minden 
52851cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
52868a0b0e6bSVictor Minden @*/
5287ce78bad3SBarry Smith PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscCount nz, PetscBool idx)
5288d71ae5a4SJacob Faibussowitsch {
5289d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
52908a0b0e6bSVictor Minden 
52918a0b0e6bSVictor Minden   PetscFunctionBegin;
52929566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5293ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
52949566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
52959566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
52969566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
52979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
52981230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
52991230e6d1SVictor Minden     if (idx) {
53001230e6d1SVictor Minden       row = i[ii] - 1;
53011230e6d1SVictor Minden       col = j[ii] - 1;
53021230e6d1SVictor Minden     } else {
53031230e6d1SVictor Minden       row = i[ii];
53041230e6d1SVictor Minden       col = j[ii];
53058a0b0e6bSVictor Minden     }
53069566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
53078a0b0e6bSVictor Minden   }
53089566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
53099566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
53109566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
53113ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
53128a0b0e6bSVictor Minden }
531336db0b34SBarry Smith 
/*
    SeqAIJ entry point for concatenating sequential matrices into a parallel one;
    all arguments are forwarded unchanged to MatCreateMPIMatConcatenateSeqMat_MPIAIJ()
*/
PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
{
  PetscFunctionBegin;
  PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
  PetscFunctionReturn(PETSC_SUCCESS);
}
53209c8f2541SHong Zhang 
532181824310SBarry Smith /*
532253dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
532353dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
532453dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
532553dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
532653dd7562SDmitry Karpeev  */
5327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5328d71ae5a4SJacob Faibussowitsch {
532953dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
533053dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
533153dd7562SDmitry Karpeev   PetscBool       seqaij;
533253dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
533353dd7562SDmitry Karpeev   PetscScalar     v;
533453dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
533553dd7562SDmitry Karpeev 
533653dd7562SDmitry Karpeev   PetscFunctionBegin;
53373ba16761SJacob Faibussowitsch   if (!B) PetscFunctionReturn(PETSC_SUCCESS);
533853dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
53399566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
534028b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
534153dd7562SDmitry Karpeev   if (rowemb) {
53429566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
534308401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
534453dd7562SDmitry Karpeev   } else {
534508401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
534653dd7562SDmitry Karpeev   }
534753dd7562SDmitry Karpeev   if (colemb) {
53489566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
534908401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
535053dd7562SDmitry Karpeev   } else {
535108401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
535253dd7562SDmitry Karpeev   }
535353dd7562SDmitry Karpeev 
5354f4f49eeaSPierre Jolivet   Baij = (Mat_SeqAIJ *)B->data;
535553dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
53569566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5357ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
53589566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
53599566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
536053dd7562SDmitry Karpeev   }
536148a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
536253dd7562SDmitry Karpeev   count      = 0;
536353dd7562SDmitry Karpeev   rowindices = NULL;
536453dd7562SDmitry Karpeev   colindices = NULL;
536548a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
536648a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
536753dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
536853dd7562SDmitry Karpeev     PetscInt row;
536953dd7562SDmitry Karpeev     row = i;
537053dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
537153dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
537253dd7562SDmitry Karpeev       PetscInt col;
537353dd7562SDmitry Karpeev       col = Baij->j[count];
537453dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
537553dd7562SDmitry Karpeev       v = Baij->a[count];
53769566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
537753dd7562SDmitry Karpeev       ++count;
537853dd7562SDmitry Karpeev     }
537953dd7562SDmitry Karpeev   }
538053dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
538153dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
538253dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
538353dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
538453dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
53853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
538653dd7562SDmitry Karpeev }
538753dd7562SDmitry Karpeev 
538858c11ad4SPierre Jolivet PetscErrorCode MatEliminateZeros_SeqAIJ(Mat A, PetscBool keep)
5389dec0b466SHong Zhang {
5390dec0b466SHong Zhang   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
5391dec0b466SHong Zhang   MatScalar  *aa = a->a;
5392dec0b466SHong Zhang   PetscInt    m = A->rmap->n, fshift = 0, fshift_prev = 0, i, k;
5393dec0b466SHong Zhang   PetscInt   *ailen = a->ilen, *imax = a->imax, *ai = a->i, *aj = a->j, rmax = 0;
5394dec0b466SHong Zhang 
5395dec0b466SHong Zhang   PetscFunctionBegin;
5396dec0b466SHong Zhang   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot eliminate zeros for unassembled matrix");
5397dec0b466SHong Zhang   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
5398dec0b466SHong Zhang   for (i = 1; i <= m; i++) {
5399dec0b466SHong Zhang     /* move each nonzero entry back by the amount of zero slots (fshift) before it*/
5400dec0b466SHong Zhang     for (k = ai[i - 1]; k < ai[i]; k++) {
540158c11ad4SPierre Jolivet       if (aa[k] == 0 && (aj[k] != i - 1 || !keep)) fshift++;
5402dec0b466SHong Zhang       else {
5403dec0b466SHong Zhang         if (aa[k] == 0 && aj[k] == i - 1) PetscCall(PetscInfo(A, "Keep the diagonal zero at row %" PetscInt_FMT "\n", i - 1));
5404dec0b466SHong Zhang         aa[k - fshift] = aa[k];
5405dec0b466SHong Zhang         aj[k - fshift] = aj[k];
5406dec0b466SHong Zhang       }
5407dec0b466SHong Zhang     }
5408dec0b466SHong Zhang     ai[i - 1] -= fshift_prev; // safe to update ai[i-1] now since it will not be used in the next iteration
5409dec0b466SHong Zhang     fshift_prev = fshift;
5410dec0b466SHong Zhang     /* reset ilen and imax for each row */
5411dec0b466SHong Zhang     ailen[i - 1] = imax[i - 1] = ai[i] - fshift - ai[i - 1];
5412dec0b466SHong Zhang     a->nonzerorowcnt += ((ai[i] - fshift - ai[i - 1]) > 0);
5413dec0b466SHong Zhang     rmax = PetscMax(rmax, ailen[i - 1]);
5414dec0b466SHong Zhang   }
5415312eded4SPierre Jolivet   if (fshift) {
5416dec0b466SHong Zhang     if (m) {
5417dec0b466SHong Zhang       ai[m] -= fshift;
5418dec0b466SHong Zhang       a->nz = ai[m];
5419dec0b466SHong Zhang     }
5420dec0b466SHong Zhang     PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; zeros eliminated: %" PetscInt_FMT "; nonzeros left: %" PetscInt_FMT "\n", m, A->cmap->n, fshift, a->nz));
5421312eded4SPierre Jolivet     A->nonzerostate++;
5422dec0b466SHong Zhang     A->info.nz_unneeded += (PetscReal)fshift;
5423dec0b466SHong Zhang     a->rmax = rmax;
5424dec0b466SHong Zhang     if (a->inode.use && a->inode.checked) PetscCall(MatSeqAIJCheckInode(A));
5425dec0b466SHong Zhang     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
5426dec0b466SHong Zhang     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
5427312eded4SPierre Jolivet   }
54283ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
5429dec0b466SHong Zhang }
5430dec0b466SHong Zhang 
54314099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
54324099cc6bSBarry Smith 
5433cc4c1da9SBarry Smith /*@
543411a5261eSBarry Smith   MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
54354099cc6bSBarry Smith 
5436c3339decSBarry Smith   Collective
54374099cc6bSBarry Smith 
54384099cc6bSBarry Smith   Input Parameters:
54394099cc6bSBarry Smith + mat    - the matrix object
54404099cc6bSBarry Smith - matype - matrix type
54414099cc6bSBarry Smith 
54424099cc6bSBarry Smith   Options Database Key:
54434e187271SRichard Tran Mills . -mat_seqaij_type  <method> - for example seqaijcrl
54444099cc6bSBarry Smith 
54454099cc6bSBarry Smith   Level: intermediate
54464099cc6bSBarry Smith 
5447fe59aa6dSJacob Faibussowitsch .seealso: [](ch_matrices), `Mat`, `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`
54484099cc6bSBarry Smith @*/
5449d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5450d71ae5a4SJacob Faibussowitsch {
54514099cc6bSBarry Smith   PetscBool sametype;
54525f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
54534099cc6bSBarry Smith 
54544099cc6bSBarry Smith   PetscFunctionBegin;
54554099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
54569566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
54573ba16761SJacob Faibussowitsch   if (sametype) PetscFunctionReturn(PETSC_SUCCESS);
54584099cc6bSBarry Smith 
54599566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
54606adde796SStefano Zampini   PetscCheck(r, PetscObjectComm((PetscObject)mat), PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
54619566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
54623ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
54634099cc6bSBarry Smith }
54644099cc6bSBarry Smith 
54654099cc6bSBarry Smith /*@C
546611a5261eSBarry Smith   MatSeqAIJRegister -  - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices
54674099cc6bSBarry Smith 
5468cc4c1da9SBarry Smith   Not Collective, No Fortran Support
54694099cc6bSBarry Smith 
54704099cc6bSBarry Smith   Input Parameters:
5471fe59aa6dSJacob Faibussowitsch + sname    - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
54724099cc6bSBarry Smith - function - routine to convert to subtype
54734099cc6bSBarry Smith 
54742ef1f0ffSBarry Smith   Level: advanced
54752ef1f0ffSBarry Smith 
54764099cc6bSBarry Smith   Notes:
547711a5261eSBarry Smith   `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers.
54784099cc6bSBarry Smith 
54794099cc6bSBarry Smith   Then, your matrix can be chosen with the procedural interface at runtime via the option
5480b44f4de4SBarry Smith .vb
5481b44f4de4SBarry Smith   -mat_seqaij_type my_mat
5482b44f4de4SBarry Smith .ve
54834099cc6bSBarry Smith 
54841cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatSeqAIJRegisterAll()`
54854099cc6bSBarry Smith @*/
5486d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
5487d71ae5a4SJacob Faibussowitsch {
54884099cc6bSBarry Smith   PetscFunctionBegin;
54899566063dSJacob Faibussowitsch   PetscCall(MatInitializePackage());
54909566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
54913ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
54924099cc6bSBarry Smith }
54934099cc6bSBarry Smith 
54944099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
54954099cc6bSBarry Smith 
54964099cc6bSBarry Smith /*@C
549711a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
54984099cc6bSBarry Smith 
54994099cc6bSBarry Smith   Not Collective
55004099cc6bSBarry Smith 
55014099cc6bSBarry Smith   Level: advanced
55024099cc6bSBarry Smith 
55032ef1f0ffSBarry Smith   Note:
55042ef1f0ffSBarry Smith   This registers the versions of `MATSEQAIJ` for GPUs
55052ef1f0ffSBarry Smith 
55061cc06b55SBarry Smith .seealso: [](ch_matrices), `Mat`, `MatRegisterAll()`, `MatSeqAIJRegister()`
55074099cc6bSBarry Smith @*/
5508d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5509d71ae5a4SJacob Faibussowitsch {
55104099cc6bSBarry Smith   PetscFunctionBegin;
55113ba16761SJacob Faibussowitsch   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(PETSC_SUCCESS);
55124099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
55134099cc6bSBarry Smith 
55149566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
55159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
55169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
55179779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
55189566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5519485f9817SRichard Tran Mills #endif
55205063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
55219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
55225063d097SStefano Zampini #endif
5523d5e393b6SSuyash Tandon #if defined(PETSC_HAVE_HIP)
5524d5e393b6SSuyash Tandon   PetscCall(MatSeqAIJRegister(MATSEQAIJHIPSPARSE, MatConvert_SeqAIJ_SeqAIJHIPSPARSE));
5525d5e393b6SSuyash Tandon #endif
55265063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
55279566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
55285063d097SStefano Zampini #endif
55294099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
55309566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
55314099cc6bSBarry Smith #endif
55323ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
55334099cc6bSBarry Smith }
553453dd7562SDmitry Karpeev 
/*
    Special version for direct calls from Fortran
*/
#if defined(PETSC_HAVE_FORTRAN_CAPS)
  #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
#elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
  #define matsetvaluesseqaij_ matsetvaluesseqaij
#endif

/*
   Redefine the error-handling macros so they can be used inside a function returning void:
   instead of returning the error code, they store it in *_ierr and return.
   PetscCall() below is identical to PetscCallVoid, except it assigns to *_ierr.
*/
#undef PetscCall
#define PetscCall(...) \
  do { \
    PetscErrorCode ierr_msv_seqaij = __VA_ARGS__; \
    if (PetscUnlikely(ierr_msv_seqaij)) { \
      *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_seqaij, PETSC_ERROR_REPEAT, " "); \
      return; \
    } \
  } while (0)

#undef SETERRQ
#define SETERRQ(comm, ierr, ...) \
  do { \
    *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
    return; \
  } while (0)
556481824310SBarry Smith 
5565d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5566d71ae5a4SJacob Faibussowitsch {
556781824310SBarry Smith   Mat         A = *AA;
556881824310SBarry Smith   PetscInt    m = *mm, n = *nn;
556981824310SBarry Smith   InsertMode  is = *isis;
557081824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
557181824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
557281824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
557381824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
557454f21887SBarry Smith   MatScalar  *ap, value, *aa;
5575ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5576ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
557781824310SBarry Smith 
557881824310SBarry Smith   PetscFunctionBegin;
55794994cf47SJed Brown   MatCheckPreallocated(A, 1);
558081824310SBarry Smith   imax  = a->imax;
558181824310SBarry Smith   ai    = a->i;
558281824310SBarry Smith   ailen = a->ilen;
558381824310SBarry Smith   aj    = a->j;
558481824310SBarry Smith   aa    = a->a;
558581824310SBarry Smith 
558681824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
558781824310SBarry Smith     row = im[k];
558881824310SBarry Smith     if (row < 0) continue;
55895f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
55909371c9d4SSatish Balay     rp   = aj + ai[row];
55919371c9d4SSatish Balay     ap   = aa + ai[row];
55929371c9d4SSatish Balay     rmax = imax[row];
55939371c9d4SSatish Balay     nrow = ailen[row];
559481824310SBarry Smith     low  = 0;
559581824310SBarry Smith     high = nrow;
559681824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
559781824310SBarry Smith       if (in[l] < 0) continue;
55985f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
559981824310SBarry Smith       col = in[l];
56002205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
56012205254eSKarl Rupp       else value = v[k + l * m];
56022205254eSKarl Rupp 
560381824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
560481824310SBarry Smith 
56052205254eSKarl Rupp       if (col <= lastcol) low = 0;
56062205254eSKarl Rupp       else high = nrow;
560781824310SBarry Smith       lastcol = col;
560881824310SBarry Smith       while (high - low > 5) {
560981824310SBarry Smith         t = (low + high) / 2;
561081824310SBarry Smith         if (rp[t] > col) high = t;
561181824310SBarry Smith         else low = t;
561281824310SBarry Smith       }
561381824310SBarry Smith       for (i = low; i < high; i++) {
561481824310SBarry Smith         if (rp[i] > col) break;
561581824310SBarry Smith         if (rp[i] == col) {
561681824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
561781824310SBarry Smith           else ap[i] = value;
561881824310SBarry Smith           goto noinsert;
561981824310SBarry Smith         }
562081824310SBarry Smith       }
562181824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
562281824310SBarry Smith       if (nonew == 1) goto noinsert;
56235f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5624fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
56259371c9d4SSatish Balay       N = nrow++ - 1;
56269371c9d4SSatish Balay       a->nz++;
56279371c9d4SSatish Balay       high++;
562881824310SBarry Smith       /* shift up all the later entries in this row */
562981824310SBarry Smith       for (ii = N; ii >= i; ii--) {
563081824310SBarry Smith         rp[ii + 1] = rp[ii];
563181824310SBarry Smith         ap[ii + 1] = ap[ii];
563281824310SBarry Smith       }
563381824310SBarry Smith       rp[i] = col;
563481824310SBarry Smith       ap[i] = value;
563581824310SBarry Smith     noinsert:;
563681824310SBarry Smith       low = i + 1;
563781824310SBarry Smith     }
563881824310SBarry Smith     ailen[row] = nrow;
563981824310SBarry Smith   }
564081824310SBarry Smith   PetscFunctionReturnVoid();
564181824310SBarry Smith }
564298921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No
564398921bdaSJacob Faibussowitsch  * other PETSc functions should be defined past this point, as it is impossible to recover the
564498921bdaSJacob Faibussowitsch  * original definitions */
56459566063dSJacob Faibussowitsch #undef PetscCall
564698921bdaSJacob Faibussowitsch #undef SETERRQ
5647