xref: /petsc/src/mat/impls/aij/seq/aij.c (revision d7547e516efde0cd36ffdeebcfafd4768debadcc)
1d5d45c9bSBarry Smith /*
23369ce9aSBarry Smith     Defines the basic matrix operations for the AIJ (compressed row)
3d5d45c9bSBarry Smith   matrix storage format.
4d5d45c9bSBarry Smith */
53369ce9aSBarry Smith 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h> /*I "petscmat.h" I*/
7c6db04a5SJed Brown #include <petscblaslapack.h>
8c6db04a5SJed Brown #include <petscbt.h>
9af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
100716a85fSBarry Smith 
11d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
12d71ae5a4SJacob Faibussowitsch {
134099cc6bSBarry Smith   PetscBool flg;
144099cc6bSBarry Smith   char      type[256];
154099cc6bSBarry Smith 
164099cc6bSBarry Smith   PetscFunctionBegin;
17d0609cedSBarry Smith   PetscObjectOptionsBegin((PetscObject)A);
189566063dSJacob Faibussowitsch   PetscCall(PetscOptionsFList("-mat_seqaij_type", "Matrix SeqAIJ type", "MatSeqAIJSetType", MatSeqAIJList, "seqaij", type, 256, &flg));
199566063dSJacob Faibussowitsch   if (flg) PetscCall(MatSeqAIJSetType(A, type));
20d0609cedSBarry Smith   PetscOptionsEnd();
214099cc6bSBarry Smith   PetscFunctionReturn(0);
224099cc6bSBarry Smith }
234099cc6bSBarry Smith 
24d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnReductions_SeqAIJ(Mat A, PetscInt type, PetscReal *reductions)
25d71ae5a4SJacob Faibussowitsch {
260716a85fSBarry Smith   PetscInt    i, m, n;
270716a85fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
280716a85fSBarry Smith 
290716a85fSBarry Smith   PetscFunctionBegin;
309566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &m, &n));
319566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(reductions, n));
320716a85fSBarry Smith   if (type == NORM_2) {
33ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i] * aij->a[i]);
340716a85fSBarry Smith   } else if (type == NORM_1) {
35ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscAbsScalar(aij->a[i]);
360716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
37ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]), reductions[aij->j[i]]);
38857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_REALPART || type == REDUCTION_MEAN_REALPART) {
39ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscRealPart(aij->a[i]);
40857cbf51SRichard Tran Mills   } else if (type == REDUCTION_SUM_IMAGINARYPART || type == REDUCTION_MEAN_IMAGINARYPART) {
41ad540459SPierre Jolivet     for (i = 0; i < aij->i[m]; i++) reductions[aij->j[i]] += PetscImaginaryPart(aij->a[i]);
42857cbf51SRichard Tran Mills   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Unknown reduction type");
430716a85fSBarry Smith 
440716a85fSBarry Smith   if (type == NORM_2) {
45a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] = PetscSqrtReal(reductions[i]);
46857cbf51SRichard Tran Mills   } else if (type == REDUCTION_MEAN_REALPART || type == REDUCTION_MEAN_IMAGINARYPART) {
47a873a8cdSSam Reynolds     for (i = 0; i < n; i++) reductions[i] /= m;
480716a85fSBarry Smith   }
490716a85fSBarry Smith   PetscFunctionReturn(0);
500716a85fSBarry Smith }
510716a85fSBarry Smith 
52d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A, IS *is)
53d71ae5a4SJacob Faibussowitsch {
543a062f41SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
553a062f41SBarry Smith   PetscInt        i, m = A->rmap->n, cnt = 0, bs = A->rmap->bs;
563a062f41SBarry Smith   const PetscInt *jj = a->j, *ii = a->i;
573a062f41SBarry Smith   PetscInt       *rows;
583a062f41SBarry Smith 
593a062f41SBarry Smith   PetscFunctionBegin;
603a062f41SBarry Smith   for (i = 0; i < m; i++) {
61ad540459SPierre Jolivet     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) cnt++;
623a062f41SBarry Smith   }
639566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
643a062f41SBarry Smith   cnt = 0;
653a062f41SBarry Smith   for (i = 0; i < m; i++) {
663a062f41SBarry Smith     if ((ii[i] != ii[i + 1]) && ((jj[ii[i]] < bs * (i / bs)) || (jj[ii[i + 1] - 1] > bs * ((i + bs) / bs) - 1))) {
673a062f41SBarry Smith       rows[cnt] = i;
683a062f41SBarry Smith       cnt++;
693a062f41SBarry Smith     }
703a062f41SBarry Smith   }
719566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, is));
723a062f41SBarry Smith   PetscFunctionReturn(0);
733a062f41SBarry Smith }
743a062f41SBarry Smith 
75d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A, PetscInt *nrows, PetscInt **zrows)
76d71ae5a4SJacob Faibussowitsch {
776ce1633cSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
78fff043a9SJunchao Zhang   const MatScalar *aa;
796ce1633cSBarry Smith   PetscInt         i, m = A->rmap->n, cnt = 0;
80b2db7409Sstefano_zampini   const PetscInt  *ii = a->i, *jj = a->j, *diag;
816ce1633cSBarry Smith   PetscInt        *rows;
826ce1633cSBarry Smith 
836ce1633cSBarry Smith   PetscFunctionBegin;
849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
859566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
866ce1633cSBarry Smith   diag = a->diag;
876ce1633cSBarry Smith   for (i = 0; i < m; i++) {
88ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) cnt++;
896ce1633cSBarry Smith   }
909566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(cnt, &rows));
916ce1633cSBarry Smith   cnt = 0;
926ce1633cSBarry Smith   for (i = 0; i < m; i++) {
93ad540459SPierre Jolivet     if ((diag[i] >= ii[i + 1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) rows[cnt++] = i;
946ce1633cSBarry Smith   }
95f1f41ecbSJed Brown   *nrows = cnt;
96f1f41ecbSJed Brown   *zrows = rows;
979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
98f1f41ecbSJed Brown   PetscFunctionReturn(0);
99f1f41ecbSJed Brown }
100f1f41ecbSJed Brown 
101d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A, IS *zrows)
102d71ae5a4SJacob Faibussowitsch {
103f1f41ecbSJed Brown   PetscInt nrows, *rows;
104f1f41ecbSJed Brown 
105f1f41ecbSJed Brown   PetscFunctionBegin;
1060298fd71SBarry Smith   *zrows = NULL;
1079566063dSJacob Faibussowitsch   PetscCall(MatFindZeroDiagonals_SeqAIJ_Private(A, &nrows, &rows));
1089566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PetscObjectComm((PetscObject)A), nrows, rows, PETSC_OWN_POINTER, zrows));
1096ce1633cSBarry Smith   PetscFunctionReturn(0);
1106ce1633cSBarry Smith }
1116ce1633cSBarry Smith 
112d71ae5a4SJacob Faibussowitsch PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A, IS *keptrows)
113d71ae5a4SJacob Faibussowitsch {
114b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
115b3a44c85SBarry Smith   const MatScalar *aa;
116b3a44c85SBarry Smith   PetscInt         m = A->rmap->n, cnt = 0;
117b3a44c85SBarry Smith   const PetscInt  *ii;
118b3a44c85SBarry Smith   PetscInt         n, i, j, *rows;
119b3a44c85SBarry Smith 
120b3a44c85SBarry Smith   PetscFunctionBegin;
1219566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
122f4259b30SLisandro Dalcin   *keptrows = NULL;
123b3a44c85SBarry Smith   ii        = a->i;
124b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
125b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
126b3a44c85SBarry Smith     if (!n) {
127b3a44c85SBarry Smith       cnt++;
128b3a44c85SBarry Smith       goto ok1;
129b3a44c85SBarry Smith     }
1302e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
131b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
132b3a44c85SBarry Smith     }
133b3a44c85SBarry Smith     cnt++;
134b3a44c85SBarry Smith   ok1:;
135b3a44c85SBarry Smith   }
1362e5835c6SStefano Zampini   if (!cnt) {
1379566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1382e5835c6SStefano Zampini     PetscFunctionReturn(0);
1392e5835c6SStefano Zampini   }
1409566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(A->rmap->n - cnt, &rows));
141b3a44c85SBarry Smith   cnt = 0;
142b3a44c85SBarry Smith   for (i = 0; i < m; i++) {
143b3a44c85SBarry Smith     n = ii[i + 1] - ii[i];
144b3a44c85SBarry Smith     if (!n) continue;
1452e5835c6SStefano Zampini     for (j = ii[i]; j < ii[i + 1]; j++) {
146b3a44c85SBarry Smith       if (aa[j] != 0.0) {
147b3a44c85SBarry Smith         rows[cnt++] = i;
148b3a44c85SBarry Smith         break;
149b3a44c85SBarry Smith       }
150b3a44c85SBarry Smith     }
151b3a44c85SBarry Smith   }
1529566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1539566063dSJacob Faibussowitsch   PetscCall(ISCreateGeneral(PETSC_COMM_SELF, cnt, rows, PETSC_OWN_POINTER, keptrows));
154b3a44c85SBarry Smith   PetscFunctionReturn(0);
155b3a44c85SBarry Smith }
156b3a44c85SBarry Smith 
157d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalSet_SeqAIJ(Mat Y, Vec D, InsertMode is)
158d71ae5a4SJacob Faibussowitsch {
15979299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)Y->data;
16099e65526SBarry Smith   PetscInt           i, m = Y->rmap->n;
16199e65526SBarry Smith   const PetscInt    *diag;
1622e5835c6SStefano Zampini   MatScalar         *aa;
16399e65526SBarry Smith   const PetscScalar *v;
164ace3abfcSBarry Smith   PetscBool          missing;
16579299369SBarry Smith 
16679299369SBarry Smith   PetscFunctionBegin;
16709f38230SBarry Smith   if (Y->assembled) {
1689566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(Y, &missing, NULL));
16909f38230SBarry Smith     if (!missing) {
17079299369SBarry Smith       diag = aij->diag;
1719566063dSJacob Faibussowitsch       PetscCall(VecGetArrayRead(D, &v));
1729566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJGetArray(Y, &aa));
17379299369SBarry Smith       if (is == INSERT_VALUES) {
174ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] = v[i];
17579299369SBarry Smith       } else {
176ad540459SPierre Jolivet         for (i = 0; i < m; i++) aa[diag[i]] += v[i];
17779299369SBarry Smith       }
1789566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJRestoreArray(Y, &aa));
1799566063dSJacob Faibussowitsch       PetscCall(VecRestoreArrayRead(D, &v));
18079299369SBarry Smith       PetscFunctionReturn(0);
18179299369SBarry Smith     }
1829566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
18309f38230SBarry Smith   }
1849566063dSJacob Faibussowitsch   PetscCall(MatDiagonalSet_Default(Y, D, is));
18509f38230SBarry Smith   PetscFunctionReturn(0);
18609f38230SBarry Smith }
18779299369SBarry Smith 
188d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *m, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
189d71ae5a4SJacob Faibussowitsch {
190416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
19197f1f81fSBarry Smith   PetscInt    i, ishift;
19217ab2063SBarry Smith 
1933a40ed3dSBarry Smith   PetscFunctionBegin;
194f1f2ae84SBarry Smith   if (m) *m = A->rmap->n;
1953a40ed3dSBarry Smith   if (!ia) PetscFunctionReturn(0);
196bfeeae90SHong Zhang   ishift = 0;
197b94d7dedSBarry Smith   if (symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) {
1989566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, ishift, oshift, (PetscInt **)ia, (PetscInt **)ja));
199bfeeae90SHong Zhang   } else if (oshift == 1) {
2001a83f524SJed Brown     PetscInt *tia;
201d0f46423SBarry Smith     PetscInt  nz = a->i[A->rmap->n];
2023b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
2039566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &tia));
2041a83f524SJed Brown     for (i = 0; i < A->rmap->n + 1; i++) tia[i] = a->i[i] + 1;
2051a83f524SJed Brown     *ia = tia;
206ecc77c7aSBarry Smith     if (ja) {
2071a83f524SJed Brown       PetscInt *tja;
2089566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz + 1, &tja));
2091a83f524SJed Brown       for (i = 0; i < nz; i++) tja[i] = a->j[i] + 1;
2101a83f524SJed Brown       *ja = tja;
211ecc77c7aSBarry Smith     }
2126945ee14SBarry Smith   } else {
213ecc77c7aSBarry Smith     *ia = a->i;
214ecc77c7aSBarry Smith     if (ja) *ja = a->j;
215a2ce50c7SBarry Smith   }
2163a40ed3dSBarry Smith   PetscFunctionReturn(0);
217a2744918SBarry Smith }
218a2744918SBarry Smith 
219d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
220d71ae5a4SJacob Faibussowitsch {
2213a40ed3dSBarry Smith   PetscFunctionBegin;
2223a40ed3dSBarry Smith   if (!ia) PetscFunctionReturn(0);
223b94d7dedSBarry Smith   if ((symmetric && A->structurally_symmetric != PETSC_BOOL3_TRUE) || oshift == 1) {
2249566063dSJacob Faibussowitsch     PetscCall(PetscFree(*ia));
2259566063dSJacob Faibussowitsch     if (ja) PetscCall(PetscFree(*ja));
226bcd2baecSBarry Smith   }
2273a40ed3dSBarry Smith   PetscFunctionReturn(0);
22817ab2063SBarry Smith }
22917ab2063SBarry Smith 
230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
231d71ae5a4SJacob Faibussowitsch {
2323b2fbd54SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
233d0f46423SBarry Smith   PetscInt    i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
23497f1f81fSBarry Smith   PetscInt    nz = a->i[m], row, *jj, mr, col;
2353b2fbd54SBarry Smith 
2363a40ed3dSBarry Smith   PetscFunctionBegin;
237899cda47SBarry Smith   *nn = n;
2383a40ed3dSBarry Smith   if (!ia) PetscFunctionReturn(0);
2393b2fbd54SBarry Smith   if (symmetric) {
2409566063dSJacob Faibussowitsch     PetscCall(MatToSymmetricIJ_SeqAIJ(A->rmap->n, a->i, a->j, PETSC_TRUE, 0, oshift, (PetscInt **)ia, (PetscInt **)ja));
2413b2fbd54SBarry Smith   } else {
2429566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(n, &collengths));
2439566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n + 1, &cia));
2449566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nz, &cja));
2453b2fbd54SBarry Smith     jj = a->j;
246ad540459SPierre Jolivet     for (i = 0; i < nz; i++) collengths[jj[i]]++;
2473b2fbd54SBarry Smith     cia[0] = oshift;
248ad540459SPierre Jolivet     for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
2499566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(collengths, n));
2503b2fbd54SBarry Smith     jj = a->j;
251a93ec695SBarry Smith     for (row = 0; row < m; row++) {
252a93ec695SBarry Smith       mr = a->i[row + 1] - a->i[row];
253a93ec695SBarry Smith       for (i = 0; i < mr; i++) {
254bfeeae90SHong Zhang         col = *jj++;
2552205254eSKarl Rupp 
2563b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2573b2fbd54SBarry Smith       }
2583b2fbd54SBarry Smith     }
2599566063dSJacob Faibussowitsch     PetscCall(PetscFree(collengths));
2609371c9d4SSatish Balay     *ia = cia;
2619371c9d4SSatish Balay     *ja = cja;
2623b2fbd54SBarry Smith   }
2633a40ed3dSBarry Smith   PetscFunctionReturn(0);
2643b2fbd54SBarry Smith }
2653b2fbd54SBarry Smith 
266d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscBool *done)
267d71ae5a4SJacob Faibussowitsch {
2683a40ed3dSBarry Smith   PetscFunctionBegin;
2693a40ed3dSBarry Smith   if (!ia) PetscFunctionReturn(0);
2703b2fbd54SBarry Smith 
2719566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ia));
2729566063dSJacob Faibussowitsch   PetscCall(PetscFree(*ja));
2733a40ed3dSBarry Smith   PetscFunctionReturn(0);
2743b2fbd54SBarry Smith }
2753b2fbd54SBarry Smith 
2767cee066cSHong Zhang /*
2777cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized from
2787cee066cSHong Zhang  MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ() by adding an output
279040ebd07SHong Zhang  spidx[], index of a->a, to be used in MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ()
2807cee066cSHong Zhang */
281d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *nn, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
282d71ae5a4SJacob Faibussowitsch {
2837cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
2847cee066cSHong Zhang   PetscInt        i, *collengths, *cia, *cja, n = A->cmap->n, m = A->rmap->n;
285071fcb05SBarry Smith   PetscInt        nz = a->i[m], row, mr, col, tmp;
2867cee066cSHong Zhang   PetscInt       *cspidx;
287071fcb05SBarry Smith   const PetscInt *jj;
2887cee066cSHong Zhang 
2897cee066cSHong Zhang   PetscFunctionBegin;
2907cee066cSHong Zhang   *nn = n;
2917cee066cSHong Zhang   if (!ia) PetscFunctionReturn(0);
292625f6d37SHong Zhang 
2939566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(n, &collengths));
2949566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n + 1, &cia));
2959566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cja));
2969566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nz, &cspidx));
2977cee066cSHong Zhang   jj = a->j;
298ad540459SPierre Jolivet   for (i = 0; i < nz; i++) collengths[jj[i]]++;
2997cee066cSHong Zhang   cia[0] = oshift;
300ad540459SPierre Jolivet   for (i = 0; i < n; i++) cia[i + 1] = cia[i] + collengths[i];
3019566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(collengths, n));
3027cee066cSHong Zhang   jj = a->j;
3037cee066cSHong Zhang   for (row = 0; row < m; row++) {
3047cee066cSHong Zhang     mr = a->i[row + 1] - a->i[row];
3057cee066cSHong Zhang     for (i = 0; i < mr; i++) {
3067cee066cSHong Zhang       col         = *jj++;
307071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
308071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
309071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3107cee066cSHong Zhang     }
3117cee066cSHong Zhang   }
3129566063dSJacob Faibussowitsch   PetscCall(PetscFree(collengths));
313071fcb05SBarry Smith   *ia    = cia;
314071fcb05SBarry Smith   *ja    = cja;
3157cee066cSHong Zhang   *spidx = cspidx;
3167cee066cSHong Zhang   PetscFunctionReturn(0);
3177cee066cSHong Zhang }
3187cee066cSHong Zhang 
319d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A, PetscInt oshift, PetscBool symmetric, PetscBool inodecompressed, PetscInt *n, const PetscInt *ia[], const PetscInt *ja[], PetscInt *spidx[], PetscBool *done)
320d71ae5a4SJacob Faibussowitsch {
3217cee066cSHong Zhang   PetscFunctionBegin;
3229566063dSJacob Faibussowitsch   PetscCall(MatRestoreColumnIJ_SeqAIJ(A, oshift, symmetric, inodecompressed, n, ia, ja, done));
3239566063dSJacob Faibussowitsch   PetscCall(PetscFree(*spidx));
3247cee066cSHong Zhang   PetscFunctionReturn(0);
3257cee066cSHong Zhang }
3267cee066cSHong Zhang 
327d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A, PetscInt row, const PetscScalar v[])
328d71ae5a4SJacob Faibussowitsch {
32987d4246cSBarry Smith   Mat_SeqAIJ  *a  = (Mat_SeqAIJ *)A->data;
33087d4246cSBarry Smith   PetscInt    *ai = a->i;
331fff043a9SJunchao Zhang   PetscScalar *aa;
33287d4246cSBarry Smith 
33387d4246cSBarry Smith   PetscFunctionBegin;
3349566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
3359566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aa + ai[row], v, ai[row + 1] - ai[row]));
3369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
33787d4246cSBarry Smith   PetscFunctionReturn(0);
33887d4246cSBarry Smith }
33987d4246cSBarry Smith 
340bd04181cSBarry Smith /*
341bd04181cSBarry Smith     MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices with several assumptions
342bd04181cSBarry Smith 
343bd04181cSBarry Smith       -   a single row of values is set with each call
344bd04181cSBarry Smith       -   no row or column indices are negative or (in error) larger than the number of rows or columns
345bd04181cSBarry Smith       -   the values are always added to the matrix, not set
346bd04181cSBarry Smith       -   no new locations are introduced in the nonzero structure of the matrix
347bd04181cSBarry Smith 
3481f763a69SBarry Smith      This does NOT assume the global column indices are sorted
349bd04181cSBarry Smith 
3501f763a69SBarry Smith */
351bd04181cSBarry Smith 
352af0996ceSBarry Smith #include <petsc/private/isimpl.h>
353d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
354d71ae5a4SJacob Faibussowitsch {
355189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
3561f763a69SBarry Smith   PetscInt        low, high, t, row, nrow, i, col, l;
3571f763a69SBarry Smith   const PetscInt *rp, *ai = a->i, *ailen = a->ilen, *aj = a->j;
3581f763a69SBarry Smith   PetscInt        lastcol = -1;
359fff043a9SJunchao Zhang   MatScalar      *ap, value, *aa;
360189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices, *cidx = A->cmap->mapping->indices;
361189e4007SBarry Smith 
362fff043a9SJunchao Zhang   PetscFunctionBegin;
3639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
364f38dd0b8SBarry Smith   row  = ridx[im[0]];
3651f763a69SBarry Smith   rp   = aj + ai[row];
3661f763a69SBarry Smith   ap   = aa + ai[row];
3671f763a69SBarry Smith   nrow = ailen[row];
368189e4007SBarry Smith   low  = 0;
369189e4007SBarry Smith   high = nrow;
370189e4007SBarry Smith   for (l = 0; l < n; l++) { /* loop over added columns */
371189e4007SBarry Smith     col   = cidx[in[l]];
372f38dd0b8SBarry Smith     value = v[l];
373189e4007SBarry Smith 
374189e4007SBarry Smith     if (col <= lastcol) low = 0;
375189e4007SBarry Smith     else high = nrow;
376189e4007SBarry Smith     lastcol = col;
377189e4007SBarry Smith     while (high - low > 5) {
378189e4007SBarry Smith       t = (low + high) / 2;
379189e4007SBarry Smith       if (rp[t] > col) high = t;
380189e4007SBarry Smith       else low = t;
381189e4007SBarry Smith     }
382189e4007SBarry Smith     for (i = low; i < high; i++) {
383189e4007SBarry Smith       if (rp[i] == col) {
3841f763a69SBarry Smith         ap[i] += value;
385189e4007SBarry Smith         low = i + 1;
3861f763a69SBarry Smith         break;
387189e4007SBarry Smith       }
388189e4007SBarry Smith     }
389189e4007SBarry Smith   }
3909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
391f38dd0b8SBarry Smith   return 0;
392189e4007SBarry Smith }
393189e4007SBarry Smith 
/*
  MatSetValues_SeqAIJ - Inserts or adds an m by n block of values into a SeqAIJ matrix.

  Input Parameters:
+ A  - the matrix
. m  - number of rows in the block
. im - row indices; negative rows are skipped, rows >= A->rmap->n raise PETSC_ERR_ARG_OUTOFRANGE
. n  - number of columns in the block
. in - column indices; negative columns are skipped, columns >= A->cmap->n raise PETSC_ERR_ARG_OUTOFRANGE
. v  - the values, read row-wise (v[l + k*n]) when a->roworiented is set, column-wise (v[k + l*m]) otherwise;
       not read when NULL or when A->structure_only is set
- is - ADD_VALUES adds to an existing entry, any other mode overwrites it

  Notes:
  For a location that is not yet stored: a->nonew == 1 skips it silently, a->nonew == -1 raises an error,
  otherwise the entry is inserted in sorted position within its row (the reallocation macros are invoked first).
*/
394d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
395d71ae5a4SJacob Faibussowitsch {
396416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
/* NOTE(review): ii is never referenced directly in this function; presumably the MatSeqXAIJReallocateAIJ macros rely on it - confirm before removing */
397e2ee6c50SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
39897f1f81fSBarry Smith   PetscInt   *imax = a->imax, *ai = a->i, *ailen = a->ilen;
399e2ee6c50SBarry Smith   PetscInt   *aj = a->j, nonew = a->nonew, lastcol = -1;
400ce496241SStefano Zampini   MatScalar  *ap = NULL, value = 0.0, *aa;
401ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
402ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
40317ab2063SBarry Smith 
4043a40ed3dSBarry Smith   PetscFunctionBegin;
4059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
40617ab2063SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
407416022c9SBarry Smith     row = im[k];
4085ef9f2a5SBarry Smith     if (row < 0) continue;
4096bdcaf15SBarry Smith     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
/* rp/ap point at the column indices / values of this row; rmax is its allocated length, nrow its current length */
410720833daSHong Zhang     rp = aj + ai[row];
411876c6284SHong Zhang     if (!A->structure_only) ap = aa + ai[row];
4129371c9d4SSatish Balay     rmax = imax[row];
4139371c9d4SSatish Balay     nrow = ailen[row];
414416022c9SBarry Smith     low  = 0;
415c71e6ed7SBarry Smith     high = nrow;
41617ab2063SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
4175ef9f2a5SBarry Smith       if (in[l] < 0) continue;
4186bdcaf15SBarry Smith       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
419bfeeae90SHong Zhang       col = in[l];
420071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k * n] : v[k + l * m];
/* when zeros are ignored, an off-diagonal zero being added is dropped before any search */
421071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
42236db0b34SBarry Smith 
/* the lower bound left by the previous column is reused only if this column is larger than the last one */
4232205254eSKarl Rupp       if (col <= lastcol) low = 0;
4242205254eSKarl Rupp       else high = nrow;
425e2ee6c50SBarry Smith       lastcol = col;
/* bisect until at most 5 candidates remain, then scan them linearly */
426416022c9SBarry Smith       while (high - low > 5) {
427416022c9SBarry Smith         t = (low + high) / 2;
428416022c9SBarry Smith         if (rp[t] > col) high = t;
429416022c9SBarry Smith         else low = t;
43017ab2063SBarry Smith       }
431416022c9SBarry Smith       for (i = low; i < high; i++) {
43217ab2063SBarry Smith         if (rp[i] > col) break;
43317ab2063SBarry Smith         if (rp[i] == col) {
/* location already stored: update the value in place */
434876c6284SHong Zhang           if (!A->structure_only) {
4350c0d7e18SFande Kong             if (is == ADD_VALUES) {
4360c0d7e18SFande Kong               ap[i] += value;
4370c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4389371c9d4SSatish Balay             } else ap[i] = value;
439720833daSHong Zhang           }
440e44c0bd4SBarry Smith           low = i + 1;
44117ab2063SBarry Smith           goto noinsert;
44217ab2063SBarry Smith         }
44317ab2063SBarry Smith       }
/* not found: i is the position at which the new column has to be inserted */
444dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
445c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
44608401ef6SPierre Jolivet       PetscCheck(nonew != -1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero at (%" PetscInt_FMT ",%" PetscInt_FMT ") in the matrix", row, col);
/* NOTE(review): the macros below are defined outside this file; they receive rp, ap, rmax, ai, aj and aa and presumably enlarge the storage when the row is full - confirm against aij.h */
447720833daSHong Zhang       if (A->structure_only) {
448876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A, A->rmap->n, 1, nrow, row, col, rmax, ai, aj, rp, imax, nonew, MatScalar);
449720833daSHong Zhang       } else {
450fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
451720833daSHong Zhang       }
/* N is the index of the last entry of the row before the insertion; the row grows by one */
4529371c9d4SSatish Balay       N = nrow++ - 1;
4539371c9d4SSatish Balay       a->nz++;
4549371c9d4SSatish Balay       high++;
455416022c9SBarry Smith       /* shift up all the later entries in this row */
4569566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(rp + i + 1, rp + i, N - i + 1));
45717ab2063SBarry Smith       rp[i] = col;
458580bdb30SBarry Smith       if (!A->structure_only) {
4599566063dSJacob Faibussowitsch         PetscCall(PetscArraymove(ap + i + 1, ap + i, N - i + 1));
460580bdb30SBarry Smith         ap[i] = value;
461580bdb30SBarry Smith       }
462416022c9SBarry Smith       low = i + 1;
/* a new location was added, so the nonzero state counter is advanced */
463e56f5c9eSBarry Smith       A->nonzerostate++;
464e44c0bd4SBarry Smith     noinsert:;
46517ab2063SBarry Smith     }
/* store the (possibly grown) row length back */
46617ab2063SBarry Smith     ailen[row] = nrow;
46717ab2063SBarry Smith   }
4689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
4693a40ed3dSBarry Smith   PetscFunctionReturn(0);
47017ab2063SBarry Smith }
47117ab2063SBarry Smith 
472d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFullNoPreallocation(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
473d71ae5a4SJacob Faibussowitsch {
47419b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
47519b08ed1SBarry Smith   PetscInt   *rp, k, row;
47619b08ed1SBarry Smith   PetscInt   *ai = a->i;
47719b08ed1SBarry Smith   PetscInt   *aj = a->j;
478fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
47919b08ed1SBarry Smith 
48019b08ed1SBarry Smith   PetscFunctionBegin;
48128b400f6SJacob Faibussowitsch   PetscCheck(!A->was_assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot call on assembled matrix.");
48208401ef6SPierre Jolivet   PetscCheck(m * n + a->nz <= a->maxnz, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Number of entries in matrix will be larger than maximum nonzeros allocated for %" PetscInt_FMT " in MatSeqAIJSetTotalPreallocation()", a->maxnz);
483fff043a9SJunchao Zhang 
4849566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
48519b08ed1SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
48619b08ed1SBarry Smith     row = im[k];
48719b08ed1SBarry Smith     rp  = aj + ai[row];
48819b08ed1SBarry Smith     ap  = aa + ai[row];
48919b08ed1SBarry Smith 
4909566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
49119b08ed1SBarry Smith     if (!A->structure_only) {
49219b08ed1SBarry Smith       if (v) {
4939566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
49419b08ed1SBarry Smith         v += n;
49519b08ed1SBarry Smith       } else {
4969566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
49719b08ed1SBarry Smith       }
49819b08ed1SBarry Smith     }
49919b08ed1SBarry Smith     a->ilen[row]  = n;
50019b08ed1SBarry Smith     a->imax[row]  = n;
50119b08ed1SBarry Smith     a->i[row + 1] = a->i[row] + n;
50219b08ed1SBarry Smith     a->nz += n;
50319b08ed1SBarry Smith   }
5049566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
50519b08ed1SBarry Smith   PetscFunctionReturn(0);
50619b08ed1SBarry Smith }
50719b08ed1SBarry Smith 
50819b08ed1SBarry Smith /*@
50919b08ed1SBarry Smith     MatSeqAIJSetTotalPreallocation - Sets an upper bound on the total number of expected nonzeros in the matrix.
51019b08ed1SBarry Smith 
51119b08ed1SBarry Smith   Input Parameters:
51211a5261eSBarry Smith +  A - the `MATSEQAIJ` matrix
51319b08ed1SBarry Smith -  nztotal - bound on the number of nonzeros
51419b08ed1SBarry Smith 
51519b08ed1SBarry Smith   Level: advanced
51619b08ed1SBarry Smith 
51719b08ed1SBarry Smith   Notes:
51819b08ed1SBarry Smith     This can be called if you will be provided the matrix row by row (from row zero) with sorted column indices for each row.
51911a5261eSBarry Smith     Simply call `MatSetValues()` after this call to provide the matrix entries in the usual manner. This matrix may be used
52019b08ed1SBarry Smith     as always with multiple matrix assemblies.
52119b08ed1SBarry Smith 
522db781477SPatrick Sanan .seealso: `MatSetOption()`, `MAT_SORTED_FULL`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`
52319b08ed1SBarry Smith @*/
52419b08ed1SBarry Smith 
525d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetTotalPreallocation(Mat A, PetscInt nztotal)
526d71ae5a4SJacob Faibussowitsch {
52719b08ed1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
52819b08ed1SBarry Smith 
52919b08ed1SBarry Smith   PetscFunctionBegin;
5309566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->rmap));
5319566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(A->cmap));
53219b08ed1SBarry Smith   a->maxnz = nztotal;
5334dfa11a4SJacob Faibussowitsch   if (!a->imax) { PetscCall(PetscMalloc1(A->rmap->n, &a->imax)); }
53419b08ed1SBarry Smith   if (!a->ilen) {
5359566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n, &a->ilen));
53619b08ed1SBarry Smith   } else {
5379566063dSJacob Faibussowitsch     PetscCall(PetscMemzero(a->ilen, A->rmap->n * sizeof(PetscInt)));
53819b08ed1SBarry Smith   }
53919b08ed1SBarry Smith 
54019b08ed1SBarry Smith   /* allocate the matrix space */
54119b08ed1SBarry Smith   if (A->structure_only) {
5429566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nztotal, &a->j));
5439566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(A->rmap->n + 1, &a->i));
54419b08ed1SBarry Smith   } else {
5459566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(nztotal, &a->a, nztotal, &a->j, A->rmap->n + 1, &a->i));
54619b08ed1SBarry Smith   }
54719b08ed1SBarry Smith   a->i[0] = 0;
54819b08ed1SBarry Smith   if (A->structure_only) {
54919b08ed1SBarry Smith     a->singlemalloc = PETSC_FALSE;
55019b08ed1SBarry Smith     a->free_a       = PETSC_FALSE;
55119b08ed1SBarry Smith   } else {
55219b08ed1SBarry Smith     a->singlemalloc = PETSC_TRUE;
55319b08ed1SBarry Smith     a->free_a       = PETSC_TRUE;
55419b08ed1SBarry Smith   }
55519b08ed1SBarry Smith   a->free_ij        = PETSC_TRUE;
55619b08ed1SBarry Smith   A->ops->setvalues = MatSetValues_SeqAIJ_SortedFullNoPreallocation;
55719b08ed1SBarry Smith   A->preallocated   = PETSC_TRUE;
55819b08ed1SBarry Smith   PetscFunctionReturn(0);
55919b08ed1SBarry Smith }
56019b08ed1SBarry Smith 
561d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], const PetscScalar v[], InsertMode is)
562d71ae5a4SJacob Faibussowitsch {
563071fcb05SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
564071fcb05SBarry Smith   PetscInt   *rp, k, row;
565071fcb05SBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
566071fcb05SBarry Smith   PetscInt   *aj = a->j;
567fff043a9SJunchao Zhang   MatScalar  *aa, *ap;
568071fcb05SBarry Smith 
569071fcb05SBarry Smith   PetscFunctionBegin;
5709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
571071fcb05SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
572071fcb05SBarry Smith     row = im[k];
5736bdcaf15SBarry Smith     PetscCheck(n <= a->imax[row], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "Preallocation for row %" PetscInt_FMT " does not match number of columns provided", n);
574071fcb05SBarry Smith     rp = aj + ai[row];
575071fcb05SBarry Smith     ap = aa + ai[row];
57648a46eb9SPierre Jolivet     if (!A->was_assembled) PetscCall(PetscMemcpy(rp, in, n * sizeof(PetscInt)));
577071fcb05SBarry Smith     if (!A->structure_only) {
578071fcb05SBarry Smith       if (v) {
5799566063dSJacob Faibussowitsch         PetscCall(PetscMemcpy(ap, v, n * sizeof(PetscScalar)));
580071fcb05SBarry Smith         v += n;
581071fcb05SBarry Smith       } else {
5829566063dSJacob Faibussowitsch         PetscCall(PetscMemzero(ap, n * sizeof(PetscScalar)));
583071fcb05SBarry Smith       }
584071fcb05SBarry Smith     }
585071fcb05SBarry Smith     ailen[row] = n;
586071fcb05SBarry Smith     a->nz += n;
587071fcb05SBarry Smith   }
5889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
589071fcb05SBarry Smith   PetscFunctionReturn(0);
590071fcb05SBarry Smith }
591071fcb05SBarry Smith 
592d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetValues_SeqAIJ(Mat A, PetscInt m, const PetscInt im[], PetscInt n, const PetscInt in[], PetscScalar v[])
593d71ae5a4SJacob Faibussowitsch {
5947eb43aa7SLois Curfman McInnes   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
59597f1f81fSBarry Smith   PetscInt   *rp, k, low, high, t, row, nrow, i, col, l, *aj = a->j;
59697f1f81fSBarry Smith   PetscInt   *ai = a->i, *ailen = a->ilen;
597fff043a9SJunchao Zhang   MatScalar  *ap, *aa;
5987eb43aa7SLois Curfman McInnes 
5993a40ed3dSBarry Smith   PetscFunctionBegin;
6009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
6017eb43aa7SLois Curfman McInnes   for (k = 0; k < m; k++) { /* loop over rows */
6027eb43aa7SLois Curfman McInnes     row = im[k];
6039371c9d4SSatish Balay     if (row < 0) {
6049371c9d4SSatish Balay       v += n;
6059371c9d4SSatish Balay       continue;
6069371c9d4SSatish Balay     } /* negative row */
60754c59aa7SJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Row too large: row %" PetscInt_FMT " max %" PetscInt_FMT, row, A->rmap->n - 1);
6089371c9d4SSatish Balay     rp   = aj + ai[row];
6099371c9d4SSatish Balay     ap   = aa + ai[row];
6107eb43aa7SLois Curfman McInnes     nrow = ailen[row];
6117eb43aa7SLois Curfman McInnes     for (l = 0; l < n; l++) { /* loop over columns */
6129371c9d4SSatish Balay       if (in[l] < 0) {
6139371c9d4SSatish Balay         v++;
6149371c9d4SSatish Balay         continue;
6159371c9d4SSatish Balay       } /* negative column */
61654c59aa7SJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column too large: col %" PetscInt_FMT " max %" PetscInt_FMT, in[l], A->cmap->n - 1);
617bfeeae90SHong Zhang       col  = in[l];
6189371c9d4SSatish Balay       high = nrow;
6199371c9d4SSatish Balay       low  = 0; /* assume unsorted */
6207eb43aa7SLois Curfman McInnes       while (high - low > 5) {
6217eb43aa7SLois Curfman McInnes         t = (low + high) / 2;
6227eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
6237eb43aa7SLois Curfman McInnes         else low = t;
6247eb43aa7SLois Curfman McInnes       }
6257eb43aa7SLois Curfman McInnes       for (i = low; i < high; i++) {
6267eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
6277eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
628b49de8d1SLois Curfman McInnes           *v++ = ap[i];
6297eb43aa7SLois Curfman McInnes           goto finished;
6307eb43aa7SLois Curfman McInnes         }
6317eb43aa7SLois Curfman McInnes       }
63297e567efSBarry Smith       *v++ = 0.0;
6337eb43aa7SLois Curfman McInnes     finished:;
6347eb43aa7SLois Curfman McInnes     }
6357eb43aa7SLois Curfman McInnes   }
6369566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
6373a40ed3dSBarry Smith   PetscFunctionReturn(0);
6387eb43aa7SLois Curfman McInnes }
6397eb43aa7SLois Curfman McInnes 
640d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
641d71ae5a4SJacob Faibussowitsch {
6423ea6fe3dSLisandro Dalcin   Mat_SeqAIJ        *A = (Mat_SeqAIJ *)mat->data;
643c898d852SStefano Zampini   const PetscScalar *av;
6443ea6fe3dSLisandro Dalcin   PetscInt           header[4], M, N, m, nz, i;
6453ea6fe3dSLisandro Dalcin   PetscInt          *rowlens;
64617ab2063SBarry Smith 
6473a40ed3dSBarry Smith   PetscFunctionBegin;
6489566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
6492205254eSKarl Rupp 
6503ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6513ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6523ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6533ea6fe3dSLisandro Dalcin   nz = A->nz;
654416022c9SBarry Smith 
6553ea6fe3dSLisandro Dalcin   /* write matrix header */
6563ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6579371c9d4SSatish Balay   header[1] = M;
6589371c9d4SSatish Balay   header[2] = N;
6599371c9d4SSatish Balay   header[3] = nz;
6609566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, header, 4, PETSC_INT));
661416022c9SBarry Smith 
6623ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6639566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &rowlens));
6643ea6fe3dSLisandro Dalcin   for (i = 0; i < m; i++) rowlens[i] = A->i[i + 1] - A->i[i];
6659566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, rowlens, m, PETSC_INT));
6669566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
6673ea6fe3dSLisandro Dalcin   /* store column indices */
6689566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, A->j, nz, PETSC_INT));
669416022c9SBarry Smith   /* store nonzero values */
6709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(mat, &av));
6719566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryWrite(viewer, av, nz, PETSC_SCALAR));
6729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(mat, &av));
673b37d52dbSMark F. Adams 
6743ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6759566063dSJacob Faibussowitsch   PetscCall(MatView_Binary_BlockSizes(mat, viewer));
6763a40ed3dSBarry Smith   PetscFunctionReturn(0);
67717ab2063SBarry Smith }
678416022c9SBarry Smith 
679d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A, PetscViewer viewer)
680d71ae5a4SJacob Faibussowitsch {
6817dc0baabSHong Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
6827dc0baabSHong Zhang   PetscInt    i, k, m = A->rmap->N;
6837dc0baabSHong Zhang 
6847dc0baabSHong Zhang   PetscFunctionBegin;
6859566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
6867dc0baabSHong Zhang   for (i = 0; i < m; i++) {
6879566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
68848a46eb9SPierre Jolivet     for (k = a->i[i]; k < a->i[i + 1]; k++) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ") ", a->j[k]));
6899566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
6907dc0baabSHong Zhang   }
6919566063dSJacob Faibussowitsch   PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
6927dc0baabSHong Zhang   PetscFunctionReturn(0);
6937dc0baabSHong Zhang }
6947dc0baabSHong Zhang 
69509573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat, PetscViewer);
696cd155464SBarry Smith 
697d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_ASCII(Mat A, PetscViewer viewer)
698d71ae5a4SJacob Faibussowitsch {
699416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
700c898d852SStefano Zampini   const PetscScalar *av;
70160e0710aSBarry Smith   PetscInt           i, j, m = A->rmap->n;
702e060cb09SBarry Smith   const char        *name;
703f3ef73ceSBarry Smith   PetscViewerFormat  format;
70417ab2063SBarry Smith 
7053a40ed3dSBarry Smith   PetscFunctionBegin;
7067dc0baabSHong Zhang   if (A->structure_only) {
7079566063dSJacob Faibussowitsch     PetscCall(MatView_SeqAIJ_ASCII_structonly(A, viewer));
7087dc0baabSHong Zhang     PetscFunctionReturn(0);
7097dc0baabSHong Zhang   }
71043e49210SHong Zhang 
7119566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
7122e5835c6SStefano Zampini   if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0);
7132e5835c6SStefano Zampini 
714c898d852SStefano Zampini   /* trigger copy to CPU if needed */
7159566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
7169566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
71771c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
71897f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
71960e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m - 1]) || (a->j[a->nz - 1] != A->cmap->n - 1))) {
720c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
721d00d2cf4SBarry Smith       nofinalvalue = 1;
722d00d2cf4SBarry Smith     }
7239566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7249566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Size = %" PetscInt_FMT " %" PetscInt_FMT " \n", m, A->cmap->n));
7259566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%% Nonzeros = %" PetscInt_FMT " \n", a->nz));
726fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
7279566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",4);\n", a->nz + nofinalvalue));
728fbfe6fa7SJed Brown #else
7299566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = zeros(%" PetscInt_FMT ",3);\n", a->nz + nofinalvalue));
730fbfe6fa7SJed Brown #endif
7319566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "zzz = [\n"));
73217ab2063SBarry Smith 
73317ab2063SBarry Smith     for (i = 0; i < m; i++) {
73460e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
735aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
7369566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", i + 1, a->j[j] + 1, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
73717ab2063SBarry Smith #else
7389566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", i + 1, a->j[j] + 1, (double)a->a[j]));
73917ab2063SBarry Smith #endif
74017ab2063SBarry Smith       }
74117ab2063SBarry Smith     }
742d00d2cf4SBarry Smith     if (nofinalvalue) {
743c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
7449566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e %18.16e\n", m, A->cmap->n, 0., 0.));
745c337ccceSJed Brown #else
7469566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT "  %18.16e\n", m, A->cmap->n, 0.0));
747c337ccceSJed Brown #endif
748d00d2cf4SBarry Smith     }
7499566063dSJacob Faibussowitsch     PetscCall(PetscObjectGetName((PetscObject)A, &name));
7509566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "];\n %s = spconvert(zzz);\n", name));
7519566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
752fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
7539566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
75444cd7ae7SLois Curfman McInnes     for (i = 0; i < m; i++) {
7559566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
75660e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
757aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
75836db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7599566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
76036db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
7619566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
76236db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
7639566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
7646831982aSBarry Smith         }
76544cd7ae7SLois Curfman McInnes #else
7669566063dSJacob Faibussowitsch         if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
76744cd7ae7SLois Curfman McInnes #endif
76844cd7ae7SLois Curfman McInnes       }
7699566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
77044cd7ae7SLois Curfman McInnes     }
7719566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
772fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
77397f1f81fSBarry Smith     PetscInt nzd = 0, fshift = 1, *sptr;
7749566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
7759566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m + 1, &sptr));
776496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
777496be53dSLois Curfman McInnes       sptr[i] = nzd + 1;
77860e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
779496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
780aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
78136db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
782496be53dSLois Curfman McInnes #else
783496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
784496be53dSLois Curfman McInnes #endif
785496be53dSLois Curfman McInnes         }
786496be53dSLois Curfman McInnes       }
787496be53dSLois Curfman McInnes     }
7882e44a96cSLois Curfman McInnes     sptr[m] = nzd + 1;
7899566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n\n", m, nzd));
7902e44a96cSLois Curfman McInnes     for (i = 0; i < m + 1; i += 6) {
7912205254eSKarl Rupp       if (i + 4 < m) {
7929566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4], sptr[i + 5]));
7932205254eSKarl Rupp       } else if (i + 3 < m) {
7949566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3], sptr[i + 4]));
7952205254eSKarl Rupp       } else if (i + 2 < m) {
7969566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2], sptr[i + 3]));
7972205254eSKarl Rupp       } else if (i + 1 < m) {
7989566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1], sptr[i + 2]));
7992205254eSKarl Rupp       } else if (i < m) {
8009566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " %" PetscInt_FMT "\n", sptr[i], sptr[i + 1]));
8012205254eSKarl Rupp       } else {
8029566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT "\n", sptr[i]));
8032205254eSKarl Rupp       }
804496be53dSLois Curfman McInnes     }
8059566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
8069566063dSJacob Faibussowitsch     PetscCall(PetscFree(sptr));
807496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
80860e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8099566063dSJacob Faibussowitsch         if (a->j[j] >= i) PetscCall(PetscViewerASCIIPrintf(viewer, " %" PetscInt_FMT " ", a->j[j] + fshift));
810496be53dSLois Curfman McInnes       }
8119566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
812496be53dSLois Curfman McInnes     }
8139566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
814496be53dSLois Curfman McInnes     for (i = 0; i < m; i++) {
81560e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
816496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
817aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
81848a46eb9SPierre Jolivet           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e %18.16e ", (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
819496be53dSLois Curfman McInnes #else
8209566063dSJacob Faibussowitsch           if (a->a[j] != 0.0) PetscCall(PetscViewerASCIIPrintf(viewer, " %18.16e ", (double)a->a[j]));
821496be53dSLois Curfman McInnes #endif
822496be53dSLois Curfman McInnes         }
823496be53dSLois Curfman McInnes       }
8249566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
825496be53dSLois Curfman McInnes     }
8269566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
827fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
82897f1f81fSBarry Smith     PetscInt    cnt = 0, jcnt;
82987828ca2SBarry Smith     PetscScalar value;
83068f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
83168f1ed48SBarry Smith     PetscBool realonly = PETSC_TRUE;
83268f1ed48SBarry Smith 
83368f1ed48SBarry Smith     for (i = 0; i < a->i[m]; i++) {
83468f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
83568f1ed48SBarry Smith         realonly = PETSC_FALSE;
83668f1ed48SBarry Smith         break;
83768f1ed48SBarry Smith       }
83868f1ed48SBarry Smith     }
83968f1ed48SBarry Smith #endif
84002594712SBarry Smith 
8419566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
84202594712SBarry Smith     for (i = 0; i < m; i++) {
84302594712SBarry Smith       jcnt = 0;
844d0f46423SBarry Smith       for (j = 0; j < A->cmap->n; j++) {
845e24b481bSBarry Smith         if (jcnt < a->i[i + 1] - a->i[i] && j == a->j[cnt]) {
84602594712SBarry Smith           value = a->a[cnt++];
847e24b481bSBarry Smith           jcnt++;
84802594712SBarry Smith         } else {
84902594712SBarry Smith           value = 0.0;
85002594712SBarry Smith         }
851aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
85268f1ed48SBarry Smith         if (realonly) {
8539566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)PetscRealPart(value)));
85468f1ed48SBarry Smith         } else {
8559566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e+%7.5e i ", (double)PetscRealPart(value), (double)PetscImaginaryPart(value)));
85668f1ed48SBarry Smith         }
85702594712SBarry Smith #else
8589566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " %7.5e ", (double)value));
85902594712SBarry Smith #endif
86002594712SBarry Smith       }
8619566063dSJacob Faibussowitsch       PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
86202594712SBarry Smith     }
8639566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8643c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
865150b93efSMatthew G. Knepley     PetscInt fshift = 1;
8669566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
8673c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8689566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate complex general\n"));
8693c215bfdSMatthew Knepley #else
8709566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%%%%MatrixMarket matrix coordinate real general\n"));
8713c215bfdSMatthew Knepley #endif
8729566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %" PetscInt_FMT "\n", m, A->cmap->n, a->nz));
8733c215bfdSMatthew Knepley     for (i = 0; i < m; i++) {
87460e0710aSBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
8753c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
8769566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g %g\n", i + fshift, a->j[j] + fshift, (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
8773c215bfdSMatthew Knepley #else
8789566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "%" PetscInt_FMT " %" PetscInt_FMT " %g\n", i + fshift, a->j[j] + fshift, (double)a->a[j]));
8793c215bfdSMatthew Knepley #endif
8803c215bfdSMatthew Knepley       }
8813c215bfdSMatthew Knepley     }
8829566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
8833a40ed3dSBarry Smith   } else {
8849566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_FALSE));
885d5f3da31SBarry Smith     if (A->factortype) {
88616cd7e1dSShri Abhyankar       for (i = 0; i < m; i++) {
8879566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
88816cd7e1dSShri Abhyankar         /* L part */
88960e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
89016cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
89116cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
8929566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
89316cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
8949566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
89516cd7e1dSShri Abhyankar           } else {
8969566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
89716cd7e1dSShri Abhyankar           }
89816cd7e1dSShri Abhyankar #else
8999566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
90016cd7e1dSShri Abhyankar #endif
90116cd7e1dSShri Abhyankar         }
90216cd7e1dSShri Abhyankar         /* diagonal */
90316cd7e1dSShri Abhyankar         j = a->diag[i];
90416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
90516cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
9069566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)PetscImaginaryPart(1.0 / a->a[j])));
90716cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9089566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(1.0 / a->a[j]), (double)(-PetscImaginaryPart(1.0 / a->a[j]))));
90916cd7e1dSShri Abhyankar         } else {
9109566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(1.0 / a->a[j])));
91116cd7e1dSShri Abhyankar         }
91216cd7e1dSShri Abhyankar #else
9139566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)(1.0 / a->a[j])));
91416cd7e1dSShri Abhyankar #endif
91516cd7e1dSShri Abhyankar 
91616cd7e1dSShri Abhyankar         /* U part */
91760e0710aSBarry Smith         for (j = a->diag[i + 1] + 1; j < a->diag[i]; j++) {
91816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
91916cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9209566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
92116cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9229566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)(-PetscImaginaryPart(a->a[j]))));
92316cd7e1dSShri Abhyankar           } else {
9249566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
92516cd7e1dSShri Abhyankar           }
92616cd7e1dSShri Abhyankar #else
9279566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
92816cd7e1dSShri Abhyankar #endif
92916cd7e1dSShri Abhyankar         }
9309566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
93116cd7e1dSShri Abhyankar       }
93216cd7e1dSShri Abhyankar     } else {
93317ab2063SBarry Smith       for (i = 0; i < m; i++) {
9349566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "row %" PetscInt_FMT ":", i));
93560e0710aSBarry Smith         for (j = a->i[i]; j < a->i[i + 1]; j++) {
936aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
93736db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
9389566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g + %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)PetscImaginaryPart(a->a[j])));
93936db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
9409566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g - %g i)", a->j[j], (double)PetscRealPart(a->a[j]), (double)-PetscImaginaryPart(a->a[j])));
9413a40ed3dSBarry Smith           } else {
9429566063dSJacob Faibussowitsch             PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)PetscRealPart(a->a[j])));
94317ab2063SBarry Smith           }
94417ab2063SBarry Smith #else
9459566063dSJacob Faibussowitsch           PetscCall(PetscViewerASCIIPrintf(viewer, " (%" PetscInt_FMT ", %g) ", a->j[j], (double)a->a[j]));
94617ab2063SBarry Smith #endif
94717ab2063SBarry Smith         }
9489566063dSJacob Faibussowitsch         PetscCall(PetscViewerASCIIPrintf(viewer, "\n"));
94917ab2063SBarry Smith       }
95016cd7e1dSShri Abhyankar     }
9519566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIUseTabs(viewer, PETSC_TRUE));
95217ab2063SBarry Smith   }
9539566063dSJacob Faibussowitsch   PetscCall(PetscViewerFlush(viewer));
9543a40ed3dSBarry Smith   PetscFunctionReturn(0);
955416022c9SBarry Smith }
956416022c9SBarry Smith 
9579804daf3SBarry Smith #include <petscdraw.h>
958d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw, void *Aa)
959d71ae5a4SJacob Faibussowitsch {
960480ef9eaSBarry Smith   Mat                A = (Mat)Aa;
961416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
962383922c3SLisandro Dalcin   PetscInt           i, j, m = A->rmap->n;
963383922c3SLisandro Dalcin   int                color;
964b05fc000SLisandro Dalcin   PetscReal          xl, yl, xr, yr, x_l, x_r, y_l, y_r;
965b0a32e0cSBarry Smith   PetscViewer        viewer;
966f3ef73ceSBarry Smith   PetscViewerFormat  format;
967fff043a9SJunchao Zhang   const PetscScalar *aa;
968cddf8d76SBarry Smith 
9693a40ed3dSBarry Smith   PetscFunctionBegin;
9709566063dSJacob Faibussowitsch   PetscCall(PetscObjectQuery((PetscObject)A, "Zoomviewer", (PetscObject *)&viewer));
9719566063dSJacob Faibussowitsch   PetscCall(PetscViewerGetFormat(viewer, &format));
9729566063dSJacob Faibussowitsch   PetscCall(PetscDrawGetCoordinates(draw, &xl, &yl, &xr, &yr));
973383922c3SLisandro Dalcin 
974416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9759566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
976fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
977d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
9780513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
979b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
980416022c9SBarry Smith     for (i = 0; i < m; i++) {
9819371c9d4SSatish Balay       y_l = m - i - 1.0;
9829371c9d4SSatish Balay       y_r = y_l + 1.0;
983bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9849371c9d4SSatish Balay         x_l = a->j[j];
9859371c9d4SSatish Balay         x_r = x_l + 1.0;
986fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) >= 0.) continue;
9879566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
988cddf8d76SBarry Smith       }
989cddf8d76SBarry Smith     }
990b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
991cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
9929371c9d4SSatish Balay       y_l = m - i - 1.0;
9939371c9d4SSatish Balay       y_r = y_l + 1.0;
994bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
9959371c9d4SSatish Balay         x_l = a->j[j];
9969371c9d4SSatish Balay         x_r = x_l + 1.0;
997fff043a9SJunchao Zhang         if (aa[j] != 0.) continue;
9989566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
999cddf8d76SBarry Smith       }
1000cddf8d76SBarry Smith     }
1001b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
1002cddf8d76SBarry Smith     for (i = 0; i < m; i++) {
10039371c9d4SSatish Balay       y_l = m - i - 1.0;
10049371c9d4SSatish Balay       y_r = y_l + 1.0;
1005bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
10069371c9d4SSatish Balay         x_l = a->j[j];
10079371c9d4SSatish Balay         x_r = x_l + 1.0;
1008fff043a9SJunchao Zhang         if (PetscRealPart(aa[j]) <= 0.) continue;
10099566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
1010416022c9SBarry Smith       }
1011416022c9SBarry Smith     }
1012d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10130513a670SBarry Smith   } else {
10140513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
10150513a670SBarry Smith     /* first determine max of all nonzero values */
1016b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
1017383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
1018b0a32e0cSBarry Smith     PetscDraw popup;
10190513a670SBarry Smith 
10200513a670SBarry Smith     for (i = 0; i < nz; i++) {
1021fff043a9SJunchao Zhang       if (PetscAbsScalar(aa[i]) > maxv) maxv = PetscAbsScalar(aa[i]);
10220513a670SBarry Smith     }
1023383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
10249566063dSJacob Faibussowitsch     PetscCall(PetscDrawGetPopup(draw, &popup));
10259566063dSJacob Faibussowitsch     PetscCall(PetscDrawScalePopup(popup, minv, maxv));
1026383922c3SLisandro Dalcin 
1027d0609cedSBarry Smith     PetscDrawCollectiveBegin(draw);
10280513a670SBarry Smith     for (i = 0; i < m; i++) {
1029383922c3SLisandro Dalcin       y_l = m - i - 1.0;
1030383922c3SLisandro Dalcin       y_r = y_l + 1.0;
1031bfeeae90SHong Zhang       for (j = a->i[i]; j < a->i[i + 1]; j++) {
1032383922c3SLisandro Dalcin         x_l   = a->j[j];
1033383922c3SLisandro Dalcin         x_r   = x_l + 1.0;
1034fff043a9SJunchao Zhang         color = PetscDrawRealToColor(PetscAbsScalar(aa[count]), minv, maxv);
10359566063dSJacob Faibussowitsch         PetscCall(PetscDrawRectangle(draw, x_l, y_l, x_r, y_r, color, color, color, color));
10360513a670SBarry Smith         count++;
10370513a670SBarry Smith       }
10380513a670SBarry Smith     }
1039d0609cedSBarry Smith     PetscDrawCollectiveEnd(draw);
10400513a670SBarry Smith   }
10419566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
1042480ef9eaSBarry Smith   PetscFunctionReturn(0);
1043480ef9eaSBarry Smith }
1044cddf8d76SBarry Smith 
10459804daf3SBarry Smith #include <petscdraw.h>
1046d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ_Draw(Mat A, PetscViewer viewer)
1047d71ae5a4SJacob Faibussowitsch {
1048b0a32e0cSBarry Smith   PetscDraw draw;
104936db0b34SBarry Smith   PetscReal xr, yr, xl, yl, h, w;
1050ace3abfcSBarry Smith   PetscBool isnull;
1051480ef9eaSBarry Smith 
1052480ef9eaSBarry Smith   PetscFunctionBegin;
10539566063dSJacob Faibussowitsch   PetscCall(PetscViewerDrawGetDraw(viewer, 0, &draw));
10549566063dSJacob Faibussowitsch   PetscCall(PetscDrawIsNull(draw, &isnull));
1055480ef9eaSBarry Smith   if (isnull) PetscFunctionReturn(0);
1056480ef9eaSBarry Smith 
10579371c9d4SSatish Balay   xr = A->cmap->n;
10589371c9d4SSatish Balay   yr = A->rmap->n;
10599371c9d4SSatish Balay   h  = yr / 10.0;
10609371c9d4SSatish Balay   w  = xr / 10.0;
10619371c9d4SSatish Balay   xr += w;
10629371c9d4SSatish Balay   yr += h;
10639371c9d4SSatish Balay   xl = -w;
10649371c9d4SSatish Balay   yl = -h;
10659566063dSJacob Faibussowitsch   PetscCall(PetscDrawSetCoordinates(draw, xl, yl, xr, yr));
10669566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", (PetscObject)viewer));
10679566063dSJacob Faibussowitsch   PetscCall(PetscDrawZoom(draw, MatView_SeqAIJ_Draw_Zoom, A));
10689566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "Zoomviewer", NULL));
10699566063dSJacob Faibussowitsch   PetscCall(PetscDrawSave(draw));
10703a40ed3dSBarry Smith   PetscFunctionReturn(0);
1071416022c9SBarry Smith }
1072416022c9SBarry Smith 
1073d71ae5a4SJacob Faibussowitsch PetscErrorCode MatView_SeqAIJ(Mat A, PetscViewer viewer)
1074d71ae5a4SJacob Faibussowitsch {
1075ace3abfcSBarry Smith   PetscBool iascii, isbinary, isdraw;
1076416022c9SBarry Smith 
10773a40ed3dSBarry Smith   PetscFunctionBegin;
10789566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &iascii));
10799566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
10809566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERDRAW, &isdraw));
10811baa6e33SBarry Smith   if (iascii) PetscCall(MatView_SeqAIJ_ASCII(A, viewer));
10821baa6e33SBarry Smith   else if (isbinary) PetscCall(MatView_SeqAIJ_Binary(A, viewer));
10831baa6e33SBarry Smith   else if (isdraw) PetscCall(MatView_SeqAIJ_Draw(A, viewer));
10849566063dSJacob Faibussowitsch   PetscCall(MatView_SeqAIJ_Inode(A, viewer));
10853a40ed3dSBarry Smith   PetscFunctionReturn(0);
108617ab2063SBarry Smith }
108719bcc07fSBarry Smith 
1088d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A, MatAssemblyType mode)
1089d71ae5a4SJacob Faibussowitsch {
1090416022c9SBarry Smith   Mat_SeqAIJ *a      = (Mat_SeqAIJ *)A->data;
1091580bdb30SBarry Smith   PetscInt    fshift = 0, i, *ai = a->i, *aj = a->j, *imax = a->imax;
1092d0f46423SBarry Smith   PetscInt    m = A->rmap->n, *ip, N, *ailen = a->ilen, rmax = 0;
109354f21887SBarry Smith   MatScalar  *aa    = a->a, *ap;
10943447b6efSHong Zhang   PetscReal   ratio = 0.6;
109517ab2063SBarry Smith 
10963a40ed3dSBarry Smith   PetscFunctionBegin;
10973a40ed3dSBarry Smith   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0);
10989566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
1099b215bc84SStefano Zampini   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) {
1100b215bc84SStefano Zampini     /* we need to respect users asking to use or not the inodes routine in between matrix assemblies */
11019566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
1102b215bc84SStefano Zampini     PetscFunctionReturn(0);
1103b215bc84SStefano Zampini   }
110417ab2063SBarry Smith 
110543ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
110617ab2063SBarry Smith   for (i = 1; i < m; i++) {
1107416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
110817ab2063SBarry Smith     fshift += imax[i - 1] - ailen[i - 1];
110994a9d846SBarry Smith     rmax = PetscMax(rmax, ailen[i]);
111017ab2063SBarry Smith     if (fshift) {
1111bfeeae90SHong Zhang       ip = aj + ai[i];
1112bfeeae90SHong Zhang       ap = aa + ai[i];
111317ab2063SBarry Smith       N  = ailen[i];
11149566063dSJacob Faibussowitsch       PetscCall(PetscArraymove(ip - fshift, ip, N));
111548a46eb9SPierre Jolivet       if (!A->structure_only) PetscCall(PetscArraymove(ap - fshift, ap, N));
111617ab2063SBarry Smith     }
111717ab2063SBarry Smith     ai[i] = ai[i - 1] + ailen[i - 1];
111817ab2063SBarry Smith   }
111917ab2063SBarry Smith   if (m) {
112017ab2063SBarry Smith     fshift += imax[m - 1] - ailen[m - 1];
112117ab2063SBarry Smith     ai[m] = ai[m - 1] + ailen[m - 1];
112217ab2063SBarry Smith   }
11237b083b7cSBarry Smith 
112417ab2063SBarry Smith   /* reset ilen and imax for each row */
11257b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1126396832f4SHong Zhang   if (A->structure_only) {
11279566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->imax));
11289566063dSJacob Faibussowitsch     PetscCall(PetscFree(a->ilen));
1129396832f4SHong Zhang   } else { /* !A->structure_only */
113017ab2063SBarry Smith     for (i = 0; i < m; i++) {
113117ab2063SBarry Smith       ailen[i] = imax[i] = ai[i + 1] - ai[i];
11327b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i + 1] - ai[i]) > 0);
113317ab2063SBarry Smith     }
1134396832f4SHong Zhang   }
1135bfeeae90SHong Zhang   a->nz = ai[m];
1136aed4548fSBarry Smith   PetscCheck(!fshift || a->nounused != -1, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Unused space detected in matrix: %" PetscInt_FMT " X %" PetscInt_FMT ", %" PetscInt_FMT " unneeded", m, A->cmap->n, fshift);
113717ab2063SBarry Smith 
11389566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
11399566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Matrix size: %" PetscInt_FMT " X %" PetscInt_FMT "; storage space: %" PetscInt_FMT " unneeded,%" PetscInt_FMT " used\n", m, A->cmap->n, fshift, a->nz));
11409566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Number of mallocs during MatSetValues() is %" PetscInt_FMT "\n", a->reallocs));
11419566063dSJacob Faibussowitsch   PetscCall(PetscInfo(A, "Maximum nonzeros in any row is %" PetscInt_FMT "\n", rmax));
11422205254eSKarl Rupp 
11438e58a170SBarry Smith   A->info.mallocs += a->reallocs;
1144dd5f02e7SSatish Balay   a->reallocs         = 0;
11456712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
114636db0b34SBarry Smith   a->rmax             = rmax;
11474e220ebcSLois Curfman McInnes 
114848a46eb9SPierre Jolivet   if (!A->structure_only) PetscCall(MatCheckCompressedRow(A, a->nonzerorowcnt, &a->compressedrow, a->i, m, ratio));
11499566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd_SeqAIJ_Inode(A, mode));
11503a40ed3dSBarry Smith   PetscFunctionReturn(0);
115117ab2063SBarry Smith }
115217ab2063SBarry Smith 
1153d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRealPart_SeqAIJ(Mat A)
1154d71ae5a4SJacob Faibussowitsch {
115599cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
115699cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11572e5835c6SStefano Zampini   MatScalar  *aa;
115899cafbc1SBarry Smith 
115999cafbc1SBarry Smith   PetscFunctionBegin;
11609566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
116199cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscRealPart(aa[i]);
11629566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
116499cafbc1SBarry Smith   PetscFunctionReturn(0);
116599cafbc1SBarry Smith }
116699cafbc1SBarry Smith 
1167d71ae5a4SJacob Faibussowitsch PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
1168d71ae5a4SJacob Faibussowitsch {
116999cafbc1SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
117099cafbc1SBarry Smith   PetscInt    i, nz = a->nz;
11712e5835c6SStefano Zampini   MatScalar  *aa;
117299cafbc1SBarry Smith 
117399cafbc1SBarry Smith   PetscFunctionBegin;
11749566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
117599cafbc1SBarry Smith   for (i = 0; i < nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
11769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
11779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
117899cafbc1SBarry Smith   PetscFunctionReturn(0);
117999cafbc1SBarry Smith }
118099cafbc1SBarry Smith 
1181d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
1182d71ae5a4SJacob Faibussowitsch {
1183fff043a9SJunchao Zhang   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1184fff043a9SJunchao Zhang   MatScalar  *aa;
11853a40ed3dSBarry Smith 
11863a40ed3dSBarry Smith   PetscFunctionBegin;
11879566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayWrite(A, &aa));
11889566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(aa, a->i[A->rmap->n]));
11899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayWrite(A, &aa));
11909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
11913a40ed3dSBarry Smith   PetscFunctionReturn(0);
119217ab2063SBarry Smith }
1193416022c9SBarry Smith 
1194d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatResetPreallocationCOO_SeqAIJ(Mat A)
1195d71ae5a4SJacob Faibussowitsch {
1196cbc6b225SStefano Zampini   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1197cbc6b225SStefano Zampini 
1198cbc6b225SStefano Zampini   PetscFunctionBegin;
11999566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->perm));
12009566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->jmap));
1201cbc6b225SStefano Zampini   PetscFunctionReturn(0);
1202cbc6b225SStefano Zampini }
1203cbc6b225SStefano Zampini 
1204d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroy_SeqAIJ(Mat A)
1205d71ae5a4SJacob Faibussowitsch {
1206416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1207d5d45c9bSBarry Smith 
12083a40ed3dSBarry Smith   PetscFunctionBegin;
1209aa482453SBarry Smith #if defined(PETSC_USE_LOG)
1210c0aa6a63SJacob Faibussowitsch   PetscLogObjectState((PetscObject)A, "Rows=%" PetscInt_FMT ", Cols=%" PetscInt_FMT ", NZ=%" PetscInt_FMT, A->rmap->n, A->cmap->n, a->nz);
121117ab2063SBarry Smith #endif
12129566063dSJacob Faibussowitsch   PetscCall(MatSeqXAIJFreeAIJ(A, &a->a, &a->j, &a->i));
12139566063dSJacob Faibussowitsch   PetscCall(MatResetPreallocationCOO_SeqAIJ(A));
12149566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
12159566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
12169566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->diag));
12179566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ibdiag));
12189566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->imax));
12199566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ilen));
12209566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->ipre));
12219566063dSJacob Faibussowitsch   PetscCall(PetscFree3(a->idiag, a->mdiag, a->ssor_work));
12229566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->solve_work));
12239566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
12249566063dSJacob Faibussowitsch   PetscCall(PetscFree(a->saved_values));
12259566063dSJacob Faibussowitsch   PetscCall(PetscFree2(a->compressedrow.i, a->compressedrow.rindex));
12269566063dSJacob Faibussowitsch   PetscCall(MatDestroy_SeqAIJ_Inode(A));
12279566063dSJacob Faibussowitsch   PetscCall(PetscFree(A->data));
1228901853e0SKris Buschelman 
12296718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
12306718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
12316718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
12326718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
12336718818eSStefano Zampini      due to different matrix sizes */
12349566063dSJacob Faibussowitsch   PetscCall(PetscObjectCompose((PetscObject)A, "__PETSc__ab_dense", NULL));
12356718818eSStefano Zampini 
12369566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)A, NULL));
12372e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEnginePut_C", NULL));
12382e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "PetscMatlabEngineGet_C", NULL));
12399566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetColumnIndices_C", NULL));
12409566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatStoreValues_C", NULL));
12419566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatRetrieveValues_C", NULL));
12429566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsbaij_C", NULL));
12439566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqbaij_C", NULL));
12449566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijperm_C", NULL));
12452e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijsell_C", NULL));
12462e956fe4SStefano Zampini #if defined(PETSC_HAVE_MKL_SPARSE)
12472e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijmkl_C", NULL));
12482e956fe4SStefano Zampini #endif
12494222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
12509566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcusparse_C", NULL));
12519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", NULL));
12529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", NULL));
12534222ddf1SHong Zhang #endif
12543d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
12559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijkokkos_C", NULL));
12563d0639e7SStefano Zampini #endif
12579566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijcrl_C", NULL));
1258af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
12599566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_elemental_C", NULL));
1260af8000cdSHong Zhang #endif
1261d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
12629566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_scalapack_C", NULL));
1263d24d4204SJose E. Roman #endif
126463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
12659566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_hypre_C", NULL));
12669566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", NULL));
126763c07aadSStefano Zampini #endif
12689566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqdense_C", NULL));
12699566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqsell_C", NULL));
12709566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_is_C", NULL));
12719566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsTranspose_C", NULL));
12722e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatIsHermitianTranspose_C", NULL));
12739566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocation_C", NULL));
12749566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatResetPreallocation_C", NULL));
12759566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJSetPreallocationCSR_C", NULL));
12769566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatReorderForNonzeroDiagonal_C", NULL));
12779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_is_seqaij_C", NULL));
12789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqdense_seqaij_C", NULL));
12799566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaij_seqaij_C", NULL));
12809566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSeqAIJKron_C", NULL));
12819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetPreallocationCOO_C", NULL));
12829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatSetValuesCOO_C", NULL));
12832e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatFactorGetSolverType_C", NULL));
12842e956fe4SStefano Zampini   /* these calls do not belong here: the subclasses Duplicate/Destroy are wrong */
12852e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijsell_seqaij_C", NULL));
12862e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaijperm_seqaij_C", NULL));
12872e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatConvert_seqaij_seqaijviennacl_C", NULL));
12882e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqdense_C", NULL));
12892e956fe4SStefano Zampini   PetscCall(PetscObjectComposeFunction((PetscObject)A, "MatProductSetFromOptions_seqaijviennacl_seqaij_C", NULL));
12903a40ed3dSBarry Smith   PetscFunctionReturn(0);
129117ab2063SBarry Smith }
129217ab2063SBarry Smith 
1293d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetOption_SeqAIJ(Mat A, MatOption op, PetscBool flg)
1294d71ae5a4SJacob Faibussowitsch {
1295416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
12963a40ed3dSBarry Smith 
12973a40ed3dSBarry Smith   PetscFunctionBegin;
1298a65d3064SKris Buschelman   switch (op) {
1299d71ae5a4SJacob Faibussowitsch   case MAT_ROW_ORIENTED:
1300d71ae5a4SJacob Faibussowitsch     a->roworiented = flg;
1301d71ae5a4SJacob Faibussowitsch     break;
1302d71ae5a4SJacob Faibussowitsch   case MAT_KEEP_NONZERO_PATTERN:
1303d71ae5a4SJacob Faibussowitsch     a->keepnonzeropattern = flg;
1304d71ae5a4SJacob Faibussowitsch     break;
1305d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATIONS:
1306d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? 0 : 1);
1307d71ae5a4SJacob Faibussowitsch     break;
1308d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_LOCATION_ERR:
1309d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -1 : 0);
1310d71ae5a4SJacob Faibussowitsch     break;
1311d71ae5a4SJacob Faibussowitsch   case MAT_NEW_NONZERO_ALLOCATION_ERR:
1312d71ae5a4SJacob Faibussowitsch     a->nonew = (flg ? -2 : 0);
1313d71ae5a4SJacob Faibussowitsch     break;
1314d71ae5a4SJacob Faibussowitsch   case MAT_UNUSED_NONZERO_LOCATION_ERR:
1315d71ae5a4SJacob Faibussowitsch     a->nounused = (flg ? -1 : 0);
1316d71ae5a4SJacob Faibussowitsch     break;
1317d71ae5a4SJacob Faibussowitsch   case MAT_IGNORE_ZERO_ENTRIES:
1318d71ae5a4SJacob Faibussowitsch     a->ignorezeroentries = flg;
1319d71ae5a4SJacob Faibussowitsch     break;
13203d472b54SHong Zhang   case MAT_SPD:
1321b1646e73SJed Brown   case MAT_SYMMETRIC:
1322b1646e73SJed Brown   case MAT_STRUCTURALLY_SYMMETRIC:
1323b1646e73SJed Brown   case MAT_HERMITIAN:
1324b1646e73SJed Brown   case MAT_SYMMETRY_ETERNAL:
1325957cac9fSHong Zhang   case MAT_STRUCTURE_ONLY:
1326b94d7dedSBarry Smith   case MAT_STRUCTURAL_SYMMETRY_ETERNAL:
1327b94d7dedSBarry Smith   case MAT_SPD_ETERNAL:
1328b94d7dedSBarry Smith     /* if the diagonal matrix is square it inherits some of the properties above */
13295021d80fSJed Brown     break;
13308c78258cSHong Zhang   case MAT_FORCE_DIAGONAL_ENTRIES:
1331a65d3064SKris Buschelman   case MAT_IGNORE_OFF_PROC_ENTRIES:
1332d71ae5a4SJacob Faibussowitsch   case MAT_USE_HASH_TABLE:
1333d71ae5a4SJacob Faibussowitsch     PetscCall(PetscInfo(A, "Option %s ignored\n", MatOptions[op]));
1334d71ae5a4SJacob Faibussowitsch     break;
1335d71ae5a4SJacob Faibussowitsch   case MAT_USE_INODES:
1336d71ae5a4SJacob Faibussowitsch     PetscCall(MatSetOption_SeqAIJ_Inode(A, MAT_USE_INODES, flg));
1337d71ae5a4SJacob Faibussowitsch     break;
1338d71ae5a4SJacob Faibussowitsch   case MAT_SUBMAT_SINGLEIS:
1339d71ae5a4SJacob Faibussowitsch     A->submat_singleis = flg;
1340d71ae5a4SJacob Faibussowitsch     break;
1341071fcb05SBarry Smith   case MAT_SORTED_FULL:
1342071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1343071fcb05SBarry Smith     else A->ops->setvalues = MatSetValues_SeqAIJ;
1344071fcb05SBarry Smith     break;
1345d71ae5a4SJacob Faibussowitsch   case MAT_FORM_EXPLICIT_TRANSPOSE:
1346d71ae5a4SJacob Faibussowitsch     A->form_explicit_transpose = flg;
1347d71ae5a4SJacob Faibussowitsch     break;
1348d71ae5a4SJacob Faibussowitsch   default:
1349d71ae5a4SJacob Faibussowitsch     SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "unknown option %d", op);
1350a65d3064SKris Buschelman   }
13513a40ed3dSBarry Smith   PetscFunctionReturn(0);
135217ab2063SBarry Smith }
135317ab2063SBarry Smith 
1354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A, Vec v)
1355d71ae5a4SJacob Faibussowitsch {
1356416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1357fdc842d1SBarry Smith   PetscInt           i, j, n, *ai = a->i, *aj = a->j;
1358c898d852SStefano Zampini   PetscScalar       *x;
1359c898d852SStefano Zampini   const PetscScalar *aa;
136017ab2063SBarry Smith 
13613a40ed3dSBarry Smith   PetscFunctionBegin;
13629566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
136308401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
13649566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
1365d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1366d3e70bfaSHong Zhang     PetscInt *diag = a->diag;
13679566063dSJacob Faibussowitsch     PetscCall(VecGetArrayWrite(v, &x));
13682c990fa1SHong Zhang     for (i = 0; i < n; i++) x[i] = 1.0 / aa[diag[i]];
13699566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayWrite(v, &x));
13709566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
137135e7444dSHong Zhang     PetscFunctionReturn(0);
137235e7444dSHong Zhang   }
137335e7444dSHong Zhang 
13749566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
137535e7444dSHong Zhang   for (i = 0; i < n; i++) {
1376fdc842d1SBarry Smith     x[i] = 0.0;
137735e7444dSHong Zhang     for (j = ai[i]; j < ai[i + 1]; j++) {
137835e7444dSHong Zhang       if (aj[j] == i) {
137935e7444dSHong Zhang         x[i] = aa[j];
138017ab2063SBarry Smith         break;
138117ab2063SBarry Smith       }
138217ab2063SBarry Smith     }
138317ab2063SBarry Smith   }
13849566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
13859566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
13863a40ed3dSBarry Smith   PetscFunctionReturn(0);
138717ab2063SBarry Smith }
138817ab2063SBarry Smith 
1389c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1390d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A, Vec xx, Vec zz, Vec yy)
1391d71ae5a4SJacob Faibussowitsch {
1392416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
13935f22a7b3SSebastian Grimberg   const MatScalar   *aa;
1394d9ca1df4SBarry Smith   PetscScalar       *y;
1395d9ca1df4SBarry Smith   const PetscScalar *x;
1396d0f46423SBarry Smith   PetscInt           m = A->rmap->n;
13975c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
13985f22a7b3SSebastian Grimberg   const MatScalar  *v;
1399a77337e4SBarry Smith   PetscScalar       alpha;
1400d9ca1df4SBarry Smith   PetscInt          n, i, j;
1401d9ca1df4SBarry Smith   const PetscInt   *idx, *ii, *ridx = NULL;
14023447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1403ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
14045c897100SBarry Smith #endif
140517ab2063SBarry Smith 
14063a40ed3dSBarry Smith   PetscFunctionBegin;
14079566063dSJacob Faibussowitsch   if (zz != yy) PetscCall(VecCopy(zz, yy));
14089566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14099566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
14109566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
14115c897100SBarry Smith 
14125c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1413fff043a9SJunchao Zhang   fortranmulttransposeaddaij_(&m, x, a->i, a->j, aa, y);
14145c897100SBarry Smith #else
14153447b6efSHong Zhang   if (usecprow) {
14163447b6efSHong Zhang     m = cprow.nrows;
14173447b6efSHong Zhang     ii = cprow.i;
14187b2bb3b9SHong Zhang     ridx = cprow.rindex;
14193447b6efSHong Zhang   } else {
14203447b6efSHong Zhang     ii = a->i;
14213447b6efSHong Zhang   }
142217ab2063SBarry Smith   for (i = 0; i < m; i++) {
14233447b6efSHong Zhang     idx = a->j + ii[i];
1424fff043a9SJunchao Zhang     v = aa + ii[i];
14253447b6efSHong Zhang     n = ii[i + 1] - ii[i];
14263447b6efSHong Zhang     if (usecprow) {
14277b2bb3b9SHong Zhang       alpha = x[ridx[i]];
14283447b6efSHong Zhang     } else {
142917ab2063SBarry Smith       alpha = x[i];
14303447b6efSHong Zhang     }
143104fbf559SBarry Smith     for (j = 0; j < n; j++) y[idx[j]] += alpha * v[j];
143217ab2063SBarry Smith   }
14335c897100SBarry Smith #endif
14349566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
14359566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
14369566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
14379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
14383a40ed3dSBarry Smith   PetscFunctionReturn(0);
143917ab2063SBarry Smith }
144017ab2063SBarry Smith 
1441d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultTranspose_SeqAIJ(Mat A, Vec xx, Vec yy)
1442d71ae5a4SJacob Faibussowitsch {
14435c897100SBarry Smith   PetscFunctionBegin;
14449566063dSJacob Faibussowitsch   PetscCall(VecSet(yy, 0.0));
14459566063dSJacob Faibussowitsch   PetscCall(MatMultTransposeAdd_SeqAIJ(A, xx, yy, yy));
14465c897100SBarry Smith   PetscFunctionReturn(0);
14475c897100SBarry Smith }
14485c897100SBarry Smith 
1449c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
145078b84d54SShri Abhyankar 
1451d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMult_SeqAIJ(Mat A, Vec xx, Vec yy)
1452d71ae5a4SJacob Faibussowitsch {
1453416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1454d9fead3dSBarry Smith   PetscScalar       *y;
145554f21887SBarry Smith   const PetscScalar *x;
1456fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1457003131ecSBarry Smith   PetscInt           m = A->rmap->n;
14580298fd71SBarry Smith   const PetscInt    *aj, *ii, *ridx = NULL;
14597b083b7cSBarry Smith   PetscInt           n, i;
1460362ced78SSatish Balay   PetscScalar        sum;
1461ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
146217ab2063SBarry Smith 
1463b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
146497952fefSHong Zhang   #pragma disjoint(*x, *y, *aa)
1465fee21e36SBarry Smith #endif
1466fee21e36SBarry Smith 
14673a40ed3dSBarry Smith   PetscFunctionBegin;
1468b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
14699566063dSJacob Faibussowitsch     PetscCall(MatMult_SeqAIJ_Inode(A, xx, yy));
1470b215bc84SStefano Zampini     PetscFunctionReturn(0);
1471b215bc84SStefano Zampini   }
14729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
14739566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
14749566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1475416022c9SBarry Smith   ii = a->i;
14764eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
14779566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(y, m));
147897952fefSHong Zhang     m    = a->compressedrow.nrows;
147997952fefSHong Zhang     ii   = a->compressedrow.i;
148097952fefSHong Zhang     ridx = a->compressedrow.rindex;
148197952fefSHong Zhang     for (i = 0; i < m; i++) {
148297952fefSHong Zhang       n   = ii[i + 1] - ii[i];
148397952fefSHong Zhang       aj  = a->j + ii[i];
1484fff043a9SJunchao Zhang       aa  = a_a + ii[i];
148597952fefSHong Zhang       sum = 0.0;
1486003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
1487003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
148897952fefSHong Zhang       y[*ridx++] = sum;
148997952fefSHong Zhang     }
149097952fefSHong Zhang   } else { /* do not use compressed row format */
1491b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
14923d3eaba7SBarry Smith     aj = a->j;
1493fff043a9SJunchao Zhang     aa = a_a;
1494b05257ddSBarry Smith     fortranmultaij_(&m, x, ii, aj, aa, y);
1495b05257ddSBarry Smith #else
149617ab2063SBarry Smith     for (i = 0; i < m; i++) {
1497003131ecSBarry Smith       n = ii[i + 1] - ii[i];
1498003131ecSBarry Smith       aj = a->j + ii[i];
1499fff043a9SJunchao Zhang       aa = a_a + ii[i];
150017ab2063SBarry Smith       sum = 0.0;
1501003131ecSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
150217ab2063SBarry Smith       y[i] = sum;
150317ab2063SBarry Smith     }
15048d195f9aSBarry Smith #endif
1505b05257ddSBarry Smith   }
15069566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - a->nonzerorowcnt));
15079566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15089566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15099566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
15103a40ed3dSBarry Smith   PetscFunctionReturn(0);
151117ab2063SBarry Smith }
151217ab2063SBarry Smith 
1513d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultMax_SeqAIJ(Mat A, Vec xx, Vec yy)
1514d71ae5a4SJacob Faibussowitsch {
1515b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1516b434eb95SMatthew G. Knepley   PetscScalar       *y;
1517b434eb95SMatthew G. Knepley   const PetscScalar *x;
1518fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1519b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n;
1520b434eb95SMatthew G. Knepley   const PetscInt    *aj, *ii, *ridx   = NULL;
1521b434eb95SMatthew G. Knepley   PetscInt           n, i, nonzerorow = 0;
1522b434eb95SMatthew G. Knepley   PetscScalar        sum;
1523b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1524b434eb95SMatthew G. Knepley 
1525b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1526b434eb95SMatthew G. Knepley   #pragma disjoint(*x, *y, *aa)
1527b434eb95SMatthew G. Knepley #endif
1528b434eb95SMatthew G. Knepley 
1529b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15309566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15319566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15329566063dSJacob Faibussowitsch   PetscCall(VecGetArray(yy, &y));
1533b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1534b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1535b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1536b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1537b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1538b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1539b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1540fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1541b434eb95SMatthew G. Knepley       sum = 0.0;
1542b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1543b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1544b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1545b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1546b434eb95SMatthew G. Knepley     }
1547b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15483d3eaba7SBarry Smith     ii = a->i;
1549b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1550b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1551b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1552fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1553b434eb95SMatthew G. Knepley       sum = 0.0;
1554b434eb95SMatthew G. Knepley       nonzerorow += (n > 0);
1555b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1556b434eb95SMatthew G. Knepley       y[i] = sum;
1557b434eb95SMatthew G. Knepley     }
1558b434eb95SMatthew G. Knepley   }
15599566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz - nonzerorow));
15609566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
15619566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(yy, &y));
15629566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
1563b434eb95SMatthew G. Knepley   PetscFunctionReturn(0);
1564b434eb95SMatthew G. Knepley }
1565b434eb95SMatthew G. Knepley 
1566d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAddMax_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1567d71ae5a4SJacob Faibussowitsch {
1568b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1569b434eb95SMatthew G. Knepley   PetscScalar       *y, *z;
1570b434eb95SMatthew G. Knepley   const PetscScalar *x;
1571fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1572b434eb95SMatthew G. Knepley   PetscInt           m = A->rmap->n, *aj, *ii;
1573b434eb95SMatthew G. Knepley   PetscInt           n, i, *ridx = NULL;
1574b434eb95SMatthew G. Knepley   PetscScalar        sum;
1575b434eb95SMatthew G. Knepley   PetscBool          usecprow = a->compressedrow.use;
1576b434eb95SMatthew G. Knepley 
1577b434eb95SMatthew G. Knepley   PetscFunctionBegin;
15789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
15799566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
15809566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
1581b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
158248a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
1583b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1584b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1585b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1586b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1587b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1588b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1589fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1590b434eb95SMatthew G. Knepley       sum = y[*ridx];
1591b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1592b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1593b434eb95SMatthew G. Knepley     }
1594b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15953d3eaba7SBarry Smith     ii = a->i;
1596b434eb95SMatthew G. Knepley     for (i = 0; i < m; i++) {
1597b434eb95SMatthew G. Knepley       n   = ii[i + 1] - ii[i];
1598b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1599fff043a9SJunchao Zhang       aa  = a_a + ii[i];
1600b434eb95SMatthew G. Knepley       sum = y[i];
1601b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum, x, aa, aj, n);
1602b434eb95SMatthew G. Knepley       z[i] = sum;
1603b434eb95SMatthew G. Knepley     }
1604b434eb95SMatthew G. Knepley   }
16059566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16069566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16079566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16089566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
1609b434eb95SMatthew G. Knepley   PetscFunctionReturn(0);
1610b434eb95SMatthew G. Knepley }
1611b434eb95SMatthew G. Knepley 
1612c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1613d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMultAdd_SeqAIJ(Mat A, Vec xx, Vec yy, Vec zz)
1614d71ae5a4SJacob Faibussowitsch {
1615416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1616f15663dcSBarry Smith   PetscScalar       *y, *z;
1617f15663dcSBarry Smith   const PetscScalar *x;
1618fff043a9SJunchao Zhang   const MatScalar   *aa, *a_a;
1619d9ca1df4SBarry Smith   const PetscInt    *aj, *ii, *ridx = NULL;
1620d9ca1df4SBarry Smith   PetscInt           m = A->rmap->n, n, i;
1621362ced78SSatish Balay   PetscScalar        sum;
1622ace3abfcSBarry Smith   PetscBool          usecprow = a->compressedrow.use;
16239ea0dfa2SSatish Balay 
16243a40ed3dSBarry Smith   PetscFunctionBegin;
1625b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked) {
16269566063dSJacob Faibussowitsch     PetscCall(MatMultAdd_SeqAIJ_Inode(A, xx, yy, zz));
1627b215bc84SStefano Zampini     PetscFunctionReturn(0);
1628b215bc84SStefano Zampini   }
16299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &a_a));
16309566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(xx, &x));
16319566063dSJacob Faibussowitsch   PetscCall(VecGetArrayPair(yy, zz, &y, &z));
16324eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
163348a46eb9SPierre Jolivet     if (zz != yy) PetscCall(PetscArraycpy(z, y, m));
163497952fefSHong Zhang     m    = a->compressedrow.nrows;
163597952fefSHong Zhang     ii   = a->compressedrow.i;
163697952fefSHong Zhang     ridx = a->compressedrow.rindex;
163797952fefSHong Zhang     for (i = 0; i < m; i++) {
163897952fefSHong Zhang       n   = ii[i + 1] - ii[i];
163997952fefSHong Zhang       aj  = a->j + ii[i];
1640fff043a9SJunchao Zhang       aa  = a_a + ii[i];
164197952fefSHong Zhang       sum = y[*ridx];
1642f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
164397952fefSHong Zhang       z[*ridx++] = sum;
164497952fefSHong Zhang     }
164597952fefSHong Zhang   } else { /* do not use compressed row format */
16463d3eaba7SBarry Smith     ii = a->i;
1647f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
16483d3eaba7SBarry Smith     aj = a->j;
1649fff043a9SJunchao Zhang     aa = a_a;
1650f15663dcSBarry Smith     fortranmultaddaij_(&m, x, ii, aj, aa, y, z);
1651f15663dcSBarry Smith #else
165217ab2063SBarry Smith     for (i = 0; i < m; i++) {
1653f15663dcSBarry Smith       n = ii[i + 1] - ii[i];
1654f15663dcSBarry Smith       aj = a->j + ii[i];
1655fff043a9SJunchao Zhang       aa = a_a + ii[i];
165617ab2063SBarry Smith       sum = y[i];
1657f15663dcSBarry Smith       PetscSparseDensePlusDot(sum, x, aa, aj, n);
165817ab2063SBarry Smith       z[i] = sum;
165917ab2063SBarry Smith     }
166002ab625aSSatish Balay #endif
1661f15663dcSBarry Smith   }
16629566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(2.0 * a->nz));
16639566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(xx, &x));
16649566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayPair(yy, zz, &y, &z));
16659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &a_a));
16663a40ed3dSBarry Smith   PetscFunctionReturn(0);
166717ab2063SBarry Smith }
166817ab2063SBarry Smith 
166917ab2063SBarry Smith /*
167017ab2063SBarry Smith      Adds diagonal pointers to sparse matrix structure.
167117ab2063SBarry Smith */
1672d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
1673d71ae5a4SJacob Faibussowitsch {
1674416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
1675d0f46423SBarry Smith   PetscInt    i, j, m = A->rmap->n;
1676c0c07093SJunchao Zhang   PetscBool   alreadySet = PETSC_TRUE;
167717ab2063SBarry Smith 
16783a40ed3dSBarry Smith   PetscFunctionBegin;
167909f38230SBarry Smith   if (!a->diag) {
16809566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &a->diag));
1681c0c07093SJunchao Zhang     alreadySet = PETSC_FALSE;
168209f38230SBarry Smith   }
1683d0f46423SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
1684c0c07093SJunchao Zhang     /* If A's diagonal is already correctly set, this fast track enables cheap and repeated MatMarkDiagonal_SeqAIJ() calls */
1685c0c07093SJunchao Zhang     if (alreadySet) {
1686c0c07093SJunchao Zhang       PetscInt pos = a->diag[i];
1687c0c07093SJunchao Zhang       if (pos >= a->i[i] && pos < a->i[i + 1] && a->j[pos] == i) continue;
1688c0c07093SJunchao Zhang     }
1689c0c07093SJunchao Zhang 
169009f38230SBarry Smith     a->diag[i] = a->i[i + 1];
1691bfeeae90SHong Zhang     for (j = a->i[i]; j < a->i[i + 1]; j++) {
1692bfeeae90SHong Zhang       if (a->j[j] == i) {
169309f38230SBarry Smith         a->diag[i] = j;
169417ab2063SBarry Smith         break;
169517ab2063SBarry Smith       }
169617ab2063SBarry Smith     }
169717ab2063SBarry Smith   }
16983a40ed3dSBarry Smith   PetscFunctionReturn(0);
169917ab2063SBarry Smith }
170017ab2063SBarry Smith 
1701d71ae5a4SJacob Faibussowitsch PetscErrorCode MatShift_SeqAIJ(Mat A, PetscScalar v)
1702d71ae5a4SJacob Faibussowitsch {
170361ecd0c6SBarry Smith   Mat_SeqAIJ     *a    = (Mat_SeqAIJ *)A->data;
170461ecd0c6SBarry Smith   const PetscInt *diag = (const PetscInt *)a->diag;
170561ecd0c6SBarry Smith   const PetscInt *ii   = (const PetscInt *)a->i;
170661ecd0c6SBarry Smith   PetscInt        i, *mdiag = NULL;
170761ecd0c6SBarry Smith   PetscInt        cnt = 0; /* how many diagonals are missing */
170861ecd0c6SBarry Smith 
170961ecd0c6SBarry Smith   PetscFunctionBegin;
171061ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
17119566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(A, 1, NULL));
17129566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
171361ecd0c6SBarry Smith     PetscFunctionReturn(0);
171461ecd0c6SBarry Smith   }
171561ecd0c6SBarry Smith 
171661ecd0c6SBarry Smith   if (a->diagonaldense) {
171761ecd0c6SBarry Smith     cnt = 0;
171861ecd0c6SBarry Smith   } else {
17199566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->rmap->n, &mdiag));
172061ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
1721349d3b71SJunchao Zhang       if (i < A->cmap->n && diag[i] >= ii[i + 1]) { /* 'out of range' rows never have diagonals */
172261ecd0c6SBarry Smith         cnt++;
172361ecd0c6SBarry Smith         mdiag[i] = 1;
172461ecd0c6SBarry Smith       }
172561ecd0c6SBarry Smith     }
172661ecd0c6SBarry Smith   }
172761ecd0c6SBarry Smith   if (!cnt) {
17289566063dSJacob Faibussowitsch     PetscCall(MatShift_Basic(A, v));
172961ecd0c6SBarry Smith   } else {
1730b6f2aa54SBarry Smith     PetscScalar *olda = a->a; /* preserve pointers to current matrix nonzeros structure and values */
1731b6f2aa54SBarry Smith     PetscInt    *oldj = a->j, *oldi = a->i;
173261ecd0c6SBarry Smith     PetscBool    singlemalloc = a->singlemalloc, free_a = a->free_a, free_ij = a->free_ij;
173361ecd0c6SBarry Smith 
173461ecd0c6SBarry Smith     a->a = NULL;
173561ecd0c6SBarry Smith     a->j = NULL;
173661ecd0c6SBarry Smith     a->i = NULL;
173761ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
1738ad540459SPierre Jolivet     for (i = 0; i < PetscMin(A->rmap->n, A->cmap->n); i++) a->imax[i] += mdiag[i];
17399566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, 0, a->imax));
174061ecd0c6SBarry Smith 
174161ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
174261ecd0c6SBarry Smith     for (i = 0; i < A->rmap->n; i++) {
17439566063dSJacob Faibussowitsch       PetscCall(MatSetValues(A, 1, &i, a->imax[i] - mdiag[i], &oldj[oldi[i]], &olda[oldi[i]], ADD_VALUES));
174448a46eb9SPierre Jolivet       if (i < A->cmap->n) PetscCall(MatSetValue(A, i, i, v, ADD_VALUES));
1745447d62f5SStefano Zampini     }
17469566063dSJacob Faibussowitsch     PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY));
17479566063dSJacob Faibussowitsch     PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY));
174861ecd0c6SBarry Smith     if (singlemalloc) {
17499566063dSJacob Faibussowitsch       PetscCall(PetscFree3(olda, oldj, oldi));
175061ecd0c6SBarry Smith     } else {
17519566063dSJacob Faibussowitsch       if (free_a) PetscCall(PetscFree(olda));
17529566063dSJacob Faibussowitsch       if (free_ij) PetscCall(PetscFree(oldj));
17539566063dSJacob Faibussowitsch       if (free_ij) PetscCall(PetscFree(oldi));
175461ecd0c6SBarry Smith     }
175561ecd0c6SBarry Smith   }
17569566063dSJacob Faibussowitsch   PetscCall(PetscFree(mdiag));
175761ecd0c6SBarry Smith   a->diagonaldense = PETSC_TRUE;
175861ecd0c6SBarry Smith   PetscFunctionReturn(0);
175961ecd0c6SBarry Smith }
176061ecd0c6SBarry Smith 
1761be5855fcSBarry Smith /*
1762be5855fcSBarry Smith      Checks for missing diagonals
1763be5855fcSBarry Smith */
1764d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A, PetscBool *missing, PetscInt *d)
1765d71ae5a4SJacob Faibussowitsch {
1766be5855fcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
17677734d3b5SMatthew G. Knepley   PetscInt   *diag, *ii = a->i, i;
1768be5855fcSBarry Smith 
1769be5855fcSBarry Smith   PetscFunctionBegin;
177009f38230SBarry Smith   *missing = PETSC_FALSE;
17717734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
177209f38230SBarry Smith     *missing = PETSC_TRUE;
177309f38230SBarry Smith     if (d) *d = 0;
17749566063dSJacob Faibussowitsch     PetscCall(PetscInfo(A, "Matrix has no entries therefore is missing diagonal\n"));
177509f38230SBarry Smith   } else {
177601445905SHong Zhang     PetscInt n;
177701445905SHong Zhang     n    = PetscMin(A->rmap->n, A->cmap->n);
1778f1e2ffcdSBarry Smith     diag = a->diag;
177901445905SHong Zhang     for (i = 0; i < n; i++) {
17807734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i + 1]) {
178109f38230SBarry Smith         *missing = PETSC_TRUE;
178209f38230SBarry Smith         if (d) *d = i;
17839566063dSJacob Faibussowitsch         PetscCall(PetscInfo(A, "Matrix is missing diagonal number %" PetscInt_FMT "\n", i));
1784358d2f5dSShri Abhyankar         break;
178509f38230SBarry Smith       }
1786be5855fcSBarry Smith     }
1787be5855fcSBarry Smith   }
1788be5855fcSBarry Smith   PetscFunctionReturn(0);
1789be5855fcSBarry Smith }
1790be5855fcSBarry Smith 
17910da83c2eSBarry Smith #include <petscblaslapack.h>
17920da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
17930da83c2eSBarry Smith 
17940da83c2eSBarry Smith /*
17950da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
17960da83c2eSBarry Smith */
1797d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A, PetscInt nblocks, const PetscInt *bsizes, PetscScalar *diag)
1798d71ae5a4SJacob Faibussowitsch {
17990da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx, j, bsizemax = 0, *v_pivots;
18000da83c2eSBarry Smith   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
18010da83c2eSBarry Smith   const PetscReal shift = 0.0;
18020da83c2eSBarry Smith   PetscInt        ipvt[5];
18030da83c2eSBarry Smith   PetscScalar     work[25], *v_work;
18040da83c2eSBarry Smith 
18050da83c2eSBarry Smith   PetscFunctionBegin;
18060da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
18070da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) ncnt += bsizes[i];
180808401ef6SPierre Jolivet   PetscCheck(ncnt == n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Total blocksizes %" PetscInt_FMT " doesn't match number matrix rows %" PetscInt_FMT, ncnt, n);
1809ad540459SPierre Jolivet   for (i = 0; i < nblocks; i++) bsizemax = PetscMax(bsizemax, bsizes[i]);
18109566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(bsizemax, &indx));
181148a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscMalloc2(bsizemax, &v_work, bsizemax, &v_pivots));
18120da83c2eSBarry Smith   ncnt = 0;
18130da83c2eSBarry Smith   for (i = 0; i < nblocks; i++) {
18140da83c2eSBarry Smith     for (j = 0; j < bsizes[i]; j++) indx[j] = ncnt + j;
18159566063dSJacob Faibussowitsch     PetscCall(MatGetValues(A, bsizes[i], indx, bsizes[i], indx, diag));
18160da83c2eSBarry Smith     switch (bsizes[i]) {
1817d71ae5a4SJacob Faibussowitsch     case 1:
1818d71ae5a4SJacob Faibussowitsch       *diag = 1.0 / (*diag);
1819d71ae5a4SJacob Faibussowitsch       break;
18200da83c2eSBarry Smith     case 2:
18219566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
18220da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18239566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
18240da83c2eSBarry Smith       break;
18250da83c2eSBarry Smith     case 3:
18269566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
18270da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18289566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
18290da83c2eSBarry Smith       break;
18300da83c2eSBarry Smith     case 4:
18319566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
18320da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18339566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
18340da83c2eSBarry Smith       break;
18350da83c2eSBarry Smith     case 5:
18369566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
18370da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18389566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
18390da83c2eSBarry Smith       break;
18400da83c2eSBarry Smith     case 6:
18419566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
18420da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18439566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
18440da83c2eSBarry Smith       break;
18450da83c2eSBarry Smith     case 7:
18469566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
18470da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18489566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
18490da83c2eSBarry Smith       break;
18500da83c2eSBarry Smith     default:
18519566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bsizes[i], diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
18520da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18539566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bsizes[i]));
18540da83c2eSBarry Smith     }
18550da83c2eSBarry Smith     ncnt += bsizes[i];
18560da83c2eSBarry Smith     diag += bsizes[i] * bsizes[i];
18570da83c2eSBarry Smith   }
185848a46eb9SPierre Jolivet   if (bsizemax > 7) PetscCall(PetscFree2(v_work, v_pivots));
18599566063dSJacob Faibussowitsch   PetscCall(PetscFree(indx));
18600da83c2eSBarry Smith   PetscFunctionReturn(0);
18610da83c2eSBarry Smith }
18620da83c2eSBarry Smith 
1863422a814eSBarry Smith /*
1864422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1865422a814eSBarry Smith */
1866d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertDiagonal_SeqAIJ(Mat A, PetscScalar omega, PetscScalar fshift)
1867d71ae5a4SJacob Faibussowitsch {
186871f1c65dSBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
1869d0f46423SBarry Smith   PetscInt         i, *diag, m = A->rmap->n;
18702e5835c6SStefano Zampini   const MatScalar *v;
187154f21887SBarry Smith   PetscScalar     *idiag, *mdiag;
187271f1c65dSBarry Smith 
187371f1c65dSBarry Smith   PetscFunctionBegin;
187471f1c65dSBarry Smith   if (a->idiagvalid) PetscFunctionReturn(0);
18759566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
187671f1c65dSBarry Smith   diag = a->diag;
18774dfa11a4SJacob Faibussowitsch   if (!a->idiag) { PetscCall(PetscMalloc3(m, &a->idiag, m, &a->mdiag, m, &a->ssor_work)); }
18782e5835c6SStefano Zampini 
187971f1c65dSBarry Smith   mdiag = a->mdiag;
188071f1c65dSBarry Smith   idiag = a->idiag;
18819566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
1882422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
188371f1c65dSBarry Smith     for (i = 0; i < m; i++) {
188471f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1885899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1886899639b0SHong Zhang         if (PetscRealPart(fshift)) {
18879566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero diagonal on row %" PetscInt_FMT "\n", i));
18887b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18897b6c816cSBarry Smith           A->factorerror_zeropivot_value = 0.0;
18907b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
189198921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Zero diagonal on row %" PetscInt_FMT, i);
1892899639b0SHong Zhang       }
189371f1c65dSBarry Smith       idiag[i] = 1.0 / v[diag[i]];
189471f1c65dSBarry Smith     }
18959566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(m));
189671f1c65dSBarry Smith   } else {
189771f1c65dSBarry Smith     for (i = 0; i < m; i++) {
189871f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
189971f1c65dSBarry Smith       idiag[i] = omega / (fshift + v[diag[i]]);
190071f1c65dSBarry Smith     }
19019566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * m));
190271f1c65dSBarry Smith   }
190371f1c65dSBarry Smith   a->idiagvalid = PETSC_TRUE;
19049566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
190571f1c65dSBarry Smith   PetscFunctionReturn(0);
190671f1c65dSBarry Smith }
190771f1c65dSBarry Smith 
1908c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h>
1909d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSOR_SeqAIJ(Mat A, Vec bb, PetscReal omega, MatSORType flag, PetscReal fshift, PetscInt its, PetscInt lits, Vec xx)
1910d71ae5a4SJacob Faibussowitsch {
1911416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
1912e6d1f457SBarry Smith   PetscScalar       *x, d, sum, *t, scale;
19132e5835c6SStefano Zampini   const MatScalar   *v, *idiag = NULL, *mdiag, *aa;
191454f21887SBarry Smith   const PetscScalar *b, *bs, *xb, *ts;
19153d3eaba7SBarry Smith   PetscInt           n, m = A->rmap->n, i;
191697f1f81fSBarry Smith   const PetscInt    *idx, *diag;
191717ab2063SBarry Smith 
19183a40ed3dSBarry Smith   PetscFunctionBegin;
1919b215bc84SStefano Zampini   if (a->inode.use && a->inode.checked && omega == 1.0 && fshift == 0.0) {
19209566063dSJacob Faibussowitsch     PetscCall(MatSOR_SeqAIJ_Inode(A, bb, omega, flag, fshift, its, lits, xx));
1921b215bc84SStefano Zampini     PetscFunctionReturn(0);
1922b215bc84SStefano Zampini   }
1923b965ef7fSBarry Smith   its = its * lits;
192491723122SBarry Smith 
192571f1c65dSBarry Smith   if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
19269566063dSJacob Faibussowitsch   if (!a->idiagvalid) PetscCall(MatInvertDiagonal_SeqAIJ(A, omega, fshift));
192771f1c65dSBarry Smith   a->fshift = fshift;
192871f1c65dSBarry Smith   a->omega  = omega;
1929ed480e8bSBarry Smith 
193071f1c65dSBarry Smith   diag  = a->diag;
193171f1c65dSBarry Smith   t     = a->ssor_work;
1932ed480e8bSBarry Smith   idiag = a->idiag;
193371f1c65dSBarry Smith   mdiag = a->mdiag;
1934ed480e8bSBarry Smith 
19359566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
19369566063dSJacob Faibussowitsch   PetscCall(VecGetArray(xx, &x));
19379566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(bb, &b));
1938ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
193917ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
194017ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1941ed480e8bSBarry Smith     bs = b;
194217ab2063SBarry Smith     for (i = 0; i < m; i++) {
194371f1c65dSBarry Smith       d   = fshift + mdiag[i];
1944416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1945ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19462e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
194717ab2063SBarry Smith       sum = b[i] * d / omega;
1948003131ecSBarry Smith       PetscSparseDensePlusDot(sum, bs, v, idx, n);
194917ab2063SBarry Smith       x[i] = sum;
195017ab2063SBarry Smith     }
19519566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19529566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
19539566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
19549566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(a->nz));
19553a40ed3dSBarry Smith     PetscFunctionReturn(0);
195617ab2063SBarry Smith   }
1957c783ea89SBarry Smith 
195808401ef6SPierre Jolivet   PetscCheck(flag != SOR_APPLY_LOWER, PETSC_COMM_SELF, PETSC_ERR_SUP, "SOR_APPLY_LOWER is not implemented");
1959f7d195e4SLawrence Mitchell   if (flag & SOR_EISENSTAT) {
19604c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1961887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
196217ab2063SBarry Smith 
196317ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
196417ab2063SBarry Smith 
1965887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
196617ab2063SBarry Smith     */
196717ab2063SBarry Smith     scale = (2.0 / omega) - 1.0;
196817ab2063SBarry Smith 
196917ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
197017ab2063SBarry Smith     for (i = m - 1; i >= 0; i--) {
1971416022c9SBarry Smith       n   = a->i[i + 1] - diag[i] - 1;
1972ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
19732e5835c6SStefano Zampini       v   = aa + diag[i] + 1;
197417ab2063SBarry Smith       sum = b[i];
1975e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum, x, v, idx, n);
1976ed480e8bSBarry Smith       x[i] = sum * idiag[i];
197717ab2063SBarry Smith     }
197817ab2063SBarry Smith 
197917ab2063SBarry Smith     /*  t = b - (2*E - D)x */
19802e5835c6SStefano Zampini     v = aa;
19812205254eSKarl Rupp     for (i = 0; i < m; i++) t[i] = b[i] - scale * (v[*diag++]) * x[i];
198217ab2063SBarry Smith 
198317ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1984ed480e8bSBarry Smith     ts   = t;
1985416022c9SBarry Smith     diag = a->diag;
198617ab2063SBarry Smith     for (i = 0; i < m; i++) {
1987416022c9SBarry Smith       n   = diag[i] - a->i[i];
1988ed480e8bSBarry Smith       idx = a->j + a->i[i];
19892e5835c6SStefano Zampini       v   = aa + a->i[i];
199017ab2063SBarry Smith       sum = t[i];
1991003131ecSBarry Smith       PetscSparseDenseMinusDot(sum, ts, v, idx, n);
1992ed480e8bSBarry Smith       t[i] = sum * idiag[i];
1993733d66baSBarry Smith       /*  x = x + t */
1994733d66baSBarry Smith       x[i] += t[i];
199517ab2063SBarry Smith     }
199617ab2063SBarry Smith 
19979566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(6.0 * m - 1 + 2.0 * a->nz));
19989566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(xx, &x));
19999566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(bb, &b));
20003a40ed3dSBarry Smith     PetscFunctionReturn(0);
200117ab2063SBarry Smith   }
200217ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
200317ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
200417ab2063SBarry Smith       for (i = 0; i < m; i++) {
2005416022c9SBarry Smith         n   = diag[i] - a->i[i];
2006ed480e8bSBarry Smith         idx = a->j + a->i[i];
20072e5835c6SStefano Zampini         v   = aa + a->i[i];
200817ab2063SBarry Smith         sum = b[i];
2009e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20105c99c7daSBarry Smith         t[i] = sum;
2011ed480e8bSBarry Smith         x[i] = sum * idiag[i];
201217ab2063SBarry Smith       }
20135c99c7daSBarry Smith       xb = t;
20149566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz));
20153a40ed3dSBarry Smith     } else xb = b;
201617ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
201717ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2018416022c9SBarry Smith         n   = a->i[i + 1] - diag[i] - 1;
2019ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
20202e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
202117ab2063SBarry Smith         sum = xb[i];
2022e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
20235c99c7daSBarry Smith         if (xb == b) {
2024ed480e8bSBarry Smith           x[i] = sum * idiag[i];
20255c99c7daSBarry Smith         } else {
2026b19a5dc2SMark Adams           x[i] = (1 - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
202717ab2063SBarry Smith         }
20285c99c7daSBarry Smith       }
20299566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
203017ab2063SBarry Smith     }
203117ab2063SBarry Smith     its--;
203217ab2063SBarry Smith   }
203317ab2063SBarry Smith   while (its--) {
203417ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
203517ab2063SBarry Smith       for (i = 0; i < m; i++) {
2036b19a5dc2SMark Adams         /* lower */
2037b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
2038ed480e8bSBarry Smith         idx = a->j + a->i[i];
20392e5835c6SStefano Zampini         v   = aa + a->i[i];
204017ab2063SBarry Smith         sum = b[i];
2041e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2042b19a5dc2SMark Adams         t[i] = sum; /* save application of the lower-triangular part */
2043b19a5dc2SMark Adams         /* upper */
2044b19a5dc2SMark Adams         n   = a->i[i + 1] - diag[i] - 1;
2045b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
20462e5835c6SStefano Zampini         v   = aa + diag[i] + 1;
2047b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum, x, v, idx, n);
2048b19a5dc2SMark Adams         x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
204917ab2063SBarry Smith       }
2050b19a5dc2SMark Adams       xb = t;
20519566063dSJacob Faibussowitsch       PetscCall(PetscLogFlops(2.0 * a->nz));
2052b19a5dc2SMark Adams     } else xb = b;
205317ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
205417ab2063SBarry Smith       for (i = m - 1; i >= 0; i--) {
2055b19a5dc2SMark Adams         sum = xb[i];
2056b19a5dc2SMark Adams         if (xb == b) {
2057b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
2058416022c9SBarry Smith           n   = a->i[i + 1] - a->i[i];
2059ed480e8bSBarry Smith           idx = a->j + a->i[i];
20602e5835c6SStefano Zampini           v   = aa + a->i[i];
2061e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2062ed480e8bSBarry Smith           x[i] = (1. - omega) * x[i] + (sum + mdiag[i] * x[i]) * idiag[i];
2063b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
2064b19a5dc2SMark Adams           n   = a->i[i + 1] - diag[i] - 1;
2065b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
20662e5835c6SStefano Zampini           v   = aa + diag[i] + 1;
2067b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum, x, v, idx, n);
2068b19a5dc2SMark Adams           x[i] = (1. - omega) * x[i] + sum * idiag[i]; /* omega in idiag */
206917ab2063SBarry Smith         }
2070b19a5dc2SMark Adams       }
2071b19a5dc2SMark Adams       if (xb == b) {
20729566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(2.0 * a->nz));
2073b19a5dc2SMark Adams       } else {
20749566063dSJacob Faibussowitsch         PetscCall(PetscLogFlops(a->nz)); /* assumes 1/2 in upper */
2075b19a5dc2SMark Adams       }
207617ab2063SBarry Smith     }
207717ab2063SBarry Smith   }
20789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
20799566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(xx, &x));
20809566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(bb, &b));
2081365a8a9eSBarry Smith   PetscFunctionReturn(0);
208217ab2063SBarry Smith }
208317ab2063SBarry Smith 
2084d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetInfo_SeqAIJ(Mat A, MatInfoType flag, MatInfo *info)
2085d71ae5a4SJacob Faibussowitsch {
2086416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
20874e220ebcSLois Curfman McInnes 
20883a40ed3dSBarry Smith   PetscFunctionBegin;
20894e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
20903966268fSBarry Smith   info->nz_allocated = a->maxnz;
20913966268fSBarry Smith   info->nz_used      = a->nz;
20923966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
20933966268fSBarry Smith   info->assemblies   = A->num_ass;
20943966268fSBarry Smith   info->mallocs      = A->info.mallocs;
20954dfa11a4SJacob Faibussowitsch   info->memory       = 0; /* REVIEW ME */
2096d5f3da31SBarry Smith   if (A->factortype) {
20974e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
20984e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
20994e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
21004e220ebcSLois Curfman McInnes   } else {
21014e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
21024e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
21034e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
21044e220ebcSLois Curfman McInnes   }
21053a40ed3dSBarry Smith   PetscFunctionReturn(0);
210617ab2063SBarry Smith }
210717ab2063SBarry Smith 
2108d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRows_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2109d71ae5a4SJacob Faibussowitsch {
2110416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2111c7da8527SEric Chamberland   PetscInt           i, m = A->rmap->n - 1;
211297b48c8fSBarry Smith   const PetscScalar *xx;
21132e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
2114c7da8527SEric Chamberland   PetscInt           d = 0;
211517ab2063SBarry Smith 
21163a40ed3dSBarry Smith   PetscFunctionBegin;
211797b48c8fSBarry Smith   if (x && b) {
21189566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21199566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
212097b48c8fSBarry Smith     for (i = 0; i < N; i++) {
2121aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2122447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
212397b48c8fSBarry Smith       bb[rows[i]] = diag * xx[rows[i]];
212497b48c8fSBarry Smith     }
21259566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
21269566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
212797b48c8fSBarry Smith   }
212897b48c8fSBarry Smith 
21299566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
2130a9817697SBarry Smith   if (a->keepnonzeropattern) {
2131f1e2ffcdSBarry Smith     for (i = 0; i < N; i++) {
2132aed4548fSBarry Smith       PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21339566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
2134f1e2ffcdSBarry Smith     }
2135f4df32b1SMatthew Knepley     if (diag != 0.0) {
2136c7da8527SEric Chamberland       for (i = 0; i < N; i++) {
2137c7da8527SEric Chamberland         d = rows[i];
2138447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
213908401ef6SPierre Jolivet         PetscCheck(a->diag[d] < a->i[d + 1], PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in the zeroed row %" PetscInt_FMT, d);
2140c7da8527SEric Chamberland       }
2141f1e2ffcdSBarry Smith       for (i = 0; i < N; i++) {
2142447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
21432e5835c6SStefano Zampini         aa[a->diag[rows[i]]] = diag;
2144f1e2ffcdSBarry Smith       }
2145f1e2ffcdSBarry Smith     }
2146f1e2ffcdSBarry Smith   } else {
2147f4df32b1SMatthew Knepley     if (diag != 0.0) {
214817ab2063SBarry Smith       for (i = 0; i < N; i++) {
2149aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21507ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2151447d62f5SStefano Zampini           if (rows[i] >= A->cmap->n) {
2152447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2153447d62f5SStefano Zampini           } else {
2154416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
21552e5835c6SStefano Zampini             aa[a->i[rows[i]]]   = diag;
2156bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2157447d62f5SStefano Zampini           }
2158447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
21599566063dSJacob Faibussowitsch           PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
216017ab2063SBarry Smith         }
216117ab2063SBarry Smith       }
21623a40ed3dSBarry Smith     } else {
216317ab2063SBarry Smith       for (i = 0; i < N; i++) {
2164aed4548fSBarry Smith         PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
2165416022c9SBarry Smith         a->ilen[rows[i]] = 0;
216617ab2063SBarry Smith       }
216717ab2063SBarry Smith     }
2168e56f5c9eSBarry Smith     A->nonzerostate++;
2169f1e2ffcdSBarry Smith   }
21709566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2171dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
21723a40ed3dSBarry Smith   PetscFunctionReturn(0);
217317ab2063SBarry Smith }
217417ab2063SBarry Smith 
2175d71ae5a4SJacob Faibussowitsch PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A, PetscInt N, const PetscInt rows[], PetscScalar diag, Vec x, Vec b)
2176d71ae5a4SJacob Faibussowitsch {
21776e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
21786e169961SBarry Smith   PetscInt           i, j, m = A->rmap->n - 1, d = 0;
21792b40b63fSBarry Smith   PetscBool          missing, *zeroed, vecs = PETSC_FALSE;
21806e169961SBarry Smith   const PetscScalar *xx;
21812e5835c6SStefano Zampini   PetscScalar       *bb, *aa;
21826e169961SBarry Smith 
21836e169961SBarry Smith   PetscFunctionBegin;
21842e5835c6SStefano Zampini   if (!N) PetscFunctionReturn(0);
21859566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &aa));
21866e169961SBarry Smith   if (x && b) {
21879566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(x, &xx));
21889566063dSJacob Faibussowitsch     PetscCall(VecGetArray(b, &bb));
21892b40b63fSBarry Smith     vecs = PETSC_TRUE;
21906e169961SBarry Smith   }
21919566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(A->rmap->n, &zeroed));
21926e169961SBarry Smith   for (i = 0; i < N; i++) {
2193aed4548fSBarry Smith     PetscCheck(rows[i] >= 0 && rows[i] <= m, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "row %" PetscInt_FMT " out of range", rows[i]);
21949566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(&aa[a->i[rows[i]]], a->ilen[rows[i]]));
21952205254eSKarl Rupp 
21966e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
21976e169961SBarry Smith   }
21986e169961SBarry Smith   for (i = 0; i < A->rmap->n; i++) {
21996e169961SBarry Smith     if (!zeroed[i]) {
22006e169961SBarry Smith       for (j = a->i[i]; j < a->i[i + 1]; j++) {
22014cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
22022e5835c6SStefano Zampini           if (vecs) bb[i] -= aa[j] * xx[a->j[j]];
22032e5835c6SStefano Zampini           aa[j] = 0.0;
22046e169961SBarry Smith         }
22056e169961SBarry Smith       }
22064cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag * xx[i];
22076e169961SBarry Smith   }
22086e169961SBarry Smith   if (x && b) {
22099566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(x, &xx));
22109566063dSJacob Faibussowitsch     PetscCall(VecRestoreArray(b, &bb));
22116e169961SBarry Smith   }
22129566063dSJacob Faibussowitsch   PetscCall(PetscFree(zeroed));
22136e169961SBarry Smith   if (diag != 0.0) {
22149566063dSJacob Faibussowitsch     PetscCall(MatMissingDiagonal_SeqAIJ(A, &missing, &d));
22151d5a398dSstefano_zampini     if (missing) {
22161d5a398dSstefano_zampini       for (i = 0; i < N; i++) {
22174cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
2218aed4548fSBarry Smith         PetscCheck(!a->nonew || rows[i] < d, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Matrix is missing diagonal entry in row %" PetscInt_FMT " (%" PetscInt_FMT ")", d, rows[i]);
22199566063dSJacob Faibussowitsch         PetscCall(MatSetValues_SeqAIJ(A, 1, &rows[i], 1, &rows[i], &diag, INSERT_VALUES));
22201d5a398dSstefano_zampini       }
22211d5a398dSstefano_zampini     } else {
2222ad540459SPierre Jolivet       for (i = 0; i < N; i++) aa[a->diag[rows[i]]] = diag;
22236e169961SBarry Smith     }
22241d5a398dSstefano_zampini   }
22259566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &aa));
2226dbbe0bcdSBarry Smith   PetscUseTypeMethod(A, assemblyend, MAT_FINAL_ASSEMBLY);
22276e169961SBarry Smith   PetscFunctionReturn(0);
22286e169961SBarry Smith }
22296e169961SBarry Smith 
2230d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2231d71ae5a4SJacob Faibussowitsch {
2232fff043a9SJunchao Zhang   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2233fff043a9SJunchao Zhang   const PetscScalar *aa;
2234fff043a9SJunchao Zhang   PetscInt          *itmp;
223517ab2063SBarry Smith 
22363a40ed3dSBarry Smith   PetscFunctionBegin;
22379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
2238416022c9SBarry Smith   *nz = a->i[row + 1] - a->i[row];
22392e5835c6SStefano Zampini   if (v) *v = (PetscScalar *)(aa + a->i[row]);
224017ab2063SBarry Smith   if (idx) {
2241bfeeae90SHong Zhang     itmp = a->j + a->i[row];
224226fbe8dcSKarl Rupp     if (*nz) *idx = itmp;
2243f4259b30SLisandro Dalcin     else *idx = NULL;
224417ab2063SBarry Smith   }
22459566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
22463a40ed3dSBarry Smith   PetscFunctionReturn(0);
224717ab2063SBarry Smith }
224817ab2063SBarry Smith 
2249d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRestoreRow_SeqAIJ(Mat A, PetscInt row, PetscInt *nz, PetscInt **idx, PetscScalar **v)
2250d71ae5a4SJacob Faibussowitsch {
22513a40ed3dSBarry Smith   PetscFunctionBegin;
2252cb4a9cd9SHong Zhang   if (nz) *nz = 0;
22532e5835c6SStefano Zampini   if (idx) *idx = NULL;
22542e5835c6SStefano Zampini   if (v) *v = NULL;
22553a40ed3dSBarry Smith   PetscFunctionReturn(0);
225617ab2063SBarry Smith }
225717ab2063SBarry Smith 
2258d71ae5a4SJacob Faibussowitsch PetscErrorCode MatNorm_SeqAIJ(Mat A, NormType type, PetscReal *nrm)
2259d71ae5a4SJacob Faibussowitsch {
2260416022c9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
22612e5835c6SStefano Zampini   const MatScalar *v;
226236db0b34SBarry Smith   PetscReal        sum = 0.0;
226397f1f81fSBarry Smith   PetscInt         i, j;
226417ab2063SBarry Smith 
22653a40ed3dSBarry Smith   PetscFunctionBegin;
22669566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &v));
226717ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2268570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2269570b7f6dSBarry Smith     PetscBLASInt one = 1, nz = a->nz;
2270792fecdfSBarry Smith     PetscCallBLAS("BLASnrm2", *nrm = BLASnrm2_(&nz, v, &one));
2271570b7f6dSBarry Smith #else
2272416022c9SBarry Smith     for (i = 0; i < a->nz; i++) {
22739371c9d4SSatish Balay       sum += PetscRealPart(PetscConj(*v) * (*v));
22749371c9d4SSatish Balay       v++;
227517ab2063SBarry Smith     }
22768f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2277570b7f6dSBarry Smith #endif
22789566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * a->nz));
22793a40ed3dSBarry Smith   } else if (type == NORM_1) {
228036db0b34SBarry Smith     PetscReal *tmp;
228197f1f81fSBarry Smith     PetscInt  *jj = a->j;
22829566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(A->cmap->n + 1, &tmp));
2283064f8208SBarry Smith     *nrm = 0.0;
2284416022c9SBarry Smith     for (j = 0; j < a->nz; j++) {
22859371c9d4SSatish Balay       tmp[*jj++] += PetscAbsScalar(*v);
22869371c9d4SSatish Balay       v++;
228717ab2063SBarry Smith     }
2288d0f46423SBarry Smith     for (j = 0; j < A->cmap->n; j++) {
2289064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
229017ab2063SBarry Smith     }
22919566063dSJacob Faibussowitsch     PetscCall(PetscFree(tmp));
22929566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
22933a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2294064f8208SBarry Smith     *nrm = 0.0;
2295d0f46423SBarry Smith     for (j = 0; j < A->rmap->n; j++) {
22962e5835c6SStefano Zampini       const PetscScalar *v2 = v + a->i[j];
229717ab2063SBarry Smith       sum                   = 0.0;
2298416022c9SBarry Smith       for (i = 0; i < a->i[j + 1] - a->i[j]; i++) {
22999371c9d4SSatish Balay         sum += PetscAbsScalar(*v2);
23009371c9d4SSatish Balay         v2++;
230117ab2063SBarry Smith       }
2302064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
230317ab2063SBarry Smith     }
23049566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(PetscMax(a->nz - 1, 0)));
2305f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_SUP, "No support for two norm");
23069566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &v));
23073a40ed3dSBarry Smith   PetscFunctionReturn(0);
230817ab2063SBarry Smith }
230917ab2063SBarry Smith 
2310d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2311d71ae5a4SJacob Faibussowitsch {
23123d3eaba7SBarry Smith   Mat_SeqAIJ      *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
231354f21887SBarry Smith   PetscInt        *adx, *bdx, *aii, *bii, *aptr, *bptr;
23142e5835c6SStefano Zampini   const MatScalar *va, *vb;
231597f1f81fSBarry Smith   PetscInt         ma, na, mb, nb, i;
2316cd0d46ebSvictorle 
2317cd0d46ebSvictorle   PetscFunctionBegin;
23189566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23199566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23205485867bSBarry Smith   if (ma != nb || na != mb) {
23215485867bSBarry Smith     *f = PETSC_FALSE;
23225485867bSBarry Smith     PetscFunctionReturn(0);
23235485867bSBarry Smith   }
23249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &va));
23259566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &vb));
23269371c9d4SSatish Balay   aii = aij->i;
23279371c9d4SSatish Balay   bii = bij->i;
23289371c9d4SSatish Balay   adx = aij->j;
23299371c9d4SSatish Balay   bdx = bij->j;
23309566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23319566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
2332cd0d46ebSvictorle   for (i = 0; i < ma; i++) aptr[i] = aii[i];
2333cd0d46ebSvictorle   for (i = 0; i < mb; i++) bptr[i] = bii[i];
2334cd0d46ebSvictorle 
2335cd0d46ebSvictorle   *f = PETSC_TRUE;
2336cd0d46ebSvictorle   for (i = 0; i < ma; i++) {
2337cd0d46ebSvictorle     while (aptr[i] < aii[i + 1]) {
233897f1f81fSBarry Smith       PetscInt    idc, idr;
23395485867bSBarry Smith       PetscScalar vc, vr;
2340cd0d46ebSvictorle       /* column/row index/value */
23415485867bSBarry Smith       idc = adx[aptr[i]];
23425485867bSBarry Smith       idr = bdx[bptr[idc]];
23435485867bSBarry Smith       vc  = va[aptr[i]];
23445485867bSBarry Smith       vr  = vb[bptr[idc]];
23455485867bSBarry Smith       if (i != idr || PetscAbsScalar(vc - vr) > tol) {
23465485867bSBarry Smith         *f = PETSC_FALSE;
23475485867bSBarry Smith         goto done;
2348cd0d46ebSvictorle       } else {
23495485867bSBarry Smith         aptr[i]++;
23505485867bSBarry Smith         if (B || i != idc) bptr[idc]++;
2351cd0d46ebSvictorle       }
2352cd0d46ebSvictorle     }
2353cd0d46ebSvictorle   }
2354cd0d46ebSvictorle done:
23559566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
23569566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
23579566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &va));
23589566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &vb));
2359cd0d46ebSvictorle   PetscFunctionReturn(0);
2360cd0d46ebSvictorle }
2361cd0d46ebSvictorle 
2362d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitianTranspose_SeqAIJ(Mat A, Mat B, PetscReal tol, PetscBool *f)
2363d71ae5a4SJacob Faibussowitsch {
23643d3eaba7SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data, *bij = (Mat_SeqAIJ *)B->data;
236554f21887SBarry Smith   PetscInt   *adx, *bdx, *aii, *bii, *aptr, *bptr;
236654f21887SBarry Smith   MatScalar  *va, *vb;
23671cbb95d3SBarry Smith   PetscInt    ma, na, mb, nb, i;
23681cbb95d3SBarry Smith 
23691cbb95d3SBarry Smith   PetscFunctionBegin;
23709566063dSJacob Faibussowitsch   PetscCall(MatGetSize(A, &ma, &na));
23719566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &mb, &nb));
23721cbb95d3SBarry Smith   if (ma != nb || na != mb) {
23731cbb95d3SBarry Smith     *f = PETSC_FALSE;
23741cbb95d3SBarry Smith     PetscFunctionReturn(0);
23751cbb95d3SBarry Smith   }
23769371c9d4SSatish Balay   aii = aij->i;
23779371c9d4SSatish Balay   bii = bij->i;
23789371c9d4SSatish Balay   adx = aij->j;
23799371c9d4SSatish Balay   bdx = bij->j;
23809371c9d4SSatish Balay   va  = aij->a;
23819371c9d4SSatish Balay   vb  = bij->a;
23829566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ma, &aptr));
23839566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(mb, &bptr));
23841cbb95d3SBarry Smith   for (i = 0; i < ma; i++) aptr[i] = aii[i];
23851cbb95d3SBarry Smith   for (i = 0; i < mb; i++) bptr[i] = bii[i];
23861cbb95d3SBarry Smith 
23871cbb95d3SBarry Smith   *f = PETSC_TRUE;
23881cbb95d3SBarry Smith   for (i = 0; i < ma; i++) {
23891cbb95d3SBarry Smith     while (aptr[i] < aii[i + 1]) {
23901cbb95d3SBarry Smith       PetscInt    idc, idr;
23911cbb95d3SBarry Smith       PetscScalar vc, vr;
23921cbb95d3SBarry Smith       /* column/row index/value */
23931cbb95d3SBarry Smith       idc = adx[aptr[i]];
23941cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
23951cbb95d3SBarry Smith       vc  = va[aptr[i]];
23961cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
23971cbb95d3SBarry Smith       if (i != idr || PetscAbsScalar(vc - PetscConj(vr)) > tol) {
23981cbb95d3SBarry Smith         *f = PETSC_FALSE;
23991cbb95d3SBarry Smith         goto done;
24001cbb95d3SBarry Smith       } else {
24011cbb95d3SBarry Smith         aptr[i]++;
24021cbb95d3SBarry Smith         if (B || i != idc) bptr[idc]++;
24031cbb95d3SBarry Smith       }
24041cbb95d3SBarry Smith     }
24051cbb95d3SBarry Smith   }
24061cbb95d3SBarry Smith done:
24079566063dSJacob Faibussowitsch   PetscCall(PetscFree(aptr));
24089566063dSJacob Faibussowitsch   PetscCall(PetscFree(bptr));
24091cbb95d3SBarry Smith   PetscFunctionReturn(0);
24101cbb95d3SBarry Smith }
24111cbb95d3SBarry Smith 
2412d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A, PetscReal tol, PetscBool *f)
2413d71ae5a4SJacob Faibussowitsch {
24149e29f15eSvictorle   PetscFunctionBegin;
24159566063dSJacob Faibussowitsch   PetscCall(MatIsTranspose_SeqAIJ(A, A, tol, f));
24169e29f15eSvictorle   PetscFunctionReturn(0);
24179e29f15eSvictorle }
24189e29f15eSvictorle 
2419d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIsHermitian_SeqAIJ(Mat A, PetscReal tol, PetscBool *f)
2420d71ae5a4SJacob Faibussowitsch {
24211cbb95d3SBarry Smith   PetscFunctionBegin;
24229566063dSJacob Faibussowitsch   PetscCall(MatIsHermitianTranspose_SeqAIJ(A, A, tol, f));
24231cbb95d3SBarry Smith   PetscFunctionReturn(0);
24241cbb95d3SBarry Smith }
24251cbb95d3SBarry Smith 
2426d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A, Vec ll, Vec rr)
2427d71ae5a4SJacob Faibussowitsch {
2428416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2429fff8e43fSBarry Smith   const PetscScalar *l, *r;
2430fff8e43fSBarry Smith   PetscScalar        x;
243154f21887SBarry Smith   MatScalar         *v;
2432fff8e43fSBarry Smith   PetscInt           i, j, m = A->rmap->n, n = A->cmap->n, M, nz = a->nz;
2433fff8e43fSBarry Smith   const PetscInt    *jj;
243417ab2063SBarry Smith 
24353a40ed3dSBarry Smith   PetscFunctionBegin;
243617ab2063SBarry Smith   if (ll) {
24373ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
24383ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
24399566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(ll, &m));
244008401ef6SPierre Jolivet     PetscCheck(m == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Left scaling vector wrong length");
24419566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(ll, &l));
24429566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
244317ab2063SBarry Smith     for (i = 0; i < m; i++) {
244417ab2063SBarry Smith       x = l[i];
2445416022c9SBarry Smith       M = a->i[i + 1] - a->i[i];
24462205254eSKarl Rupp       for (j = 0; j < M; j++) (*v++) *= x;
244717ab2063SBarry Smith     }
24489566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(ll, &l));
24499566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
24509566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
245117ab2063SBarry Smith   }
245217ab2063SBarry Smith   if (rr) {
24539566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(rr, &n));
245408401ef6SPierre Jolivet     PetscCheck(n == A->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Right scaling vector wrong length");
24559566063dSJacob Faibussowitsch     PetscCall(VecGetArrayRead(rr, &r));
24569566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(A, &v));
24572e5835c6SStefano Zampini     jj = a->j;
24582205254eSKarl Rupp     for (i = 0; i < nz; i++) (*v++) *= r[*jj++];
24599566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(A, &v));
24609566063dSJacob Faibussowitsch     PetscCall(VecRestoreArrayRead(rr, &r));
24619566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(nz));
246217ab2063SBarry Smith   }
24639566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
24643a40ed3dSBarry Smith   PetscFunctionReturn(0);
246517ab2063SBarry Smith }
246617ab2063SBarry Smith 
2467d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A, IS isrow, IS iscol, PetscInt csize, MatReuse scall, Mat *B)
2468d71ae5a4SJacob Faibussowitsch {
2469db02288aSLois Curfman McInnes   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *c;
2470d0f46423SBarry Smith   PetscInt          *smap, i, k, kstart, kend, oldcols = A->cmap->n, *lens;
247197f1f81fSBarry Smith   PetscInt           row, mat_i, *mat_j, tcol, first, step, *mat_ilen, sum, lensi;
24725d0c19d7SBarry Smith   const PetscInt    *irow, *icol;
24732e5835c6SStefano Zampini   const PetscScalar *aa;
24745d0c19d7SBarry Smith   PetscInt           nrows, ncols;
247597f1f81fSBarry Smith   PetscInt          *starts, *j_new, *i_new, *aj = a->j, *ai = a->i, ii, *ailen = a->ilen;
247654f21887SBarry Smith   MatScalar         *a_new, *mat_a;
2477416022c9SBarry Smith   Mat                C;
2478cdc6f3adSToby Isaac   PetscBool          stride;
247917ab2063SBarry Smith 
24803a40ed3dSBarry Smith   PetscFunctionBegin;
24819566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(isrow, &irow));
24829566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(isrow, &nrows));
24839566063dSJacob Faibussowitsch   PetscCall(ISGetLocalSize(iscol, &ncols));
248417ab2063SBarry Smith 
24859566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)iscol, ISSTRIDE, &stride));
2486ff718158SBarry Smith   if (stride) {
24879566063dSJacob Faibussowitsch     PetscCall(ISStrideGetInfo(iscol, &first, &step));
2488ff718158SBarry Smith   } else {
2489ff718158SBarry Smith     first = 0;
2490ff718158SBarry Smith     step  = 0;
2491ff718158SBarry Smith   }
2492fee21e36SBarry Smith   if (stride && step == 1) {
249302834360SBarry Smith     /* special case of contiguous rows */
24949566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(nrows, &lens, nrows, &starts));
249502834360SBarry Smith     /* loop over new rows determining lens and starting points */
249602834360SBarry Smith     for (i = 0; i < nrows; i++) {
2497bfeeae90SHong Zhang       kstart    = ai[irow[i]];
2498a2744918SBarry Smith       kend      = kstart + ailen[irow[i]];
2499a91a9bebSLisandro Dalcin       starts[i] = kstart;
250002834360SBarry Smith       for (k = kstart; k < kend; k++) {
2501bfeeae90SHong Zhang         if (aj[k] >= first) {
250202834360SBarry Smith           starts[i] = k;
250302834360SBarry Smith           break;
250402834360SBarry Smith         }
250502834360SBarry Smith       }
2506a2744918SBarry Smith       sum = 0;
250702834360SBarry Smith       while (k < kend) {
2508bfeeae90SHong Zhang         if (aj[k++] >= first + ncols) break;
2509a2744918SBarry Smith         sum++;
251002834360SBarry Smith       }
2511a2744918SBarry Smith       lens[i] = sum;
251202834360SBarry Smith     }
251302834360SBarry Smith     /* create submatrix */
2514cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
251597f1f81fSBarry Smith       PetscInt n_cols, n_rows;
25169566063dSJacob Faibussowitsch       PetscCall(MatGetSize(*B, &n_rows, &n_cols));
2517aed4548fSBarry Smith       PetscCheck(n_rows == nrows && n_cols == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Reused submatrix wrong size");
25189566063dSJacob Faibussowitsch       PetscCall(MatZeroEntries(*B));
251908480c60SBarry Smith       C = *B;
25203a40ed3dSBarry Smith     } else {
25213bef6203SJed Brown       PetscInt rbs, cbs;
25229566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25239566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25249566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25259566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25269566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25279566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25289566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
252908480c60SBarry Smith     }
2530db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ *)C->data;
2531db02288aSLois Curfman McInnes 
253202834360SBarry Smith     /* loop over rows inserting into submatrix */
2533db02288aSLois Curfman McInnes     a_new = c->a;
2534db02288aSLois Curfman McInnes     j_new = c->j;
2535db02288aSLois Curfman McInnes     i_new = c->i;
25369566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
253702834360SBarry Smith     for (i = 0; i < nrows; i++) {
2538a2744918SBarry Smith       ii    = starts[i];
2539a2744918SBarry Smith       lensi = lens[i];
2540ad540459SPierre Jolivet       for (k = 0; k < lensi; k++) *j_new++ = aj[ii + k] - first;
25419566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(a_new, aa + starts[i], lensi));
2542a2744918SBarry Smith       a_new += lensi;
2543a2744918SBarry Smith       i_new[i + 1] = i_new[i] + lensi;
2544a2744918SBarry Smith       c->ilen[i]   = lensi;
254502834360SBarry Smith     }
25469566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
25479566063dSJacob Faibussowitsch     PetscCall(PetscFree2(lens, starts));
25483a40ed3dSBarry Smith   } else {
25499566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(iscol, &icol));
25509566063dSJacob Faibussowitsch     PetscCall(PetscCalloc1(oldcols, &smap));
25519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(1 + nrows, &lens));
25524dcab191SBarry Smith     for (i = 0; i < ncols; i++) {
25536bdcaf15SBarry Smith       PetscCheck(icol[i] < oldcols, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Requesting column beyond largest column icol[%" PetscInt_FMT "] %" PetscInt_FMT " >= A->cmap->n %" PetscInt_FMT, i, icol[i], oldcols);
25544dcab191SBarry Smith       smap[icol[i]] = i + 1;
25554dcab191SBarry Smith     }
25564dcab191SBarry Smith 
255702834360SBarry Smith     /* determine lens of each row */
255802834360SBarry Smith     for (i = 0; i < nrows; i++) {
2559bfeeae90SHong Zhang       kstart  = ai[irow[i]];
256002834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
256102834360SBarry Smith       lens[i] = 0;
256202834360SBarry Smith       for (k = kstart; k < kend; k++) {
2563ad540459SPierre Jolivet         if (smap[aj[k]]) lens[i]++;
256402834360SBarry Smith       }
256502834360SBarry Smith     }
256617ab2063SBarry Smith     /* Create and fill new matrix */
2567a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2568ace3abfcSBarry Smith       PetscBool equal;
25690f5bd95cSBarry Smith 
257099141d43SSatish Balay       c = (Mat_SeqAIJ *)((*B)->data);
2571aed4548fSBarry Smith       PetscCheck((*B)->rmap->n == nrows && (*B)->cmap->n == ncols, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong size");
25729566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(c->ilen, lens, (*B)->rmap->n, &equal));
257328b400f6SJacob Faibussowitsch       PetscCheck(equal, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Cannot reuse matrix. wrong no of nonzeros");
25749566063dSJacob Faibussowitsch       PetscCall(PetscArrayzero(c->ilen, (*B)->rmap->n));
257508480c60SBarry Smith       C = *B;
25763a40ed3dSBarry Smith     } else {
25773bef6203SJed Brown       PetscInt rbs, cbs;
25789566063dSJacob Faibussowitsch       PetscCall(MatCreate(PetscObjectComm((PetscObject)A), &C));
25799566063dSJacob Faibussowitsch       PetscCall(MatSetSizes(C, nrows, ncols, PETSC_DETERMINE, PETSC_DETERMINE));
25809566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(isrow, &rbs));
25819566063dSJacob Faibussowitsch       PetscCall(ISGetBlockSize(iscol, &cbs));
25829566063dSJacob Faibussowitsch       PetscCall(MatSetBlockSizes(C, rbs, cbs));
25839566063dSJacob Faibussowitsch       PetscCall(MatSetType(C, ((PetscObject)A)->type_name));
25849566063dSJacob Faibussowitsch       PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(C, 0, lens));
258508480c60SBarry Smith     }
25869566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
258799141d43SSatish Balay     c = (Mat_SeqAIJ *)(C->data);
258817ab2063SBarry Smith     for (i = 0; i < nrows; i++) {
258999141d43SSatish Balay       row      = irow[i];
2590bfeeae90SHong Zhang       kstart   = ai[row];
259199141d43SSatish Balay       kend     = kstart + a->ilen[row];
2592bfeeae90SHong Zhang       mat_i    = c->i[i];
259399141d43SSatish Balay       mat_j    = c->j + mat_i;
259499141d43SSatish Balay       mat_a    = c->a + mat_i;
259599141d43SSatish Balay       mat_ilen = c->ilen + i;
259617ab2063SBarry Smith       for (k = kstart; k < kend; k++) {
2597bfeeae90SHong Zhang         if ((tcol = smap[a->j[k]])) {
2598ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
25992e5835c6SStefano Zampini           *mat_a++ = aa[k];
260099141d43SSatish Balay           (*mat_ilen)++;
260117ab2063SBarry Smith         }
260217ab2063SBarry Smith       }
260317ab2063SBarry Smith     }
26049566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
260502834360SBarry Smith     /* Free work space */
26069566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(iscol, &icol));
26079566063dSJacob Faibussowitsch     PetscCall(PetscFree(smap));
26089566063dSJacob Faibussowitsch     PetscCall(PetscFree(lens));
2609cdc6f3adSToby Isaac     /* sort */
2610cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2611cdc6f3adSToby Isaac       PetscInt ilen;
2612cdc6f3adSToby Isaac 
2613cdc6f3adSToby Isaac       mat_i = c->i[i];
2614cdc6f3adSToby Isaac       mat_j = c->j + mat_i;
2615cdc6f3adSToby Isaac       mat_a = c->a + mat_i;
2616cdc6f3adSToby Isaac       ilen  = c->ilen[i];
26179566063dSJacob Faibussowitsch       PetscCall(PetscSortIntWithScalarArray(ilen, mat_j, mat_a));
2618cdc6f3adSToby Isaac     }
261902834360SBarry Smith   }
26208c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
26219566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(C, A->boundtocpu));
2622305c6ccfSStefano Zampini #endif
26239566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(C, MAT_FINAL_ASSEMBLY));
26249566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(C, MAT_FINAL_ASSEMBLY));
262517ab2063SBarry Smith 
26269566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(isrow, &irow));
2627416022c9SBarry Smith   *B = C;
26283a40ed3dSBarry Smith   PetscFunctionReturn(0);
262917ab2063SBarry Smith }
263017ab2063SBarry Smith 
2631d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetMultiProcBlock_SeqAIJ(Mat mat, MPI_Comm subComm, MatReuse scall, Mat *subMat)
2632d71ae5a4SJacob Faibussowitsch {
263382d44351SHong Zhang   Mat B;
263482d44351SHong Zhang 
263582d44351SHong Zhang   PetscFunctionBegin;
2636c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
26379566063dSJacob Faibussowitsch     PetscCall(MatCreate(subComm, &B));
26389566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(B, mat->rmap->n, mat->cmap->n, mat->rmap->n, mat->cmap->n));
26399566063dSJacob Faibussowitsch     PetscCall(MatSetBlockSizesFromMats(B, mat, mat));
26409566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, MATSEQAIJ));
26419566063dSJacob Faibussowitsch     PetscCall(MatDuplicateNoCreate_SeqAIJ(B, mat, MAT_COPY_VALUES, PETSC_TRUE));
264282d44351SHong Zhang     *subMat = B;
2643c2d650bdSHong Zhang   } else {
26449566063dSJacob Faibussowitsch     PetscCall(MatCopy_SeqAIJ(mat, *subMat, SAME_NONZERO_PATTERN));
2645c2d650bdSHong Zhang   }
264682d44351SHong Zhang   PetscFunctionReturn(0);
264782d44351SHong Zhang }
264882d44351SHong Zhang 
2649d71ae5a4SJacob Faibussowitsch PetscErrorCode MatILUFactor_SeqAIJ(Mat inA, IS row, IS col, const MatFactorInfo *info)
2650d71ae5a4SJacob Faibussowitsch {
265163b91edcSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)inA->data;
265263b91edcSBarry Smith   Mat         outA;
2653ace3abfcSBarry Smith   PetscBool   row_identity, col_identity;
265463b91edcSBarry Smith 
26553a40ed3dSBarry Smith   PetscFunctionBegin;
265608401ef6SPierre Jolivet   PetscCheck(info->levels == 0, PETSC_COMM_SELF, PETSC_ERR_SUP, "Only levels=0 supported for in-place ilu");
26571df811f5SHong Zhang 
26589566063dSJacob Faibussowitsch   PetscCall(ISIdentity(row, &row_identity));
26599566063dSJacob Faibussowitsch   PetscCall(ISIdentity(col, &col_identity));
2660a871dcd8SBarry Smith 
266163b91edcSBarry Smith   outA             = inA;
2662d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
26639566063dSJacob Faibussowitsch   PetscCall(PetscFree(inA->solvertype));
26649566063dSJacob Faibussowitsch   PetscCall(PetscStrallocpy(MATSOLVERPETSC, &inA->solvertype));
26652205254eSKarl Rupp 
26669566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)row));
26679566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->row));
26682205254eSKarl Rupp 
2669c3122656SLisandro Dalcin   a->row = row;
26702205254eSKarl Rupp 
26719566063dSJacob Faibussowitsch   PetscCall(PetscObjectReference((PetscObject)col));
26729566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->col));
26732205254eSKarl Rupp 
2674c3122656SLisandro Dalcin   a->col = col;
267563b91edcSBarry Smith 
267636db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26779566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&a->icol));
26789566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(col, PETSC_DECIDE, &a->icol));
2679f0ec6fceSSatish Balay 
268094a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
26819566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(inA->rmap->n + 1, &a->solve_work));
268294a9d846SBarry Smith   }
268363b91edcSBarry Smith 
26849566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(inA));
2685137fb511SHong Zhang   if (row_identity && col_identity) {
26869566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_inplace(outA, inA, info));
2687137fb511SHong Zhang   } else {
26889566063dSJacob Faibussowitsch     PetscCall(MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA, inA, info));
2689137fb511SHong Zhang   }
26903a40ed3dSBarry Smith   PetscFunctionReturn(0);
2691a871dcd8SBarry Smith }
2692a871dcd8SBarry Smith 
2693d71ae5a4SJacob Faibussowitsch PetscErrorCode MatScale_SeqAIJ(Mat inA, PetscScalar alpha)
2694d71ae5a4SJacob Faibussowitsch {
2695f0b747eeSBarry Smith   Mat_SeqAIJ  *a = (Mat_SeqAIJ *)inA->data;
2696dfa0f9e5SStefano Zampini   PetscScalar *v;
2697c5df96a5SBarry Smith   PetscBLASInt one = 1, bnz;
26983a40ed3dSBarry Smith 
26993a40ed3dSBarry Smith   PetscFunctionBegin;
27009566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(inA, &v));
27019566063dSJacob Faibussowitsch   PetscCall(PetscBLASIntCast(a->nz, &bnz));
2702792fecdfSBarry Smith   PetscCallBLAS("BLASscal", BLASscal_(&bnz, &alpha, v, &one));
27039566063dSJacob Faibussowitsch   PetscCall(PetscLogFlops(a->nz));
27049566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(inA, &v));
27059566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(inA));
27063a40ed3dSBarry Smith   PetscFunctionReturn(0);
2707f0b747eeSBarry Smith }
2708f0b747eeSBarry Smith 
2709d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
2710d71ae5a4SJacob Faibussowitsch {
271116b64355SHong Zhang   PetscInt i;
271216b64355SHong Zhang 
271316b64355SHong Zhang   PetscFunctionBegin;
271416b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
27159566063dSJacob Faibussowitsch     PetscCall(PetscFree4(submatj->sbuf1, submatj->ptr, submatj->tmp, submatj->ctr));
271616b64355SHong Zhang 
271748a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqr; ++i) PetscCall(PetscFree(submatj->sbuf2[i]));
27189566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->sbuf2, submatj->req_size, submatj->req_source1));
271916b64355SHong Zhang 
272016b64355SHong Zhang     if (submatj->rbuf1) {
27219566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1[0]));
27229566063dSJacob Faibussowitsch       PetscCall(PetscFree(submatj->rbuf1));
272316b64355SHong Zhang     }
272416b64355SHong Zhang 
272548a46eb9SPierre Jolivet     for (i = 0; i < submatj->nrqs; ++i) PetscCall(PetscFree(submatj->rbuf3[i]));
27269566063dSJacob Faibussowitsch     PetscCall(PetscFree3(submatj->req_source2, submatj->rbuf2, submatj->rbuf3));
27279566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->pa));
272816b64355SHong Zhang   }
272916b64355SHong Zhang 
273016b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
27319566063dSJacob Faibussowitsch   PetscCall(PetscTableDestroy((PetscTable *)&submatj->rmap));
27329566063dSJacob Faibussowitsch   if (submatj->cmap_loc) PetscCall(PetscFree(submatj->cmap_loc));
27339566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap_loc));
273416b64355SHong Zhang #else
27359566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->rmap));
273616b64355SHong Zhang #endif
273716b64355SHong Zhang 
273816b64355SHong Zhang   if (!submatj->allcolumns) {
273916b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
27409566063dSJacob Faibussowitsch     PetscCall(PetscTableDestroy((PetscTable *)&submatj->cmap));
274116b64355SHong Zhang #else
27429566063dSJacob Faibussowitsch     PetscCall(PetscFree(submatj->cmap));
274316b64355SHong Zhang #endif
274416b64355SHong Zhang   }
27459566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj->row2proc));
274616b64355SHong Zhang 
27479566063dSJacob Faibussowitsch   PetscCall(PetscFree(submatj));
274816b64355SHong Zhang   PetscFunctionReturn(0);
274916b64355SHong Zhang }
275016b64355SHong Zhang 
2751d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
2752d71ae5a4SJacob Faibussowitsch {
275316b64355SHong Zhang   Mat_SeqAIJ  *c       = (Mat_SeqAIJ *)C->data;
27545c39f6d9SHong Zhang   Mat_SubSppt *submatj = c->submatis1;
275516b64355SHong Zhang 
275616b64355SHong Zhang   PetscFunctionBegin;
27579566063dSJacob Faibussowitsch   PetscCall((*submatj->destroy)(C));
27589566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrix_Private(submatj));
275916b64355SHong Zhang   PetscFunctionReturn(0);
276016b64355SHong Zhang }
276116b64355SHong Zhang 
276289a1a59bSHong Zhang /* Note this has code duplication with MatDestroySubMatrices_SeqBAIJ() */
2763d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n, Mat *mat[])
2764d71ae5a4SJacob Faibussowitsch {
27652d033e1fSHong Zhang   PetscInt     i;
27660fb991dcSHong Zhang   Mat          C;
27670fb991dcSHong Zhang   Mat_SeqAIJ  *c;
27680fb991dcSHong Zhang   Mat_SubSppt *submatj;
27692d033e1fSHong Zhang 
27702d033e1fSHong Zhang   PetscFunctionBegin;
27712d033e1fSHong Zhang   for (i = 0; i < n; i++) {
27720fb991dcSHong Zhang     C       = (*mat)[i];
27730fb991dcSHong Zhang     c       = (Mat_SeqAIJ *)C->data;
27740fb991dcSHong Zhang     submatj = c->submatis1;
27752d033e1fSHong Zhang     if (submatj) {
2776682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
277726cc229bSBarry Smith         PetscCall(PetscFree(C->factorprefix));
27789566063dSJacob Faibussowitsch         PetscCall((*submatj->destroy)(C));
27799566063dSJacob Faibussowitsch         PetscCall(MatDestroySubMatrix_Private(submatj));
27809566063dSJacob Faibussowitsch         PetscCall(PetscFree(C->defaultvectype));
27813faff063SStefano Zampini         PetscCall(PetscFree(C->defaultrandtype));
27829566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->rmap));
27839566063dSJacob Faibussowitsch         PetscCall(PetscLayoutDestroy(&C->cmap));
27849566063dSJacob Faibussowitsch         PetscCall(PetscHeaderDestroy(&C));
2785682e4c99SStefano Zampini       }
27862d033e1fSHong Zhang     } else {
27879566063dSJacob Faibussowitsch       PetscCall(MatDestroy(&C));
27882d033e1fSHong Zhang     }
27892d033e1fSHong Zhang   }
279086e85357SHong Zhang 
279163a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
27929566063dSJacob Faibussowitsch   PetscCall(MatDestroySubMatrices_Dummy(n, mat));
279363a75b2aSHong Zhang 
27949566063dSJacob Faibussowitsch   PetscCall(PetscFree(*mat));
27952d033e1fSHong Zhang   PetscFunctionReturn(0);
27962d033e1fSHong Zhang }
27972d033e1fSHong Zhang 
2798d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A, PetscInt n, const IS irow[], const IS icol[], MatReuse scall, Mat *B[])
2799d71ae5a4SJacob Faibussowitsch {
280097f1f81fSBarry Smith   PetscInt i;
2801cddf8d76SBarry Smith 
28023a40ed3dSBarry Smith   PetscFunctionBegin;
280348a46eb9SPierre Jolivet   if (scall == MAT_INITIAL_MATRIX) PetscCall(PetscCalloc1(n + 1, B));
2804cddf8d76SBarry Smith 
280548a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(MatCreateSubMatrix_SeqAIJ(A, irow[i], icol[i], PETSC_DECIDE, scall, &(*B)[i]));
28063a40ed3dSBarry Smith   PetscFunctionReturn(0);
2807cddf8d76SBarry Smith }
2808cddf8d76SBarry Smith 
2809d71ae5a4SJacob Faibussowitsch PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A, PetscInt is_max, IS is[], PetscInt ov)
2810d71ae5a4SJacob Faibussowitsch {
2811e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28125d0c19d7SBarry Smith   PetscInt        row, i, j, k, l, m, n, *nidx, isz, val;
28135d0c19d7SBarry Smith   const PetscInt *idx;
281497f1f81fSBarry Smith   PetscInt        start, end, *ai, *aj;
2815f1af5d2fSBarry Smith   PetscBT         table;
2816bbd702dbSSatish Balay 
28173a40ed3dSBarry Smith   PetscFunctionBegin;
2818d0f46423SBarry Smith   m  = A->rmap->n;
2819e4d965acSSatish Balay   ai = a->i;
2820bfeeae90SHong Zhang   aj = a->j;
28218a047759SSatish Balay 
282208401ef6SPierre Jolivet   PetscCheck(ov >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "illegal negative overlap value used");
282306763907SSatish Balay 
28249566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nidx));
28259566063dSJacob Faibussowitsch   PetscCall(PetscBTCreate(m, &table));
282606763907SSatish Balay 
2827e4d965acSSatish Balay   for (i = 0; i < is_max; i++) {
2828b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2829e4d965acSSatish Balay     isz = 0;
28309566063dSJacob Faibussowitsch     PetscCall(PetscBTMemzero(m, table));
2831e4d965acSSatish Balay 
2832e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28339566063dSJacob Faibussowitsch     PetscCall(ISGetIndices(is[i], &idx));
28349566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(is[i], &n));
2835e4d965acSSatish Balay 
2836dd097bc3SLois Curfman McInnes     /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2837e4d965acSSatish Balay     for (j = 0; j < n; ++j) {
28382205254eSKarl Rupp       if (!PetscBTLookupSet(table, idx[j])) nidx[isz++] = idx[j];
28394dcbc457SBarry Smith     }
28409566063dSJacob Faibussowitsch     PetscCall(ISRestoreIndices(is[i], &idx));
28419566063dSJacob Faibussowitsch     PetscCall(ISDestroy(&is[i]));
2842e4d965acSSatish Balay 
284304a348a9SBarry Smith     k = 0;
284404a348a9SBarry Smith     for (j = 0; j < ov; j++) { /* for each overlap */
284504a348a9SBarry Smith       n = isz;
284606763907SSatish Balay       for (; k < n; k++) { /* do only those rows in nidx[k], which are not done yet */
2847e4d965acSSatish Balay         row   = nidx[k];
2848e4d965acSSatish Balay         start = ai[row];
2849e4d965acSSatish Balay         end   = ai[row + 1];
285004a348a9SBarry Smith         for (l = start; l < end; l++) {
2851efb16452SHong Zhang           val = aj[l];
28522205254eSKarl Rupp           if (!PetscBTLookupSet(table, val)) nidx[isz++] = val;
2853e4d965acSSatish Balay         }
2854e4d965acSSatish Balay       }
2855e4d965acSSatish Balay     }
28569566063dSJacob Faibussowitsch     PetscCall(ISCreateGeneral(PETSC_COMM_SELF, isz, nidx, PETSC_COPY_VALUES, (is + i)));
2857e4d965acSSatish Balay   }
28589566063dSJacob Faibussowitsch   PetscCall(PetscBTDestroy(&table));
28599566063dSJacob Faibussowitsch   PetscCall(PetscFree(nidx));
28603a40ed3dSBarry Smith   PetscFunctionReturn(0);
28614dcbc457SBarry Smith }
286217ab2063SBarry Smith 
28630513a670SBarry Smith /* -------------------------------------------------------------- */
2864d71ae5a4SJacob Faibussowitsch PetscErrorCode MatPermute_SeqAIJ(Mat A, IS rowp, IS colp, Mat *B)
2865d71ae5a4SJacob Faibussowitsch {
28660513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
28673b98c0a2SBarry Smith   PetscInt        i, nz = 0, m = A->rmap->n, n = A->cmap->n;
28685d0c19d7SBarry Smith   const PetscInt *row, *col;
28695d0c19d7SBarry Smith   PetscInt       *cnew, j, *lens;
287056cd22aeSBarry Smith   IS              icolp, irowp;
28710298fd71SBarry Smith   PetscInt       *cwork = NULL;
28720298fd71SBarry Smith   PetscScalar    *vwork = NULL;
28730513a670SBarry Smith 
28743a40ed3dSBarry Smith   PetscFunctionBegin;
28759566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(rowp, PETSC_DECIDE, &irowp));
28769566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(irowp, &row));
28779566063dSJacob Faibussowitsch   PetscCall(ISInvertPermutation(colp, PETSC_DECIDE, &icolp));
28789566063dSJacob Faibussowitsch   PetscCall(ISGetIndices(icolp, &col));
28790513a670SBarry Smith 
28800513a670SBarry Smith   /* determine lengths of permuted rows */
28819566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &lens));
28822205254eSKarl Rupp   for (i = 0; i < m; i++) lens[row[i]] = a->i[i + 1] - a->i[i];
28839566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
28849566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, m, n, m, n));
28859566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(*B, A, A));
28869566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
28879566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*B, 0, lens));
28889566063dSJacob Faibussowitsch   PetscCall(PetscFree(lens));
28890513a670SBarry Smith 
28909566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &cnew));
28910513a670SBarry Smith   for (i = 0; i < m; i++) {
28929566063dSJacob Faibussowitsch     PetscCall(MatGetRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
28932205254eSKarl Rupp     for (j = 0; j < nz; j++) cnew[j] = col[cwork[j]];
28949566063dSJacob Faibussowitsch     PetscCall(MatSetValues_SeqAIJ(*B, 1, &row[i], nz, cnew, vwork, INSERT_VALUES));
28959566063dSJacob Faibussowitsch     PetscCall(MatRestoreRow_SeqAIJ(A, i, &nz, &cwork, &vwork));
28960513a670SBarry Smith   }
28979566063dSJacob Faibussowitsch   PetscCall(PetscFree(cnew));
28982205254eSKarl Rupp 
28993c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
29002205254eSKarl Rupp 
29018c3ff71bSJunchao Zhang #if defined(PETSC_HAVE_DEVICE)
29029566063dSJacob Faibussowitsch   PetscCall(MatBindToCPU(*B, A->boundtocpu));
29039fe5e383SStefano Zampini #endif
29049566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*B, MAT_FINAL_ASSEMBLY));
29059566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*B, MAT_FINAL_ASSEMBLY));
29069566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(irowp, &row));
29079566063dSJacob Faibussowitsch   PetscCall(ISRestoreIndices(icolp, &col));
29089566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&irowp));
29099566063dSJacob Faibussowitsch   PetscCall(ISDestroy(&icolp));
291048a46eb9SPierre Jolivet   if (rowp == colp) PetscCall(MatPropagateSymmetryOptions(A, *B));
29113a40ed3dSBarry Smith   PetscFunctionReturn(0);
29120513a670SBarry Smith }
29130513a670SBarry Smith 
2914d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCopy_SeqAIJ(Mat A, Mat B, MatStructure str)
2915d71ae5a4SJacob Faibussowitsch {
2916cb5b572fSBarry Smith   PetscFunctionBegin;
291733f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
291833f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2919be6bf707SBarry Smith     Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
2920be6bf707SBarry Smith     Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
29212e5835c6SStefano Zampini     const PetscScalar *aa;
2922be6bf707SBarry Smith 
29239566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(A, &aa));
292408401ef6SPierre Jolivet     PetscCheck(a->i[A->rmap->n] == b->i[B->rmap->n], PETSC_COMM_SELF, PETSC_ERR_ARG_INCOMP, "Number of nonzeros in two matrices are different %" PetscInt_FMT " != %" PetscInt_FMT, a->i[A->rmap->n], b->i[B->rmap->n]);
29259566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->a, aa, a->i[A->rmap->n]));
29269566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)B));
29279566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
2928cb5b572fSBarry Smith   } else {
29299566063dSJacob Faibussowitsch     PetscCall(MatCopy_Basic(A, B, str));
2930cb5b572fSBarry Smith   }
2931cb5b572fSBarry Smith   PetscFunctionReturn(0);
2932cb5b572fSBarry Smith }
2933cb5b572fSBarry Smith 
2934d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetUp_SeqAIJ(Mat A)
2935d71ae5a4SJacob Faibussowitsch {
2936273d9f13SBarry Smith   PetscFunctionBegin;
29379566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(A, PETSC_DEFAULT, NULL));
2938273d9f13SBarry Smith   PetscFunctionReturn(0);
2939273d9f13SBarry Smith }
2940273d9f13SBarry Smith 
2941d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A, PetscScalar *array[])
2942d71ae5a4SJacob Faibussowitsch {
29436c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
29446e111a19SKarl Rupp 
29456c0721eeSBarry Smith   PetscFunctionBegin;
29466c0721eeSBarry Smith   *array = a->a;
29476c0721eeSBarry Smith   PetscFunctionReturn(0);
29486c0721eeSBarry Smith }
29496c0721eeSBarry Smith 
2950d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A, PetscScalar *array[])
2951d71ae5a4SJacob Faibussowitsch {
29526c0721eeSBarry Smith   PetscFunctionBegin;
2953f38c1e66SStefano Zampini   *array = NULL;
29546c0721eeSBarry Smith   PetscFunctionReturn(0);
29556c0721eeSBarry Smith }
2956273d9f13SBarry Smith 
29578229c054SShri Abhyankar /*
29588229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29598229c054SShri Abhyankar    have different nonzero structure.
29608229c054SShri Abhyankar */
2961d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m, const PetscInt *xi, const PetscInt *xj, const PetscInt *yi, const PetscInt *yj, PetscInt *nnz)
2962d71ae5a4SJacob Faibussowitsch {
2963b264fe52SHong Zhang   PetscInt i, j, k, nzx, nzy;
2964ec7775f6SShri Abhyankar 
2965ec7775f6SShri Abhyankar   PetscFunctionBegin;
2966ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2967ec7775f6SShri Abhyankar   for (i = 0; i < m; i++) {
2968b264fe52SHong Zhang     const PetscInt *xjj = xj + xi[i], *yjj = yj + yi[i];
2969b264fe52SHong Zhang     nzx    = xi[i + 1] - xi[i];
2970b264fe52SHong Zhang     nzy    = yi[i + 1] - yi[i];
29718af7cee1SJed Brown     nnz[i] = 0;
29728af7cee1SJed Brown     for (j = 0, k = 0; j < nzx; j++) {                  /* Point in X */
2973b264fe52SHong Zhang       for (; k < nzy && yjj[k] < xjj[j]; k++) nnz[i]++; /* Catch up to X */
2974b264fe52SHong Zhang       if (k < nzy && yjj[k] == xjj[j]) k++;             /* Skip duplicate */
29758af7cee1SJed Brown       nnz[i]++;
29768af7cee1SJed Brown     }
29778af7cee1SJed Brown     for (; k < nzy; k++) nnz[i]++;
2978ec7775f6SShri Abhyankar   }
2979ec7775f6SShri Abhyankar   PetscFunctionReturn(0);
2980ec7775f6SShri Abhyankar }
2981ec7775f6SShri Abhyankar 
2982d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y, Mat X, PetscInt *nnz)
2983d71ae5a4SJacob Faibussowitsch {
2984b264fe52SHong Zhang   PetscInt    m = Y->rmap->N;
2985b264fe52SHong Zhang   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data;
2986b264fe52SHong Zhang   Mat_SeqAIJ *y = (Mat_SeqAIJ *)Y->data;
2987b264fe52SHong Zhang 
2988b264fe52SHong Zhang   PetscFunctionBegin;
2989b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
29909566063dSJacob Faibussowitsch   PetscCall(MatAXPYGetPreallocation_SeqX_private(m, x->i, x->j, y->i, y->j, nnz));
2991b264fe52SHong Zhang   PetscFunctionReturn(0);
2992b264fe52SHong Zhang }
2993b264fe52SHong Zhang 
2994d71ae5a4SJacob Faibussowitsch PetscErrorCode MatAXPY_SeqAIJ(Mat Y, PetscScalar a, Mat X, MatStructure str)
2995d71ae5a4SJacob Faibussowitsch {
2996ac90fabeSBarry Smith   Mat_SeqAIJ *x = (Mat_SeqAIJ *)X->data, *y = (Mat_SeqAIJ *)Y->data;
2997ac90fabeSBarry Smith 
2998ac90fabeSBarry Smith   PetscFunctionBegin;
2999134adf20SPierre Jolivet   if (str == UNKNOWN_NONZERO_PATTERN || (PetscDefined(USE_DEBUG) && str == SAME_NONZERO_PATTERN)) {
3000134adf20SPierre Jolivet     PetscBool e = x->nz == y->nz ? PETSC_TRUE : PETSC_FALSE;
3001134adf20SPierre Jolivet     if (e) {
30029566063dSJacob Faibussowitsch       PetscCall(PetscArraycmp(x->i, y->i, Y->rmap->n + 1, &e));
300381fa06acSBarry Smith       if (e) {
30049566063dSJacob Faibussowitsch         PetscCall(PetscArraycmp(x->j, y->j, y->nz, &e));
3005134adf20SPierre Jolivet         if (e) str = SAME_NONZERO_PATTERN;
300681fa06acSBarry Smith       }
300781fa06acSBarry Smith     }
300854c59aa7SJacob Faibussowitsch     if (!e) PetscCheck(str != SAME_NONZERO_PATTERN, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONG, "MatStructure is not SAME_NONZERO_PATTERN");
300981fa06acSBarry Smith   }
3010ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
30112e5835c6SStefano Zampini     const PetscScalar *xa;
30122e5835c6SStefano Zampini     PetscScalar       *ya, alpha = a;
301381fa06acSBarry Smith     PetscBLASInt       one = 1, bnz;
301481fa06acSBarry Smith 
30159566063dSJacob Faibussowitsch     PetscCall(PetscBLASIntCast(x->nz, &bnz));
30169566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArray(Y, &ya));
30179566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayRead(X, &xa));
3018792fecdfSBarry Smith     PetscCallBLAS("BLASaxpy", BLASaxpy_(&bnz, &alpha, xa, &one, ya, &one));
30199566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayRead(X, &xa));
30209566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArray(Y, &ya));
30219566063dSJacob Faibussowitsch     PetscCall(PetscLogFlops(2.0 * bnz));
30229566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJInvalidateDiagonal(Y));
30239566063dSJacob Faibussowitsch     PetscCall(PetscObjectStateIncrease((PetscObject)Y));
3024ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
30259566063dSJacob Faibussowitsch     PetscCall(MatAXPY_Basic(Y, a, X, str));
3026ac90fabeSBarry Smith   } else {
30278229c054SShri Abhyankar     Mat       B;
30288229c054SShri Abhyankar     PetscInt *nnz;
30299566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(Y->rmap->N, &nnz));
30309566063dSJacob Faibussowitsch     PetscCall(MatCreate(PetscObjectComm((PetscObject)Y), &B));
30319566063dSJacob Faibussowitsch     PetscCall(PetscObjectSetName((PetscObject)B, ((PetscObject)Y)->name));
30329566063dSJacob Faibussowitsch     PetscCall(MatSetLayouts(B, Y->rmap, Y->cmap));
30339566063dSJacob Faibussowitsch     PetscCall(MatSetType(B, ((PetscObject)Y)->type_name));
30349566063dSJacob Faibussowitsch     PetscCall(MatAXPYGetPreallocation_SeqAIJ(Y, X, nnz));
30359566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
30369566063dSJacob Faibussowitsch     PetscCall(MatAXPY_BasicWithPreallocation(B, Y, a, X, str));
30379566063dSJacob Faibussowitsch     PetscCall(MatHeaderMerge(Y, &B));
30389bb234a9SBarry Smith     PetscCall(MatSeqAIJCheckInode(Y));
30399566063dSJacob Faibussowitsch     PetscCall(PetscFree(nnz));
3040ac90fabeSBarry Smith   }
3041ac90fabeSBarry Smith   PetscFunctionReturn(0);
3042ac90fabeSBarry Smith }
3043ac90fabeSBarry Smith 
3044d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode MatConjugate_SeqAIJ(Mat mat)
3045d71ae5a4SJacob Faibussowitsch {
3046354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3047354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ *)mat->data;
3048354c94deSBarry Smith   PetscInt     i, nz;
3049354c94deSBarry Smith   PetscScalar *a;
3050354c94deSBarry Smith 
3051354c94deSBarry Smith   PetscFunctionBegin;
3052354c94deSBarry Smith   nz = aij->nz;
30539566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(mat, &a));
30542205254eSKarl Rupp   for (i = 0; i < nz; i++) a[i] = PetscConj(a[i]);
30559566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(mat, &a));
3056354c94deSBarry Smith #else
3057354c94deSBarry Smith   PetscFunctionBegin;
3058354c94deSBarry Smith #endif
3059354c94deSBarry Smith   PetscFunctionReturn(0);
3060354c94deSBarry Smith }
3061354c94deSBarry Smith 
3062d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3063d71ae5a4SJacob Faibussowitsch {
3064e34fafa9SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3065d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3066e34fafa9SBarry Smith   PetscReal        atmp;
3067985db425SBarry Smith   PetscScalar     *x;
3068ce496241SStefano Zampini   const MatScalar *aa, *av;
3069e34fafa9SBarry Smith 
3070e34fafa9SBarry Smith   PetscFunctionBegin;
307128b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
30729566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3073ce496241SStefano Zampini   aa = av;
3074e34fafa9SBarry Smith   ai = a->i;
3075e34fafa9SBarry Smith   aj = a->j;
3076e34fafa9SBarry Smith 
30779566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
30789566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
30799566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
308008401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3081e34fafa9SBarry Smith   for (i = 0; i < m; i++) {
30829371c9d4SSatish Balay     ncols = ai[1] - ai[0];
30839371c9d4SSatish Balay     ai++;
3084e34fafa9SBarry Smith     for (j = 0; j < ncols; j++) {
3085985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
30869371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) < atmp) {
30879371c9d4SSatish Balay         x[i] = atmp;
30889371c9d4SSatish Balay         if (idx) idx[i] = *aj;
30899371c9d4SSatish Balay       }
30909371c9d4SSatish Balay       aa++;
30919371c9d4SSatish Balay       aj++;
3092985db425SBarry Smith     }
3093985db425SBarry Smith   }
30949566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
30959566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3096985db425SBarry Smith   PetscFunctionReturn(0);
3097985db425SBarry Smith }
3098985db425SBarry Smith 
3099d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMax_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3100d71ae5a4SJacob Faibussowitsch {
3101985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3102d0f46423SBarry Smith   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3103985db425SBarry Smith   PetscScalar     *x;
3104ce496241SStefano Zampini   const MatScalar *aa, *av;
3105985db425SBarry Smith 
3106985db425SBarry Smith   PetscFunctionBegin;
310728b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
31089566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3109ce496241SStefano Zampini   aa = av;
3110985db425SBarry Smith   ai = a->i;
3111985db425SBarry Smith   aj = a->j;
3112985db425SBarry Smith 
31139566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31149566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31159566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
311608401ef6SPierre Jolivet   PetscCheck(n == A->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3117985db425SBarry Smith   for (i = 0; i < m; i++) {
31189371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31199371c9d4SSatish Balay     ai++;
3120d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
31219371c9d4SSatish Balay       x[i] = *aa;
31229371c9d4SSatish Balay       if (idx) idx[i] = 0;
3123985db425SBarry Smith     } else { /* row is sparse so already KNOW maximum is 0.0 or higher */
3124985db425SBarry Smith       x[i] = 0.0;
3125985db425SBarry Smith       if (idx) {
3126985db425SBarry Smith         for (j = 0; j < ncols; j++) { /* find first implicit 0.0 in the row */
3127985db425SBarry Smith           if (aj[j] > j) {
3128985db425SBarry Smith             idx[i] = j;
3129985db425SBarry Smith             break;
3130985db425SBarry Smith           }
3131985db425SBarry Smith         }
31321a254869SHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
31331a254869SHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3134985db425SBarry Smith       }
3135985db425SBarry Smith     }
3136985db425SBarry Smith     for (j = 0; j < ncols; j++) {
31379371c9d4SSatish Balay       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {
31389371c9d4SSatish Balay         x[i] = *aa;
31399371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31409371c9d4SSatish Balay       }
31419371c9d4SSatish Balay       aa++;
31429371c9d4SSatish Balay       aj++;
3143985db425SBarry Smith     }
3144985db425SBarry Smith   }
31459566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31469566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3147985db425SBarry Smith   PetscFunctionReturn(0);
3148985db425SBarry Smith }
3149985db425SBarry Smith 
3150d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3151d71ae5a4SJacob Faibussowitsch {
3152c87e5d42SMatthew Knepley   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3153c87e5d42SMatthew Knepley   PetscInt         i, j, m = A->rmap->n, *ai, *aj, ncols, n;
3154ce496241SStefano Zampini   PetscScalar     *x;
3155ce496241SStefano Zampini   const MatScalar *aa, *av;
3156c87e5d42SMatthew Knepley 
3157c87e5d42SMatthew Knepley   PetscFunctionBegin;
31589566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3159ce496241SStefano Zampini   aa = av;
3160c87e5d42SMatthew Knepley   ai = a->i;
3161c87e5d42SMatthew Knepley   aj = a->j;
3162c87e5d42SMatthew Knepley 
31639566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
31649566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
31659566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
316608401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector, %" PetscInt_FMT " vs. %" PetscInt_FMT " rows", m, n);
3167c87e5d42SMatthew Knepley   for (i = 0; i < m; i++) {
31689371c9d4SSatish Balay     ncols = ai[1] - ai[0];
31699371c9d4SSatish Balay     ai++;
3170f07e67edSHong Zhang     if (ncols == A->cmap->n) { /* row is dense */
31719371c9d4SSatish Balay       x[i] = *aa;
31729371c9d4SSatish Balay       if (idx) idx[i] = 0;
3173f07e67edSHong Zhang     } else { /* row is sparse so already KNOW minimum is 0.0 or higher */
3174f07e67edSHong Zhang       x[i] = 0.0;
3175f07e67edSHong Zhang       if (idx) { /* find first implicit 0.0 in the row */
3176289a08f5SMatthew Knepley         for (j = 0; j < ncols; j++) {
3177f07e67edSHong Zhang           if (aj[j] > j) {
3178f07e67edSHong Zhang             idx[i] = j;
31792205254eSKarl Rupp             break;
31802205254eSKarl Rupp           }
3181289a08f5SMatthew Knepley         }
3182f07e67edSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3183f07e67edSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3184f07e67edSHong Zhang       }
3185289a08f5SMatthew Knepley     }
3186c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
31879371c9d4SSatish Balay       if (PetscAbsScalar(x[i]) > PetscAbsScalar(*aa)) {
31889371c9d4SSatish Balay         x[i] = *aa;
31899371c9d4SSatish Balay         if (idx) idx[i] = *aj;
31909371c9d4SSatish Balay       }
31919371c9d4SSatish Balay       aa++;
31929371c9d4SSatish Balay       aj++;
3193c87e5d42SMatthew Knepley     }
3194c87e5d42SMatthew Knepley   }
31959566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
31969566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3197c87e5d42SMatthew Knepley   PetscFunctionReturn(0);
3198c87e5d42SMatthew Knepley }
3199c87e5d42SMatthew Knepley 
3200d71ae5a4SJacob Faibussowitsch PetscErrorCode MatGetRowMin_SeqAIJ(Mat A, Vec v, PetscInt idx[])
3201d71ae5a4SJacob Faibussowitsch {
3202985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ *)A->data;
3203d9ca1df4SBarry Smith   PetscInt         i, j, m = A->rmap->n, ncols, n;
3204d9ca1df4SBarry Smith   const PetscInt  *ai, *aj;
3205985db425SBarry Smith   PetscScalar     *x;
3206ce496241SStefano Zampini   const MatScalar *aa, *av;
3207985db425SBarry Smith 
3208985db425SBarry Smith   PetscFunctionBegin;
320928b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
32109566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &av));
3211ce496241SStefano Zampini   aa = av;
3212985db425SBarry Smith   ai = a->i;
3213985db425SBarry Smith   aj = a->j;
3214985db425SBarry Smith 
32159566063dSJacob Faibussowitsch   PetscCall(VecSet(v, 0.0));
32169566063dSJacob Faibussowitsch   PetscCall(VecGetArrayWrite(v, &x));
32179566063dSJacob Faibussowitsch   PetscCall(VecGetLocalSize(v, &n));
321808401ef6SPierre Jolivet   PetscCheck(n == m, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "Nonconforming matrix and vector");
3219985db425SBarry Smith   for (i = 0; i < m; i++) {
32209371c9d4SSatish Balay     ncols = ai[1] - ai[0];
32219371c9d4SSatish Balay     ai++;
3222d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
32239371c9d4SSatish Balay       x[i] = *aa;
32249371c9d4SSatish Balay       if (idx) idx[i] = 0;
3225985db425SBarry Smith     } else { /* row is sparse so already KNOW minimum is 0.0 or lower */
3226985db425SBarry Smith       x[i] = 0.0;
3227985db425SBarry Smith       if (idx) { /* find first implicit 0.0 in the row */
3228985db425SBarry Smith         for (j = 0; j < ncols; j++) {
3229985db425SBarry Smith           if (aj[j] > j) {
3230985db425SBarry Smith             idx[i] = j;
3231985db425SBarry Smith             break;
3232985db425SBarry Smith           }
3233985db425SBarry Smith         }
3234fa213d2fSHong Zhang         /* in case first implicit 0.0 in the row occurs at ncols-th column */
3235fa213d2fSHong Zhang         if (j == ncols && j < A->cmap->n) idx[i] = j;
3236985db425SBarry Smith       }
3237985db425SBarry Smith     }
3238985db425SBarry Smith     for (j = 0; j < ncols; j++) {
32399371c9d4SSatish Balay       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {
32409371c9d4SSatish Balay         x[i] = *aa;
32419371c9d4SSatish Balay         if (idx) idx[i] = *aj;
32429371c9d4SSatish Balay       }
32439371c9d4SSatish Balay       aa++;
32449371c9d4SSatish Balay       aj++;
3245e34fafa9SBarry Smith     }
3246e34fafa9SBarry Smith   }
32479566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayWrite(v, &x));
32489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &av));
3249e34fafa9SBarry Smith   PetscFunctionReturn(0);
3250e34fafa9SBarry Smith }
3251bbead8a2SBarry Smith 
3252d71ae5a4SJacob Faibussowitsch PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A, const PetscScalar **values)
3253d71ae5a4SJacob Faibussowitsch {
3254bbead8a2SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ *)A->data;
325533d57670SJed Brown   PetscInt        i, bs = PetscAbs(A->rmap->bs), mbs = A->rmap->n / bs, ipvt[5], bs2 = bs * bs, *v_pivots, ij[7], *IJ, j;
3256bbead8a2SBarry Smith   MatScalar      *diag, work[25], *v_work;
32570da83c2eSBarry Smith   const PetscReal shift = 0.0;
32581a9391e3SHong Zhang   PetscBool       allowzeropivot, zeropivotdetected = PETSC_FALSE;
3259bbead8a2SBarry Smith 
3260bbead8a2SBarry Smith   PetscFunctionBegin;
3261a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
32624a0d0026SBarry Smith   if (a->ibdiagvalid) {
32634a0d0026SBarry Smith     if (values) *values = a->ibdiag;
32644a0d0026SBarry Smith     PetscFunctionReturn(0);
32654a0d0026SBarry Smith   }
32669566063dSJacob Faibussowitsch   PetscCall(MatMarkDiagonal_SeqAIJ(A));
32674dfa11a4SJacob Faibussowitsch   if (!a->ibdiag) { PetscCall(PetscMalloc1(bs2 * mbs, &a->ibdiag)); }
3268bbead8a2SBarry Smith   diag = a->ibdiag;
3269bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3270bbead8a2SBarry Smith   /* factor and invert each block */
3271bbead8a2SBarry Smith   switch (bs) {
3272bbead8a2SBarry Smith   case 1:
3273bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
32749566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 1, &i, 1, &i, diag + i));
3275ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3276ec1892c8SHong Zhang         if (allowzeropivot) {
32777b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
32787b6c816cSBarry Smith           A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
32797b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
32809566063dSJacob Faibussowitsch           PetscCall(PetscInfo(A, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g\n", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON));
328198921bdaSJacob Faibussowitsch         } else SETERRQ(PETSC_COMM_SELF, PETSC_ERR_MAT_LU_ZRPVT, "Zero pivot, row %" PetscInt_FMT " pivot %g tolerance %g", i, (double)PetscAbsScalar(diag[i]), (double)PETSC_MACHINE_EPSILON);
3282ec1892c8SHong Zhang       }
3283bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3284bbead8a2SBarry Smith     }
3285bbead8a2SBarry Smith     break;
3286bbead8a2SBarry Smith   case 2:
3287bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
32889371c9d4SSatish Balay       ij[0] = 2 * i;
32899371c9d4SSatish Balay       ij[1] = 2 * i + 1;
32909566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 2, ij, 2, ij, diag));
32919566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_2(diag, shift, allowzeropivot, &zeropivotdetected));
32927b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
32939566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_2(diag));
3294bbead8a2SBarry Smith       diag += 4;
3295bbead8a2SBarry Smith     }
3296bbead8a2SBarry Smith     break;
3297bbead8a2SBarry Smith   case 3:
3298bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
32999371c9d4SSatish Balay       ij[0] = 3 * i;
33009371c9d4SSatish Balay       ij[1] = 3 * i + 1;
33019371c9d4SSatish Balay       ij[2] = 3 * i + 2;
33029566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 3, ij, 3, ij, diag));
33039566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_3(diag, shift, allowzeropivot, &zeropivotdetected));
33047b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33059566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_3(diag));
3306bbead8a2SBarry Smith       diag += 9;
3307bbead8a2SBarry Smith     }
3308bbead8a2SBarry Smith     break;
3309bbead8a2SBarry Smith   case 4:
3310bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33119371c9d4SSatish Balay       ij[0] = 4 * i;
33129371c9d4SSatish Balay       ij[1] = 4 * i + 1;
33139371c9d4SSatish Balay       ij[2] = 4 * i + 2;
33149371c9d4SSatish Balay       ij[3] = 4 * i + 3;
33159566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 4, ij, 4, ij, diag));
33169566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_4(diag, shift, allowzeropivot, &zeropivotdetected));
33177b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33189566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_4(diag));
3319bbead8a2SBarry Smith       diag += 16;
3320bbead8a2SBarry Smith     }
3321bbead8a2SBarry Smith     break;
3322bbead8a2SBarry Smith   case 5:
3323bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33249371c9d4SSatish Balay       ij[0] = 5 * i;
33259371c9d4SSatish Balay       ij[1] = 5 * i + 1;
33269371c9d4SSatish Balay       ij[2] = 5 * i + 2;
33279371c9d4SSatish Balay       ij[3] = 5 * i + 3;
33289371c9d4SSatish Balay       ij[4] = 5 * i + 4;
33299566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 5, ij, 5, ij, diag));
33309566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_5(diag, ipvt, work, shift, allowzeropivot, &zeropivotdetected));
33317b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33329566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_5(diag));
3333bbead8a2SBarry Smith       diag += 25;
3334bbead8a2SBarry Smith     }
3335bbead8a2SBarry Smith     break;
3336bbead8a2SBarry Smith   case 6:
3337bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33389371c9d4SSatish Balay       ij[0] = 6 * i;
33399371c9d4SSatish Balay       ij[1] = 6 * i + 1;
33409371c9d4SSatish Balay       ij[2] = 6 * i + 2;
33419371c9d4SSatish Balay       ij[3] = 6 * i + 3;
33429371c9d4SSatish Balay       ij[4] = 6 * i + 4;
33439371c9d4SSatish Balay       ij[5] = 6 * i + 5;
33449566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 6, ij, 6, ij, diag));
33459566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_6(diag, shift, allowzeropivot, &zeropivotdetected));
33467b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33479566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_6(diag));
3348bbead8a2SBarry Smith       diag += 36;
3349bbead8a2SBarry Smith     }
3350bbead8a2SBarry Smith     break;
3351bbead8a2SBarry Smith   case 7:
3352bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
33539371c9d4SSatish Balay       ij[0] = 7 * i;
33549371c9d4SSatish Balay       ij[1] = 7 * i + 1;
33559371c9d4SSatish Balay       ij[2] = 7 * i + 2;
33569371c9d4SSatish Balay       ij[3] = 7 * i + 3;
33579371c9d4SSatish Balay       ij[4] = 7 * i + 4;
33589371c9d4SSatish Balay       ij[5] = 7 * i + 5;
33599371c9d4SSatish Balay       ij[5] = 7 * i + 6;
33609566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, 7, ij, 7, ij, diag));
33619566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A_7(diag, shift, allowzeropivot, &zeropivotdetected));
33627b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33639566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_7(diag));
3364bbead8a2SBarry Smith       diag += 49;
3365bbead8a2SBarry Smith     }
3366bbead8a2SBarry Smith     break;
3367bbead8a2SBarry Smith   default:
33689566063dSJacob Faibussowitsch     PetscCall(PetscMalloc3(bs, &v_work, bs, &v_pivots, bs, &IJ));
3369bbead8a2SBarry Smith     for (i = 0; i < mbs; i++) {
3370ad540459SPierre Jolivet       for (j = 0; j < bs; j++) IJ[j] = bs * i + j;
33719566063dSJacob Faibussowitsch       PetscCall(MatGetValues(A, bs, IJ, bs, IJ, diag));
33729566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_inverse_A(bs, diag, v_pivots, v_work, allowzeropivot, &zeropivotdetected));
33737b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
33749566063dSJacob Faibussowitsch       PetscCall(PetscKernel_A_gets_transpose_A_N(diag, bs));
3375bbead8a2SBarry Smith       diag += bs2;
3376bbead8a2SBarry Smith     }
33779566063dSJacob Faibussowitsch     PetscCall(PetscFree3(v_work, v_pivots, IJ));
3378bbead8a2SBarry Smith   }
3379bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
3380bbead8a2SBarry Smith   PetscFunctionReturn(0);
3381bbead8a2SBarry Smith }
3382bbead8a2SBarry Smith 
3383d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetRandom_SeqAIJ(Mat x, PetscRandom rctx)
3384d71ae5a4SJacob Faibussowitsch {
338573a71a0fSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3386fff043a9SJunchao Zhang   PetscScalar a, *aa;
338773a71a0fSBarry Smith   PetscInt    m, n, i, j, col;
338873a71a0fSBarry Smith 
338973a71a0fSBarry Smith   PetscFunctionBegin;
339073a71a0fSBarry Smith   if (!x->assembled) {
33919566063dSJacob Faibussowitsch     PetscCall(MatGetSize(x, &m, &n));
339273a71a0fSBarry Smith     for (i = 0; i < m; i++) {
339373a71a0fSBarry Smith       for (j = 0; j < aij->imax[i]; j++) {
33949566063dSJacob Faibussowitsch         PetscCall(PetscRandomGetValue(rctx, &a));
339573a71a0fSBarry Smith         col = (PetscInt)(n * PetscRealPart(a));
33969566063dSJacob Faibussowitsch         PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
339773a71a0fSBarry Smith       }
339873a71a0fSBarry Smith     }
3399e2ce353bSJunchao Zhang   } else {
34009566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJGetArrayWrite(x, &aa));
34019566063dSJacob Faibussowitsch     for (i = 0; i < aij->nz; i++) PetscCall(PetscRandomGetValue(rctx, aa + i));
34029566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJRestoreArrayWrite(x, &aa));
3403e2ce353bSJunchao Zhang   }
34049566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34059566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
340673a71a0fSBarry Smith   PetscFunctionReturn(0);
340773a71a0fSBarry Smith }
340873a71a0fSBarry Smith 
3409679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3410d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x, PetscInt low, PetscInt high, PetscRandom rctx)
3411d71ae5a4SJacob Faibussowitsch {
3412679944adSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)x->data;
3413679944adSJunchao Zhang   PetscScalar a;
3414679944adSJunchao Zhang   PetscInt    m, n, i, j, col, nskip;
3415679944adSJunchao Zhang 
3416679944adSJunchao Zhang   PetscFunctionBegin;
3417679944adSJunchao Zhang   nskip = high - low;
34189566063dSJacob Faibussowitsch   PetscCall(MatGetSize(x, &m, &n));
3419679944adSJunchao Zhang   n -= nskip; /* shrink number of columns where nonzeros can be set */
3420679944adSJunchao Zhang   for (i = 0; i < m; i++) {
3421679944adSJunchao Zhang     for (j = 0; j < aij->imax[i]; j++) {
34229566063dSJacob Faibussowitsch       PetscCall(PetscRandomGetValue(rctx, &a));
3423679944adSJunchao Zhang       col = (PetscInt)(n * PetscRealPart(a));
3424679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
34259566063dSJacob Faibussowitsch       PetscCall(MatSetValues(x, 1, &i, 1, &col, &a, ADD_VALUES));
3426679944adSJunchao Zhang     }
3427e2ce353bSJunchao Zhang   }
34289566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(x, MAT_FINAL_ASSEMBLY));
34299566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(x, MAT_FINAL_ASSEMBLY));
3430679944adSJunchao Zhang   PetscFunctionReturn(0);
3431679944adSJunchao Zhang }
3432679944adSJunchao Zhang 
3433682d7d0cSBarry Smith /* -------------------------------------------------------------------*/
34340a6ffc59SBarry Smith static struct _MatOps MatOps_Values = {MatSetValues_SeqAIJ,
3435cb5b572fSBarry Smith                                        MatGetRow_SeqAIJ,
3436cb5b572fSBarry Smith                                        MatRestoreRow_SeqAIJ,
3437cb5b572fSBarry Smith                                        MatMult_SeqAIJ,
343897304618SKris Buschelman                                        /*  4*/ MatMultAdd_SeqAIJ,
34397c922b88SBarry Smith                                        MatMultTranspose_SeqAIJ,
34407c922b88SBarry Smith                                        MatMultTransposeAdd_SeqAIJ,
3441f4259b30SLisandro Dalcin                                        NULL,
3442f4259b30SLisandro Dalcin                                        NULL,
3443f4259b30SLisandro Dalcin                                        NULL,
3444f4259b30SLisandro Dalcin                                        /* 10*/ NULL,
3445cb5b572fSBarry Smith                                        MatLUFactor_SeqAIJ,
3446f4259b30SLisandro Dalcin                                        NULL,
344741f059aeSBarry Smith                                        MatSOR_SeqAIJ,
344891e9d3e2SHong Zhang                                        MatTranspose_SeqAIJ,
344997304618SKris Buschelman                                        /*1 5*/ MatGetInfo_SeqAIJ,
3450cb5b572fSBarry Smith                                        MatEqual_SeqAIJ,
3451cb5b572fSBarry Smith                                        MatGetDiagonal_SeqAIJ,
3452cb5b572fSBarry Smith                                        MatDiagonalScale_SeqAIJ,
3453cb5b572fSBarry Smith                                        MatNorm_SeqAIJ,
3454f4259b30SLisandro Dalcin                                        /* 20*/ NULL,
3455cb5b572fSBarry Smith                                        MatAssemblyEnd_SeqAIJ,
3456cb5b572fSBarry Smith                                        MatSetOption_SeqAIJ,
3457cb5b572fSBarry Smith                                        MatZeroEntries_SeqAIJ,
3458d519adbfSMatthew Knepley                                        /* 24*/ MatZeroRows_SeqAIJ,
3459f4259b30SLisandro Dalcin                                        NULL,
3460f4259b30SLisandro Dalcin                                        NULL,
3461f4259b30SLisandro Dalcin                                        NULL,
3462f4259b30SLisandro Dalcin                                        NULL,
34634994cf47SJed Brown                                        /* 29*/ MatSetUp_SeqAIJ,
3464f4259b30SLisandro Dalcin                                        NULL,
3465f4259b30SLisandro Dalcin                                        NULL,
3466f4259b30SLisandro Dalcin                                        NULL,
3467f4259b30SLisandro Dalcin                                        NULL,
3468d519adbfSMatthew Knepley                                        /* 34*/ MatDuplicate_SeqAIJ,
3469f4259b30SLisandro Dalcin                                        NULL,
3470f4259b30SLisandro Dalcin                                        NULL,
3471cb5b572fSBarry Smith                                        MatILUFactor_SeqAIJ,
3472f4259b30SLisandro Dalcin                                        NULL,
3473d519adbfSMatthew Knepley                                        /* 39*/ MatAXPY_SeqAIJ,
34747dae84e0SHong Zhang                                        MatCreateSubMatrices_SeqAIJ,
3475cb5b572fSBarry Smith                                        MatIncreaseOverlap_SeqAIJ,
3476cb5b572fSBarry Smith                                        MatGetValues_SeqAIJ,
3477cb5b572fSBarry Smith                                        MatCopy_SeqAIJ,
3478d519adbfSMatthew Knepley                                        /* 44*/ MatGetRowMax_SeqAIJ,
3479cb5b572fSBarry Smith                                        MatScale_SeqAIJ,
34807d68702bSBarry Smith                                        MatShift_SeqAIJ,
348179299369SBarry Smith                                        MatDiagonalSet_SeqAIJ,
34826e169961SBarry Smith                                        MatZeroRowsColumns_SeqAIJ,
348373a71a0fSBarry Smith                                        /* 49*/ MatSetRandom_SeqAIJ,
34843b2fbd54SBarry Smith                                        MatGetRowIJ_SeqAIJ,
34853b2fbd54SBarry Smith                                        MatRestoreRowIJ_SeqAIJ,
34863b2fbd54SBarry Smith                                        MatGetColumnIJ_SeqAIJ,
3487a93ec695SBarry Smith                                        MatRestoreColumnIJ_SeqAIJ,
348893dfae19SHong Zhang                                        /* 54*/ MatFDColoringCreate_SeqXAIJ,
3489f4259b30SLisandro Dalcin                                        NULL,
3490f4259b30SLisandro Dalcin                                        NULL,
3491cda55fadSBarry Smith                                        MatPermute_SeqAIJ,
3492f4259b30SLisandro Dalcin                                        NULL,
3493f4259b30SLisandro Dalcin                                        /* 59*/ NULL,
3494b9b97703SBarry Smith                                        MatDestroy_SeqAIJ,
3495b9b97703SBarry Smith                                        MatView_SeqAIJ,
3496f4259b30SLisandro Dalcin                                        NULL,
3497f4259b30SLisandro Dalcin                                        NULL,
3498f4259b30SLisandro Dalcin                                        /* 64*/ NULL,
3499321b30b9SSatish Balay                                        MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3500f4259b30SLisandro Dalcin                                        NULL,
3501f4259b30SLisandro Dalcin                                        NULL,
3502f4259b30SLisandro Dalcin                                        NULL,
3503d519adbfSMatthew Knepley                                        /* 69*/ MatGetRowMaxAbs_SeqAIJ,
3504c87e5d42SMatthew Knepley                                        MatGetRowMinAbs_SeqAIJ,
3505f4259b30SLisandro Dalcin                                        NULL,
3506f4259b30SLisandro Dalcin                                        NULL,
3507f4259b30SLisandro Dalcin                                        NULL,
3508f4259b30SLisandro Dalcin                                        /* 74*/ NULL,
35093acb8795SBarry Smith                                        MatFDColoringApply_AIJ,
3510f4259b30SLisandro Dalcin                                        NULL,
3511f4259b30SLisandro Dalcin                                        NULL,
3512f4259b30SLisandro Dalcin                                        NULL,
35136ce1633cSBarry Smith                                        /* 79*/ MatFindZeroDiagonals_SeqAIJ,
3514f4259b30SLisandro Dalcin                                        NULL,
3515f4259b30SLisandro Dalcin                                        NULL,
3516f4259b30SLisandro Dalcin                                        NULL,
3517bc011b1eSHong Zhang                                        MatLoad_SeqAIJ,
3518d519adbfSMatthew Knepley                                        /* 84*/ MatIsSymmetric_SeqAIJ,
35191cbb95d3SBarry Smith                                        MatIsHermitian_SeqAIJ,
3520f4259b30SLisandro Dalcin                                        NULL,
3521f4259b30SLisandro Dalcin                                        NULL,
3522f4259b30SLisandro Dalcin                                        NULL,
3523f4259b30SLisandro Dalcin                                        /* 89*/ NULL,
3524f4259b30SLisandro Dalcin                                        NULL,
352526be0446SHong Zhang                                        MatMatMultNumeric_SeqAIJ_SeqAIJ,
3526f4259b30SLisandro Dalcin                                        NULL,
3527f4259b30SLisandro Dalcin                                        NULL,
35288fa4b5a6SHong Zhang                                        /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
3529f4259b30SLisandro Dalcin                                        NULL,
3530f4259b30SLisandro Dalcin                                        NULL,
35316fc122caSHong Zhang                                        MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
3532f4259b30SLisandro Dalcin                                        NULL,
35334222ddf1SHong Zhang                                        /* 99*/ MatProductSetFromOptions_SeqAIJ,
3534f4259b30SLisandro Dalcin                                        NULL,
3535f4259b30SLisandro Dalcin                                        NULL,
353687d4246cSBarry Smith                                        MatConjugate_SeqAIJ,
3537f4259b30SLisandro Dalcin                                        NULL,
3538d519adbfSMatthew Knepley                                        /*104*/ MatSetValuesRow_SeqAIJ,
353999cafbc1SBarry Smith                                        MatRealPart_SeqAIJ,
3540f5edf698SHong Zhang                                        MatImaginaryPart_SeqAIJ,
3541f4259b30SLisandro Dalcin                                        NULL,
3542f4259b30SLisandro Dalcin                                        NULL,
3543cbd44569SHong Zhang                                        /*109*/ MatMatSolve_SeqAIJ,
3544f4259b30SLisandro Dalcin                                        NULL,
35452af78befSBarry Smith                                        MatGetRowMin_SeqAIJ,
3546f4259b30SLisandro Dalcin                                        NULL,
3547599ef60dSHong Zhang                                        MatMissingDiagonal_SeqAIJ,
3548f4259b30SLisandro Dalcin                                        /*114*/ NULL,
3549f4259b30SLisandro Dalcin                                        NULL,
3550f4259b30SLisandro Dalcin                                        NULL,
3551f4259b30SLisandro Dalcin                                        NULL,
3552f4259b30SLisandro Dalcin                                        NULL,
3553f4259b30SLisandro Dalcin                                        /*119*/ NULL,
3554f4259b30SLisandro Dalcin                                        NULL,
3555f4259b30SLisandro Dalcin                                        NULL,
3556f4259b30SLisandro Dalcin                                        NULL,
3557b3a44c85SBarry Smith                                        MatGetMultiProcBlock_SeqAIJ,
35580716a85fSBarry Smith                                        /*124*/ MatFindNonzeroRows_SeqAIJ,
3559a873a8cdSSam Reynolds                                        MatGetColumnReductions_SeqAIJ,
356037868618SMatthew G Knepley                                        MatInvertBlockDiagonal_SeqAIJ,
35610da83c2eSBarry Smith                                        MatInvertVariableBlockDiagonal_SeqAIJ,
3562f4259b30SLisandro Dalcin                                        NULL,
3563f4259b30SLisandro Dalcin                                        /*129*/ NULL,
3564f4259b30SLisandro Dalcin                                        NULL,
3565f4259b30SLisandro Dalcin                                        NULL,
356675648e8dSHong Zhang                                        MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3567b9af6bddSHong Zhang                                        MatTransposeColoringCreate_SeqAIJ,
3568b9af6bddSHong Zhang                                        /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
35692b8ad9a3SHong Zhang                                        MatTransColoringApplyDenToSp_SeqAIJ,
3570f4259b30SLisandro Dalcin                                        NULL,
3571f4259b30SLisandro Dalcin                                        NULL,
35723964eb88SJed Brown                                        MatRARtNumeric_SeqAIJ_SeqAIJ,
3573f4259b30SLisandro Dalcin                                        /*139*/ NULL,
3574f4259b30SLisandro Dalcin                                        NULL,
3575f4259b30SLisandro Dalcin                                        NULL,
35763a062f41SBarry Smith                                        MatFDColoringSetUp_SeqXAIJ,
35779c8f2541SHong Zhang                                        MatFindOffBlockDiagonalEntries_SeqAIJ,
35784222ddf1SHong Zhang                                        MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
35794222ddf1SHong Zhang                                        /*145*/ MatDestroySubMatrices_SeqAIJ,
3580f4259b30SLisandro Dalcin                                        NULL,
358172833a62Smarkadams4                                        NULL,
358272833a62Smarkadams4                                        MatCreateGraph_Simple_AIJ,
35832d776b49SBarry Smith                                        NULL,
35849371c9d4SSatish Balay                                        /*150*/ MatTransposeSymbolic_SeqAIJ};
358517ab2063SBarry Smith 
3586d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat, PetscInt *indices)
3587d71ae5a4SJacob Faibussowitsch {
3588bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
358997f1f81fSBarry Smith   PetscInt    i, nz, n;
3590bef8e0ddSBarry Smith 
3591bef8e0ddSBarry Smith   PetscFunctionBegin;
3592bef8e0ddSBarry Smith   nz = aij->maxnz;
3593d0f46423SBarry Smith   n  = mat->rmap->n;
3594ad540459SPierre Jolivet   for (i = 0; i < nz; i++) aij->j[i] = indices[i];
3595bef8e0ddSBarry Smith   aij->nz = nz;
3596ad540459SPierre Jolivet   for (i = 0; i < n; i++) aij->ilen[i] = aij->imax[i];
3597bef8e0ddSBarry Smith   PetscFunctionReturn(0);
3598bef8e0ddSBarry Smith }
3599bef8e0ddSBarry Smith 
3600a3bb6f32SFande Kong /*
3601ddea5d60SJunchao Zhang  * Given a sparse matrix with global column indices, compact it by using a local column space.
3602ddea5d60SJunchao Zhang  * The result matrix helps saving memory in other algorithms, such as MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3603ddea5d60SJunchao Zhang  */
3604d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3605d71ae5a4SJacob Faibussowitsch {
3606a3bb6f32SFande Kong   Mat_SeqAIJ        *aij = (Mat_SeqAIJ *)mat->data;
3607a3bb6f32SFande Kong   PetscTable         gid1_lid1;
3608a3bb6f32SFande Kong   PetscTablePosition tpos;
360925b670f0SStefano Zampini   PetscInt           gid, lid, i, ec, nz = aij->nz;
361025b670f0SStefano Zampini   PetscInt          *garray, *jj = aij->j;
3611a3bb6f32SFande Kong 
3612a3bb6f32SFande Kong   PetscFunctionBegin;
3613a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
3614a3bb6f32SFande Kong   PetscValidPointer(mapping, 2);
3615a3bb6f32SFande Kong   /* use a table */
36169566063dSJacob Faibussowitsch   PetscCall(PetscTableCreate(mat->rmap->n, mat->cmap->N + 1, &gid1_lid1));
3617a3bb6f32SFande Kong   ec = 0;
361825b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
361925b670f0SStefano Zampini     PetscInt data, gid1 = jj[i] + 1;
36209566063dSJacob Faibussowitsch     PetscCall(PetscTableFind(gid1_lid1, gid1, &data));
3621a3bb6f32SFande Kong     if (!data) {
3622a3bb6f32SFande Kong       /* one based table */
36239566063dSJacob Faibussowitsch       PetscCall(PetscTableAdd(gid1_lid1, gid1, ++ec, INSERT_VALUES));
3624a3bb6f32SFande Kong     }
3625a3bb6f32SFande Kong   }
3626a3bb6f32SFande Kong   /* form array of columns we need */
36279566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(ec, &garray));
36289566063dSJacob Faibussowitsch   PetscCall(PetscTableGetHeadPosition(gid1_lid1, &tpos));
3629a3bb6f32SFande Kong   while (tpos) {
36309566063dSJacob Faibussowitsch     PetscCall(PetscTableGetNext(gid1_lid1, &tpos, &gid, &lid));
3631a3bb6f32SFande Kong     gid--;
3632a3bb6f32SFande Kong     lid--;
3633a3bb6f32SFande Kong     garray[lid] = gid;
3634a3bb6f32SFande Kong   }
36359566063dSJacob Faibussowitsch   PetscCall(PetscSortInt(ec, garray)); /* sort, and rebuild */
36369566063dSJacob Faibussowitsch   PetscCall(PetscTableRemoveAll(gid1_lid1));
363748a46eb9SPierre Jolivet   for (i = 0; i < ec; i++) PetscCall(PetscTableAdd(gid1_lid1, garray[i] + 1, i + 1, INSERT_VALUES));
3638a3bb6f32SFande Kong   /* compact out the extra columns in B */
363925b670f0SStefano Zampini   for (i = 0; i < nz; i++) {
364025b670f0SStefano Zampini     PetscInt gid1 = jj[i] + 1;
36419566063dSJacob Faibussowitsch     PetscCall(PetscTableFind(gid1_lid1, gid1, &lid));
3642a3bb6f32SFande Kong     lid--;
364325b670f0SStefano Zampini     jj[i] = lid;
3644a3bb6f32SFande Kong   }
36459566063dSJacob Faibussowitsch   PetscCall(PetscLayoutDestroy(&mat->cmap));
36469566063dSJacob Faibussowitsch   PetscCall(PetscTableDestroy(&gid1_lid1));
36479566063dSJacob Faibussowitsch   PetscCall(PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat), ec, ec, 1, &mat->cmap));
36489566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingCreate(PETSC_COMM_SELF, mat->cmap->bs, mat->cmap->n, garray, PETSC_OWN_POINTER, mapping));
36499566063dSJacob Faibussowitsch   PetscCall(ISLocalToGlobalMappingSetType(*mapping, ISLOCALTOGLOBALMAPPINGHASH));
3650a3bb6f32SFande Kong   PetscFunctionReturn(0);
3651a3bb6f32SFande Kong }
3652a3bb6f32SFande Kong 
3653bef8e0ddSBarry Smith /*@
3654bef8e0ddSBarry Smith     MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3655bef8e0ddSBarry Smith        in the matrix.
3656bef8e0ddSBarry Smith 
3657bef8e0ddSBarry Smith   Input Parameters:
365811a5261eSBarry Smith +  mat - the `MATSEQAIJ` matrix
3659bef8e0ddSBarry Smith -  indices - the column indices
3660bef8e0ddSBarry Smith 
366115091d37SBarry Smith   Level: advanced
366215091d37SBarry Smith 
3663bef8e0ddSBarry Smith   Notes:
3664bef8e0ddSBarry Smith     This can be called if you have precomputed the nonzero structure of the
3665bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
366611a5261eSBarry Smith   of the `MatSetValues()` operation.
3667bef8e0ddSBarry Smith 
3668bef8e0ddSBarry Smith     You MUST have set the correct numbers of nonzeros per row in the call to
366911a5261eSBarry Smith   `MatCreateSeqAIJ()`, and the columns indices MUST be sorted.
3670bef8e0ddSBarry Smith 
367111a5261eSBarry Smith     MUST be called before any calls to `MatSetValues()`
3672bef8e0ddSBarry Smith 
3673b9617806SBarry Smith     The indices should start with zero, not one.
3674b9617806SBarry Smith 
3675bef8e0ddSBarry Smith @*/
3676d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetColumnIndices(Mat mat, PetscInt *indices)
3677d71ae5a4SJacob Faibussowitsch {
3678bef8e0ddSBarry Smith   PetscFunctionBegin;
36790700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
3680dadcf809SJacob Faibussowitsch   PetscValidIntPointer(indices, 2);
3681cac4c232SBarry Smith   PetscUseMethod(mat, "MatSeqAIJSetColumnIndices_C", (Mat, PetscInt *), (mat, indices));
3682bef8e0ddSBarry Smith   PetscFunctionReturn(0);
3683bef8e0ddSBarry Smith }
3684bef8e0ddSBarry Smith 
3685be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/
3686be6bf707SBarry Smith 
3687d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues_SeqAIJ(Mat mat)
3688d71ae5a4SJacob Faibussowitsch {
3689be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3690d0f46423SBarry Smith   size_t      nz  = aij->i[mat->rmap->n];
3691be6bf707SBarry Smith 
3692be6bf707SBarry Smith   PetscFunctionBegin;
369328b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3694be6bf707SBarry Smith 
3695be6bf707SBarry Smith   /* allocate space for values if not already there */
36964dfa11a4SJacob Faibussowitsch   if (!aij->saved_values) { PetscCall(PetscMalloc1(nz + 1, &aij->saved_values)); }
3697be6bf707SBarry Smith 
3698be6bf707SBarry Smith   /* copy values over */
36999566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->saved_values, aij->a, nz));
3700be6bf707SBarry Smith   PetscFunctionReturn(0);
3701be6bf707SBarry Smith }
3702be6bf707SBarry Smith 
3703be6bf707SBarry Smith /*@
3704be6bf707SBarry Smith     MatStoreValues - Stashes a copy of the matrix values; this allows, for
3705be6bf707SBarry Smith        example, reuse of the linear part of a Jacobian, while recomputing the
3706be6bf707SBarry Smith        nonlinear portion.
3707be6bf707SBarry Smith 
370811a5261eSBarry Smith    Collect on mat
3709be6bf707SBarry Smith 
3710be6bf707SBarry Smith   Input Parameters:
371111a5261eSBarry Smith .  mat - the matrix (currently only `MATAIJ` matrices support this option)
3712be6bf707SBarry Smith 
371315091d37SBarry Smith   Level: advanced
371415091d37SBarry Smith 
371511a5261eSBarry Smith   Common Usage, with `SNESSolve()`:
3716be6bf707SBarry Smith $    Create Jacobian matrix
3717be6bf707SBarry Smith $    Set linear terms into matrix
3718be6bf707SBarry Smith $    Apply boundary conditions to matrix, at this time matrix must have
3719be6bf707SBarry Smith $      final nonzero structure (i.e. setting the nonlinear terms and applying
3720be6bf707SBarry Smith $      boundary conditions again will not change the nonzero structure
3721512a5fc5SBarry Smith $    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
3722be6bf707SBarry Smith $    ierr = MatStoreValues(mat);
3723be6bf707SBarry Smith $    Call SNESSetJacobian() with matrix
3724be6bf707SBarry Smith $    In your Jacobian routine
3725be6bf707SBarry Smith $      ierr = MatRetrieveValues(mat);
3726be6bf707SBarry Smith $      Set nonlinear terms in matrix
3727be6bf707SBarry Smith 
3728be6bf707SBarry Smith   Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself:
3729be6bf707SBarry Smith $    // build linear portion of Jacobian
3730512a5fc5SBarry Smith $    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
3731be6bf707SBarry Smith $    ierr = MatStoreValues(mat);
3732be6bf707SBarry Smith $    loop over nonlinear iterations
3733be6bf707SBarry Smith $       ierr = MatRetrieveValues(mat);
3734be6bf707SBarry Smith $       // call MatSetValues(mat,...) to set nonliner portion of Jacobian
3735be6bf707SBarry Smith $       // call MatAssemblyBegin/End() on matrix
3736be6bf707SBarry Smith $       Solve linear system with Jacobian
3737be6bf707SBarry Smith $    endloop
3738be6bf707SBarry Smith 
3739be6bf707SBarry Smith   Notes:
3740be6bf707SBarry Smith     Matrix must already be assemblied before calling this routine
374111a5261eSBarry Smith     Must set the matrix option `MatSetOption`(mat,`MAT_NEW_NONZERO_LOCATIONS`,`PETSC_FALSE`); before
3742be6bf707SBarry Smith     calling this routine.
3743be6bf707SBarry Smith 
37440c468ba9SBarry Smith     When this is called multiple times it overwrites the previous set of stored values
37450c468ba9SBarry Smith     and does not allocated additional space.
37460c468ba9SBarry Smith 
3747db781477SPatrick Sanan .seealso: `MatRetrieveValues()`
3748be6bf707SBarry Smith @*/
3749d71ae5a4SJacob Faibussowitsch PetscErrorCode MatStoreValues(Mat mat)
3750d71ae5a4SJacob Faibussowitsch {
3751be6bf707SBarry Smith   PetscFunctionBegin;
37520700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
375328b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
375428b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3755cac4c232SBarry Smith   PetscUseMethod(mat, "MatStoreValues_C", (Mat), (mat));
3756be6bf707SBarry Smith   PetscFunctionReturn(0);
3757be6bf707SBarry Smith }
3758be6bf707SBarry Smith 
3759d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues_SeqAIJ(Mat mat)
3760d71ae5a4SJacob Faibussowitsch {
3761be6bf707SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
3762d0f46423SBarry Smith   PetscInt    nz  = aij->i[mat->rmap->n];
3763be6bf707SBarry Smith 
3764be6bf707SBarry Smith   PetscFunctionBegin;
376528b400f6SJacob Faibussowitsch   PetscCheck(aij->nonew, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
376628b400f6SJacob Faibussowitsch   PetscCheck(aij->saved_values, PETSC_COMM_SELF, PETSC_ERR_ORDER, "Must call MatStoreValues(A);first");
3767be6bf707SBarry Smith   /* copy values over */
37689566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(aij->a, aij->saved_values, nz));
3769be6bf707SBarry Smith   PetscFunctionReturn(0);
3770be6bf707SBarry Smith }
3771be6bf707SBarry Smith 
3772be6bf707SBarry Smith /*@
3773be6bf707SBarry Smith     MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for
3774be6bf707SBarry Smith        example, reuse of the linear part of a Jacobian, while recomputing the
3775be6bf707SBarry Smith        nonlinear portion.
3776be6bf707SBarry Smith 
377711a5261eSBarry Smith    Collect on mat
3778be6bf707SBarry Smith 
3779be6bf707SBarry Smith   Input Parameters:
378011a5261eSBarry Smith .  mat - the matrix (currently only `MATAIJ` matrices support this option)
3781be6bf707SBarry Smith 
378215091d37SBarry Smith   Level: advanced
378315091d37SBarry Smith 
3784db781477SPatrick Sanan .seealso: `MatStoreValues()`
3785be6bf707SBarry Smith @*/
3786d71ae5a4SJacob Faibussowitsch PetscErrorCode MatRetrieveValues(Mat mat)
3787d71ae5a4SJacob Faibussowitsch {
3788be6bf707SBarry Smith   PetscFunctionBegin;
37890700a824SBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
379028b400f6SJacob Faibussowitsch   PetscCheck(mat->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
379128b400f6SJacob Faibussowitsch   PetscCheck(!mat->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
3792cac4c232SBarry Smith   PetscUseMethod(mat, "MatRetrieveValues_C", (Mat), (mat));
3793be6bf707SBarry Smith   PetscFunctionReturn(0);
3794be6bf707SBarry Smith }
3795be6bf707SBarry Smith 
3796be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/
379717ab2063SBarry Smith /*@C
379811a5261eSBarry Smith    MatCreateSeqAIJ - Creates a sparse matrix in `MATSEQAIJ` (compressed row) format
37990d15e28bSLois Curfman McInnes    (the default parallel PETSc format).  For good matrix assembly performance
38006e62573dSLois Curfman McInnes    the user should preallocate the matrix storage by setting the parameter nz
380151c19458SBarry Smith    (or the array nnz).  By setting these parameters accurately, performance
38022bd5e0b2SLois Curfman McInnes    during matrix assembly can be increased by more than a factor of 50.
380317ab2063SBarry Smith 
3804d083f849SBarry Smith    Collective
3805db81eaa0SLois Curfman McInnes 
380617ab2063SBarry Smith    Input Parameters:
380711a5261eSBarry Smith +  comm - MPI communicator, set to `PETSC_COMM_SELF`
380817ab2063SBarry Smith .  m - number of rows
380917ab2063SBarry Smith .  n - number of columns
381017ab2063SBarry Smith .  nz - number of nonzeros per row (same for all rows)
381151c19458SBarry Smith -  nnz - array containing the number of nonzeros in the various rows
38120298fd71SBarry Smith          (possibly different for each row) or NULL
381317ab2063SBarry Smith 
381417ab2063SBarry Smith    Output Parameter:
3815416022c9SBarry Smith .  A - the matrix
381617ab2063SBarry Smith 
381711a5261eSBarry Smith    It is recommended that one use the `MatCreate()`, `MatSetType()` and/or `MatSetFromOptions()`,
3818f6f02116SRichard Tran Mills    MatXXXXSetPreallocation() paradigm instead of this routine directly.
381911a5261eSBarry Smith    [MatXXXXSetPreallocation() is, for example, `MatSeqAIJSetPreallocation()`]
3820175b88e8SBarry Smith 
3821b259b22eSLois Curfman McInnes    Notes:
382249a6f317SBarry Smith    If nnz is given then nz is ignored
382349a6f317SBarry Smith 
382411a5261eSBarry Smith    The AIJ format, also called
382511a5261eSBarry Smith    compressed row storage, is fully compatible with standard Fortran 77
38260002213bSLois Curfman McInnes    storage.  That is, the stored row and column indices can begin at
382744cd7ae7SLois Curfman McInnes    either one (as in Fortran) or zero.  See the users' manual for details.
382817ab2063SBarry Smith 
382917ab2063SBarry Smith    Specify the preallocated storage with either nz or nnz (not both).
383011a5261eSBarry Smith    Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory
38313d323bbdSBarry Smith    allocation.  For large problems you MUST preallocate memory or you
38326da5968aSLois Curfman McInnes    will get TERRIBLE performance, see the users' manual chapter on matrices.
383317ab2063SBarry Smith 
3834682d7d0cSBarry Smith    By default, this format uses inodes (identical nodes) when possible, to
38354fca80b9SLois Curfman McInnes    improve numerical efficiency of matrix-vector products and solves. We
3836682d7d0cSBarry Smith    search for consecutive rows with the same nonzero structure, thereby
38376c7ebb05SLois Curfman McInnes    reusing matrix information to achieve increased efficiency.
38386c7ebb05SLois Curfman McInnes 
38396c7ebb05SLois Curfman McInnes    Options Database Keys:
3840698d4c6aSKris Buschelman +  -mat_no_inode  - Do not use inodes
38419db58ca8SBarry Smith -  -mat_inode_limit <limit> - Sets inode limit (max limit=5)
384217ab2063SBarry Smith 
3843027ccd11SLois Curfman McInnes    Level: intermediate
3844027ccd11SLois Curfman McInnes 
384560161072SBarry Smith .seealso: [Sparse Matrix Creation](sec_matsparse), `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`
384617ab2063SBarry Smith @*/
3847d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJ(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt nz, const PetscInt nnz[], Mat *A)
3848d71ae5a4SJacob Faibussowitsch {
38493a40ed3dSBarry Smith   PetscFunctionBegin;
38509566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, A));
38519566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*A, m, n, m, n));
38529566063dSJacob Faibussowitsch   PetscCall(MatSetType(*A, MATSEQAIJ));
38539566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*A, nz, nnz));
3854273d9f13SBarry Smith   PetscFunctionReturn(0);
3855273d9f13SBarry Smith }
3856273d9f13SBarry Smith 
3857273d9f13SBarry Smith /*@C
3858273d9f13SBarry Smith    MatSeqAIJSetPreallocation - For good matrix assembly performance
3859273d9f13SBarry Smith    the user should preallocate the matrix storage by setting the parameter nz
3860273d9f13SBarry Smith    (or the array nnz).  By setting these parameters accurately, performance
3861273d9f13SBarry Smith    during matrix assembly can be increased by more than a factor of 50.
3862273d9f13SBarry Smith 
3863d083f849SBarry Smith    Collective
3864273d9f13SBarry Smith 
3865273d9f13SBarry Smith    Input Parameters:
38661c4f3114SJed Brown +  B - The matrix
3867273d9f13SBarry Smith .  nz - number of nonzeros per row (same for all rows)
3868273d9f13SBarry Smith -  nnz - array containing the number of nonzeros in the various rows
38690298fd71SBarry Smith          (possibly different for each row) or NULL
3870273d9f13SBarry Smith 
3871273d9f13SBarry Smith    Notes:
387249a6f317SBarry Smith      If nnz is given then nz is ignored
387349a6f317SBarry Smith 
387411a5261eSBarry Smith     The `MATSEQAIJ` format also called
387511a5261eSBarry Smith    compressed row storage, is fully compatible with standard Fortran 77
3876273d9f13SBarry Smith    storage.  That is, the stored row and column indices can begin at
3877273d9f13SBarry Smith    either one (as in Fortran) or zero.  See the users' manual for details.
3878273d9f13SBarry Smith 
3879273d9f13SBarry Smith    Specify the preallocated storage with either nz or nnz (not both).
388011a5261eSBarry Smith    Set nz = `PETSC_DEFAULT` and nnz = NULL for PETSc to control dynamic memory
3881273d9f13SBarry Smith    allocation.  For large problems you MUST preallocate memory or you
3882273d9f13SBarry Smith    will get TERRIBLE performance, see the users' manual chapter on matrices.
3883273d9f13SBarry Smith 
388411a5261eSBarry Smith    You can call `MatGetInfo()` to get information on how effective the preallocation was;
3885aa95bbe8SBarry Smith    for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3886aa95bbe8SBarry Smith    You can also run with the option -info and look for messages with the string
3887aa95bbe8SBarry Smith    malloc in them to see if additional memory allocation was needed.
3888aa95bbe8SBarry Smith 
388911a5261eSBarry Smith    Developer Notes:
389011a5261eSBarry Smith    Use nz of `MAT_SKIP_ALLOCATION` to not allocate any space for the matrix
3891a96a251dSBarry Smith    entries or columns indices
3892a96a251dSBarry Smith 
3893273d9f13SBarry Smith    By default, this format uses inodes (identical nodes) when possible, to
3894273d9f13SBarry Smith    improve numerical efficiency of matrix-vector products and solves. We
3895273d9f13SBarry Smith    search for consecutive rows with the same nonzero structure, thereby
3896273d9f13SBarry Smith    reusing matrix information to achieve increased efficiency.
3897273d9f13SBarry Smith 
3898273d9f13SBarry Smith    Options Database Keys:
3899698d4c6aSKris Buschelman +  -mat_no_inode  - Do not use inodes
390047b2e64bSBarry Smith -  -mat_inode_limit <limit> - Sets inode limit (max limit=5)
3901273d9f13SBarry Smith 
3902273d9f13SBarry Smith    Level: intermediate
3903273d9f13SBarry Smith 
3904db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatSetValues()`, `MatSeqAIJSetColumnIndices()`, `MatCreateSeqAIJWithArrays()`, `MatGetInfo()`,
3905db781477SPatrick Sanan           `MatSeqAIJSetTotalPreallocation()`
3906273d9f13SBarry Smith @*/
3907d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation(Mat B, PetscInt nz, const PetscInt nnz[])
3908d71ae5a4SJacob Faibussowitsch {
3909a23d5eceSKris Buschelman   PetscFunctionBegin;
39106ba663aaSJed Brown   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
39116ba663aaSJed Brown   PetscValidType(B, 1);
3912cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocation_C", (Mat, PetscInt, const PetscInt[]), (B, nz, nnz));
3913a23d5eceSKris Buschelman   PetscFunctionReturn(0);
3914a23d5eceSKris Buschelman }
3915a23d5eceSKris Buschelman 
3916d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocation_SeqAIJ(Mat B, PetscInt nz, const PetscInt *nnz)
3917d71ae5a4SJacob Faibussowitsch {
3918273d9f13SBarry Smith   Mat_SeqAIJ *b;
39192576faa2SJed Brown   PetscBool   skipallocation = PETSC_FALSE, realalloc = PETSC_FALSE;
392097f1f81fSBarry Smith   PetscInt    i;
3921273d9f13SBarry Smith 
3922273d9f13SBarry Smith   PetscFunctionBegin;
39232576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3924a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3925c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3926c461c341SBarry Smith     nz             = 0;
3927c461c341SBarry Smith   }
39289566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
39299566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
3930899cda47SBarry Smith 
3931435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
393208401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nz cannot be less than 0: value %" PetscInt_FMT, nz);
3933cf9c20a2SJed Brown   if (PetscUnlikelyDebug(nnz)) {
3934d0f46423SBarry Smith     for (i = 0; i < B->rmap->n; i++) {
393508401ef6SPierre Jolivet       PetscCheck(nnz[i] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be less than 0: local row %" PetscInt_FMT " value %" PetscInt_FMT, i, nnz[i]);
393608401ef6SPierre Jolivet       PetscCheck(nnz[i] <= B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "nnz cannot be greater than row length: local row %" PetscInt_FMT " value %" PetscInt_FMT " rowlength %" PetscInt_FMT, i, nnz[i], B->cmap->n);
3937b73539f3SBarry Smith     }
3938b73539f3SBarry Smith   }
3939b73539f3SBarry Smith 
3940273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
39412205254eSKarl Rupp 
3942273d9f13SBarry Smith   b = (Mat_SeqAIJ *)B->data;
3943273d9f13SBarry Smith 
3944ab93d7beSBarry Smith   if (!skipallocation) {
39454dfa11a4SJacob Faibussowitsch     if (!b->imax) { PetscCall(PetscMalloc1(B->rmap->n, &b->imax)); }
3946071fcb05SBarry Smith     if (!b->ilen) {
3947071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
39489566063dSJacob Faibussowitsch       PetscCall(PetscCalloc1(B->rmap->n, &b->ilen));
3949071fcb05SBarry Smith     } else {
39509566063dSJacob Faibussowitsch       PetscCall(PetscMemzero(b->ilen, B->rmap->n * sizeof(PetscInt)));
39512ee49352SLisandro Dalcin     }
39524dfa11a4SJacob Faibussowitsch     if (!b->ipre) { PetscCall(PetscMalloc1(B->rmap->n, &b->ipre)); }
3953273d9f13SBarry Smith     if (!nnz) {
3954435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
3955c62bd62aSJed Brown       else if (nz < 0) nz = 1;
39565d2a9ed1SStefano Zampini       nz = PetscMin(nz, B->cmap->n);
3957d0f46423SBarry Smith       for (i = 0; i < B->rmap->n; i++) b->imax[i] = nz;
3958d0f46423SBarry Smith       nz = nz * B->rmap->n;
3959273d9f13SBarry Smith     } else {
3960c73702f5SBarry Smith       PetscInt64 nz64 = 0;
39619371c9d4SSatish Balay       for (i = 0; i < B->rmap->n; i++) {
39629371c9d4SSatish Balay         b->imax[i] = nnz[i];
39639371c9d4SSatish Balay         nz64 += nnz[i];
39649371c9d4SSatish Balay       }
39659566063dSJacob Faibussowitsch       PetscCall(PetscIntCast(nz64, &nz));
3966273d9f13SBarry Smith     }
3967ab93d7beSBarry Smith 
3968273d9f13SBarry Smith     /* allocate the matrix space */
396953dd7562SDmitry Karpeev     /* FIXME: should B's old memory be unlogged? */
39709566063dSJacob Faibussowitsch     PetscCall(MatSeqXAIJFreeAIJ(B, &b->a, &b->j, &b->i));
3971396832f4SHong Zhang     if (B->structure_only) {
39729566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(nz, &b->j));
39739566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(B->rmap->n + 1, &b->i));
3974396832f4SHong Zhang     } else {
39759566063dSJacob Faibussowitsch       PetscCall(PetscMalloc3(nz, &b->a, nz, &b->j, B->rmap->n + 1, &b->i));
3976396832f4SHong Zhang     }
3977bfeeae90SHong Zhang     b->i[0] = 0;
3978ad540459SPierre Jolivet     for (i = 1; i < B->rmap->n + 1; i++) b->i[i] = b->i[i - 1] + b->imax[i - 1];
3979396832f4SHong Zhang     if (B->structure_only) {
3980396832f4SHong Zhang       b->singlemalloc = PETSC_FALSE;
3981396832f4SHong Zhang       b->free_a       = PETSC_FALSE;
3982396832f4SHong Zhang     } else {
3983273d9f13SBarry Smith       b->singlemalloc = PETSC_TRUE;
3984e6b907acSBarry Smith       b->free_a       = PETSC_TRUE;
3985396832f4SHong Zhang     }
3986e6b907acSBarry Smith     b->free_ij = PETSC_TRUE;
3987c461c341SBarry Smith   } else {
3988e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
3989e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
3990c461c341SBarry Smith   }
3991273d9f13SBarry Smith 
3992846b4da1SFande Kong   if (b->ipre && nnz != b->ipre && b->imax) {
3993846b4da1SFande Kong     /* reserve user-requested sparsity */
39949566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(b->ipre, b->imax, B->rmap->n));
3995846b4da1SFande Kong   }
3996846b4da1SFande Kong 
3997273d9f13SBarry Smith   b->nz               = 0;
3998273d9f13SBarry Smith   b->maxnz            = nz;
3999273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
40001baa6e33SBarry Smith   if (realalloc) PetscCall(MatSetOption(B, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_TRUE));
4001cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
4002cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
40035519a089SJose E. Roman   /* We simply deem preallocation has changed nonzero state. Updating the state
40045519a089SJose E. Roman      will give clients (like AIJKokkos) a chance to know something has happened.
40055519a089SJose E. Roman   */
40065519a089SJose E. Roman   B->nonzerostate++;
4007273d9f13SBarry Smith   PetscFunctionReturn(0);
4008273d9f13SBarry Smith }
4009273d9f13SBarry Smith 
4010d71ae5a4SJacob Faibussowitsch PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
4011d71ae5a4SJacob Faibussowitsch {
4012846b4da1SFande Kong   Mat_SeqAIJ *a;
4013a5bbaf83SFande Kong   PetscInt    i;
4014846b4da1SFande Kong 
4015846b4da1SFande Kong   PetscFunctionBegin;
4016846b4da1SFande Kong   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
401714d0e64fSAlex Lindsay 
401814d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
401914d0e64fSAlex Lindsay   if (!A->rmap->n) PetscFunctionReturn(0);
402014d0e64fSAlex Lindsay 
4021846b4da1SFande Kong   a = (Mat_SeqAIJ *)A->data;
40222c814fdeSFande Kong   /* if no saved info, we error out */
402328b400f6SJacob Faibussowitsch   PetscCheck(a->ipre, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "No saved preallocation info ");
40242c814fdeSFande Kong 
4025aed4548fSBarry Smith   PetscCheck(a->i && a->j && a->a && a->imax && a->ilen, PETSC_COMM_SELF, PETSC_ERR_ARG_NULL, "Memory info is incomplete, and can not reset preallocation ");
40262c814fdeSFande Kong 
40279566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->imax, a->ipre, A->rmap->n));
40289566063dSJacob Faibussowitsch   PetscCall(PetscArrayzero(a->ilen, A->rmap->n));
4029846b4da1SFande Kong   a->i[0] = 0;
4030ad540459SPierre Jolivet   for (i = 1; i < A->rmap->n + 1; i++) a->i[i] = a->i[i - 1] + a->imax[i - 1];
4031846b4da1SFande Kong   A->preallocated     = PETSC_TRUE;
4032846b4da1SFande Kong   a->nz               = 0;
4033846b4da1SFande Kong   a->maxnz            = a->i[A->rmap->n];
4034846b4da1SFande Kong   A->info.nz_unneeded = (double)a->maxnz;
4035846b4da1SFande Kong   A->was_assembled    = PETSC_FALSE;
4036846b4da1SFande Kong   A->assembled        = PETSC_FALSE;
4037846b4da1SFande Kong   PetscFunctionReturn(0);
4038846b4da1SFande Kong }
4039846b4da1SFande Kong 
404058d36128SBarry Smith /*@
404111a5261eSBarry Smith    MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in `MATSEQAIJ` format.
4042a1661176SMatthew Knepley 
4043a1661176SMatthew Knepley    Input Parameters:
4044a1661176SMatthew Knepley +  B - the matrix
4045a1661176SMatthew Knepley .  i - the indices into j for the start of each row (starts with zero)
4046a1661176SMatthew Knepley .  j - the column indices for each row (starts with zero) these must be sorted for each row
4047a1661176SMatthew Knepley -  v - optional values in the matrix
4048a1661176SMatthew Knepley 
4049a1661176SMatthew Knepley    Level: developer
4050a1661176SMatthew Knepley 
40516a9b8d82SBarry Smith    Notes:
405211a5261eSBarry Smith       The i,j,v values are COPIED with this routine; to avoid the copy use `MatCreateSeqAIJWithArrays()`
405358d36128SBarry Smith 
40546a9b8d82SBarry Smith       This routine may be called multiple times with different nonzero patterns (or the same nonzero pattern). The nonzero
40556a9b8d82SBarry Smith       structure will be the union of all the previous nonzero structures.
40566a9b8d82SBarry Smith 
40576a9b8d82SBarry Smith     Developer Notes:
40586a9b8d82SBarry Smith       An optimization could be added to the implementation where it checks if the i, and j are identical to the current i and j and
405911a5261eSBarry Smith       then just copies the v values directly with `PetscMemcpy()`.
40606a9b8d82SBarry Smith 
406111a5261eSBarry Smith       This routine could also take a `PetscCopyMode` argument to allow sharing the values instead of always copying them.
40626a9b8d82SBarry Smith 
4063db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateSeqAIJ()`, `MatSetValues()`, `MatSeqAIJSetPreallocation()`, `MatCreateSeqAIJWithArrays()`, `MATSEQAIJ`, `MatResetPreallocation()`
4064a1661176SMatthew Knepley @*/
4065d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B, const PetscInt i[], const PetscInt j[], const PetscScalar v[])
4066d71ae5a4SJacob Faibussowitsch {
4067a1661176SMatthew Knepley   PetscFunctionBegin;
  /* B must be a valid Mat whose type has been set (argument 1) */
40680700a824SBarry Smith   PetscValidHeaderSpecific(B, MAT_CLASSID, 1);
40696ba663aaSJed Brown   PetscValidType(B, 1);
  /* Hand i, j, v unchanged to the method looked up on B under the name "MatSeqAIJSetPreallocationCSR_C".
     NOTE(review): PetscTryMethod presumably does nothing when B's type does not provide that method,
     so the call would then succeed without preallocating - confirm against the macro definition. */
4070cac4c232SBarry Smith   PetscTryMethod(B, "MatSeqAIJSetPreallocationCSR_C", (Mat, const PetscInt[], const PetscInt[], const PetscScalar[]), (B, i, j, v));
4071a1661176SMatthew Knepley   PetscFunctionReturn(0);
4072a1661176SMatthew Knepley }
4073a1661176SMatthew Knepley 
4074d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B, const PetscInt Ii[], const PetscInt J[], const PetscScalar v[])
4075d71ae5a4SJacob Faibussowitsch {
4076a1661176SMatthew Knepley   PetscInt  i;
4077a1661176SMatthew Knepley   PetscInt  m, n;
4078a1661176SMatthew Knepley   PetscInt  nz;
40796a9b8d82SBarry Smith   PetscInt *nnz;
4080a1661176SMatthew Knepley 
4081a1661176SMatthew Knepley   PetscFunctionBegin;
4082aed4548fSBarry Smith   PetscCheck(Ii[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %" PetscInt_FMT, Ii[0]);
4083779a8d59SSatish Balay 
40849566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->rmap));
40859566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(B->cmap));
4086779a8d59SSatish Balay 
40879566063dSJacob Faibussowitsch   PetscCall(MatGetSize(B, &m, &n));
40889566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m + 1, &nnz));
4089a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4090b7940d39SSatish Balay     nz = Ii[i + 1] - Ii[i];
409108401ef6SPierre Jolivet     PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Local row %" PetscInt_FMT " has a negative number of columns %" PetscInt_FMT, i, nz);
4092a1661176SMatthew Knepley     nnz[i] = nz;
4093a1661176SMatthew Knepley   }
40949566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation(B, 0, nnz));
40959566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
4096a1661176SMatthew Knepley 
409748a46eb9SPierre Jolivet   for (i = 0; i < m; i++) PetscCall(MatSetValues_SeqAIJ(B, 1, &i, Ii[i + 1] - Ii[i], J + Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES));
4098a1661176SMatthew Knepley 
40999566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(B, MAT_FINAL_ASSEMBLY));
41009566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(B, MAT_FINAL_ASSEMBLY));
4101a1661176SMatthew Knepley 
41029566063dSJacob Faibussowitsch   PetscCall(MatSetOption(B, MAT_NEW_NONZERO_LOCATION_ERR, PETSC_TRUE));
4103a1661176SMatthew Knepley   PetscFunctionReturn(0);
4104a1661176SMatthew Knepley }
4105a1661176SMatthew Knepley 
4106ad7e164aSPierre Jolivet /*@
4107ad7e164aSPierre Jolivet    MatSeqAIJKron - Computes C, the Kronecker product of A and B.
4108ad7e164aSPierre Jolivet 
4109ad7e164aSPierre Jolivet    Input Parameters:
4110ad7e164aSPierre Jolivet +  A - left-hand side matrix
4111ad7e164aSPierre Jolivet .  B - right-hand side matrix
411211a5261eSBarry Smith -  reuse - either `MAT_INITIAL_MATRIX` or `MAT_REUSE_MATRIX`
4113ad7e164aSPierre Jolivet 
4114ad7e164aSPierre Jolivet    Output Parameter:
4115ad7e164aSPierre Jolivet .  C - Kronecker product of A and B
4116ad7e164aSPierre Jolivet 
4117ad7e164aSPierre Jolivet    Level: intermediate
4118ad7e164aSPierre Jolivet 
411911a5261eSBarry Smith    Note:
412011a5261eSBarry Smith       `MAT_REUSE_MATRIX` can only be used when the nonzero structure of the product matrix has not changed since the last call to `MatSeqAIJKron()`.
4121ad7e164aSPierre Jolivet 
4122db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATKAIJ`, `MatReuse`
4123ad7e164aSPierre Jolivet @*/
4124d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron(Mat A, Mat B, MatReuse reuse, Mat *C)
4125d71ae5a4SJacob Faibussowitsch {
4126ad7e164aSPierre Jolivet   PetscFunctionBegin;
  /* A (argument 1) and B (argument 2) must be valid Mat objects with their type set */
4127ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(A, MAT_CLASSID, 1);
4128ad7e164aSPierre Jolivet   PetscValidType(A, 1);
4129ad7e164aSPierre Jolivet   PetscValidHeaderSpecific(B, MAT_CLASSID, 2);
4130ad7e164aSPierre Jolivet   PetscValidType(B, 2);
4131ad7e164aSPierre Jolivet   PetscValidPointer(C, 4);
  /* *C is only inspected when an existing matrix is being reused */
4132ad7e164aSPierre Jolivet   if (reuse == MAT_REUSE_MATRIX) {
4133ad7e164aSPierre Jolivet     PetscValidHeaderSpecific(*C, MAT_CLASSID, 4);
4134ad7e164aSPierre Jolivet     PetscValidType(*C, 4);
4135ad7e164aSPierre Jolivet   }
  /* Dispatch on the type of A through the method looked up under the name "MatSeqAIJKron_C".
     NOTE(review): PetscTryMethod presumably does nothing when A's type does not provide that method;
     with MAT_INITIAL_MATRIX *C would then be left unset while the call still succeeds - confirm. */
4136cac4c232SBarry Smith   PetscTryMethod(A, "MatSeqAIJKron_C", (Mat, Mat, MatReuse, Mat *), (A, B, reuse, C));
4137ad7e164aSPierre Jolivet   PetscFunctionReturn(0);
4138ad7e164aSPierre Jolivet }
4139ad7e164aSPierre Jolivet 
4140d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJKron_SeqAIJ(Mat A, Mat B, MatReuse reuse, Mat *C)
4141d71ae5a4SJacob Faibussowitsch {
4142ad7e164aSPierre Jolivet   Mat                newmat;
4143ad7e164aSPierre Jolivet   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data;
4144ad7e164aSPierre Jolivet   Mat_SeqAIJ        *b = (Mat_SeqAIJ *)B->data;
4145ad7e164aSPierre Jolivet   PetscScalar       *v;
4146fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4147ad7e164aSPierre Jolivet   PetscInt          *i, *j, m, n, p, q, nnz = 0, am = A->rmap->n, bm = B->rmap->n, an = A->cmap->n, bn = B->cmap->n;
4148ad7e164aSPierre Jolivet   PetscBool          flg;
4149ad7e164aSPierre Jolivet 
4150ad7e164aSPierre Jolivet   PetscFunctionBegin;
415128b400f6SJacob Faibussowitsch   PetscCheck(!A->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
415228b400f6SJacob Faibussowitsch   PetscCheck(A->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
415328b400f6SJacob Faibussowitsch   PetscCheck(!B->factortype, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for factored matrix");
415428b400f6SJacob Faibussowitsch   PetscCheck(B->assembled, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Not for unassembled matrix");
41559566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)B, MATSEQAIJ, &flg));
415628b400f6SJacob Faibussowitsch   PetscCheck(flg, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatType %s", ((PetscObject)B)->type_name);
4157aed4548fSBarry Smith   PetscCheck(reuse == MAT_INITIAL_MATRIX || reuse == MAT_REUSE_MATRIX, PETSC_COMM_SELF, PETSC_ERR_SUP, "MatReuse %d", (int)reuse);
4158ad7e164aSPierre Jolivet   if (reuse == MAT_INITIAL_MATRIX) {
41599566063dSJacob Faibussowitsch     PetscCall(PetscMalloc2(am * bm + 1, &i, a->i[am] * b->i[bm], &j));
41609566063dSJacob Faibussowitsch     PetscCall(MatCreate(PETSC_COMM_SELF, &newmat));
41619566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(newmat, am * bm, an * bn, am * bm, an * bn));
41629566063dSJacob Faibussowitsch     PetscCall(MatSetType(newmat, MATAIJ));
4163ad7e164aSPierre Jolivet     i[0] = 0;
4164ad7e164aSPierre Jolivet     for (m = 0; m < am; ++m) {
4165ad7e164aSPierre Jolivet       for (p = 0; p < bm; ++p) {
4166ad7e164aSPierre Jolivet         i[m * bm + p + 1] = i[m * bm + p] + (a->i[m + 1] - a->i[m]) * (b->i[p + 1] - b->i[p]);
4167ad7e164aSPierre Jolivet         for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4168ad540459SPierre Jolivet           for (q = b->i[p]; q < b->i[p + 1]; ++q) j[nnz++] = a->j[n] * bn + b->j[q];
4169ad7e164aSPierre Jolivet         }
4170ad7e164aSPierre Jolivet       }
4171ad7e164aSPierre Jolivet     }
41729566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocationCSR(newmat, i, j, NULL));
4173ad7e164aSPierre Jolivet     *C = newmat;
41749566063dSJacob Faibussowitsch     PetscCall(PetscFree2(i, j));
4175ad7e164aSPierre Jolivet     nnz = 0;
4176ad7e164aSPierre Jolivet   }
41779566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(*C, &v));
41789566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
41799566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
4180ad7e164aSPierre Jolivet   for (m = 0; m < am; ++m) {
4181ad7e164aSPierre Jolivet     for (p = 0; p < bm; ++p) {
4182ad7e164aSPierre Jolivet       for (n = a->i[m]; n < a->i[m + 1]; ++n) {
4183ad540459SPierre Jolivet         for (q = b->i[p]; q < b->i[p + 1]; ++q) v[nnz++] = aa[n] * ba[q];
4184ad7e164aSPierre Jolivet       }
4185ad7e164aSPierre Jolivet     }
4186ad7e164aSPierre Jolivet   }
41879566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(*C, &v));
41889566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
41899566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
4190ad7e164aSPierre Jolivet   PetscFunctionReturn(0);
4191ad7e164aSPierre Jolivet }
4192ad7e164aSPierre Jolivet 
4193c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4194af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4195170fe5c8SBarry Smith 
4196170fe5c8SBarry Smith /*
4197170fe5c8SBarry Smith     Computes (B'*A')' since computing A*B directly is untenable
4198170fe5c8SBarry Smith 
4199170fe5c8SBarry Smith                n                       p                          p
42002da392ccSBarry Smith         [             ]       [             ]         [                 ]
42012da392ccSBarry Smith       m [      A      ]  *  n [       B     ]   =   m [         C       ]
42022da392ccSBarry Smith         [             ]       [             ]         [                 ]
4203170fe5c8SBarry Smith 
4204170fe5c8SBarry Smith */
4205d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A, Mat B, Mat C)
4206d71ae5a4SJacob Faibussowitsch {
4207170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense *)A->data;
4208170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ *)B->data;
4209170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense *)C->data;
421086214ceeSStefano Zampini   PetscInt           i, j, n, m, q, p;
4211170fe5c8SBarry Smith   const PetscInt    *ii, *idx;
4212170fe5c8SBarry Smith   const PetscScalar *b, *a, *a_q;
4213170fe5c8SBarry Smith   PetscScalar       *c, *c_q;
421486214ceeSStefano Zampini   PetscInt           clda = sub_c->lda;
421586214ceeSStefano Zampini   PetscInt           alda = sub_a->lda;
4216170fe5c8SBarry Smith 
4217170fe5c8SBarry Smith   PetscFunctionBegin;
4218d0f46423SBarry Smith   m = A->rmap->n;
4219d0f46423SBarry Smith   n = A->cmap->n;
4220d0f46423SBarry Smith   p = B->cmap->n;
4221170fe5c8SBarry Smith   a = sub_a->v;
4222170fe5c8SBarry Smith   b = sub_b->a;
4223170fe5c8SBarry Smith   c = sub_c->v;
422486214ceeSStefano Zampini   if (clda == m) {
42259566063dSJacob Faibussowitsch     PetscCall(PetscArrayzero(c, m * p));
422686214ceeSStefano Zampini   } else {
422786214ceeSStefano Zampini     for (j = 0; j < p; j++)
42289371c9d4SSatish Balay       for (i = 0; i < m; i++) c[j * clda + i] = 0.0;
422986214ceeSStefano Zampini   }
4230170fe5c8SBarry Smith   ii  = sub_b->i;
4231170fe5c8SBarry Smith   idx = sub_b->j;
4232170fe5c8SBarry Smith   for (i = 0; i < n; i++) {
4233170fe5c8SBarry Smith     q = ii[i + 1] - ii[i];
4234170fe5c8SBarry Smith     while (q-- > 0) {
423586214ceeSStefano Zampini       c_q = c + clda * (*idx);
423686214ceeSStefano Zampini       a_q = a + alda * i;
4237854c7f52SBarry Smith       PetscKernelAXPY(c_q, *b, a_q, m);
4238170fe5c8SBarry Smith       idx++;
4239170fe5c8SBarry Smith       b++;
4240170fe5c8SBarry Smith     }
4241170fe5c8SBarry Smith   }
4242170fe5c8SBarry Smith   PetscFunctionReturn(0);
4243170fe5c8SBarry Smith }
4244170fe5c8SBarry Smith 
4245d71ae5a4SJacob Faibussowitsch PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A, Mat B, PetscReal fill, Mat C)
4246d71ae5a4SJacob Faibussowitsch {
4247d0f46423SBarry Smith   PetscInt  m = A->rmap->n, n = B->cmap->n;
424886214ceeSStefano Zampini   PetscBool cisdense;
4249170fe5c8SBarry Smith 
4250170fe5c8SBarry Smith   PetscFunctionBegin;
425108401ef6SPierre Jolivet   PetscCheck(A->cmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_ARG_SIZ, "A->cmap->n %" PetscInt_FMT " != B->rmap->n %" PetscInt_FMT, A->cmap->n, B->rmap->n);
42529566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(C, m, n, m, n));
42539566063dSJacob Faibussowitsch   PetscCall(MatSetBlockSizesFromMats(C, A, B));
42549566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompareAny((PetscObject)C, &cisdense, MATSEQDENSE, MATSEQDENSECUDA, ""));
425548a46eb9SPierre Jolivet   if (!cisdense) PetscCall(MatSetType(C, MATDENSE));
42569566063dSJacob Faibussowitsch   PetscCall(MatSetUp(C));
4257d73949e8SHong Zhang 
42584222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
4259170fe5c8SBarry Smith   PetscFunctionReturn(0);
4260170fe5c8SBarry Smith }
4261170fe5c8SBarry Smith 
4262170fe5c8SBarry Smith /* ----------------------------------------------------------------*/
42630bad9183SKris Buschelman /*MC
4264fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
42650bad9183SKris Buschelman    based on compressed sparse row format.
42660bad9183SKris Buschelman 
42670bad9183SKris Buschelman    Options Database Keys:
42680bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
42690bad9183SKris Buschelman 
42700bad9183SKris Buschelman    Level: beginner
42710bad9183SKris Buschelman 
42720cd7f59aSBarry Smith    Notes:
427311a5261eSBarry Smith     `MatSetValues()` may be called for this matrix type with a NULL argument for the numerical values,
42740cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
42750cd7f59aSBarry Smith     in the matrix
42760cd7f59aSBarry Smith 
427711a5261eSBarry Smith     `MatSetOption`(,`MAT_STRUCTURE_ONLY`,`PETSC_TRUE`) may be called for this matrix type. In this case no
427811a5261eSBarry Smith     space is allocated for the nonzero entries and any entries passed with `MatSetValues()` are ignored
42790cd7f59aSBarry Smith 
428011a5261eSBarry Smith   Developer Note:
42810cd7f59aSBarry Smith     It would be nice if all matrix formats supported passing NULL in for the numerical values
42820cd7f59aSBarry Smith 
4283db781477SPatrick Sanan .seealso: `MatCreateSeqAIJ()`, `MatSetFromOptions()`, `MatSetType()`, `MatCreate()`, `MatType`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
42840bad9183SKris Buschelman M*/
42850bad9183SKris Buschelman 
4286ccd284c7SBarry Smith /*MC
4287ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4288ccd284c7SBarry Smith 
428911a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJ` when constructed with a single process communicator,
429011a5261eSBarry Smith    and `MATMPIAIJ` otherwise.  As a result, for single process communicators,
429111a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4292ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4293ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4294ccd284c7SBarry Smith 
4295ccd284c7SBarry Smith    Options Database Keys:
429611a5261eSBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to `MatSetFromOptions()`
4297ccd284c7SBarry Smith 
429811a5261eSBarry Smith    Note:
429911a5261eSBarry Smith    Subclasses include `MATAIJCUSPARSE`, `MATAIJPERM`, `MATAIJSELL`, `MATAIJMKL`, and `MATAIJCRL`. This type also automatically switches over to use inodes when
4300ccd284c7SBarry Smith    enough exist.
4301ccd284c7SBarry Smith 
4302ccd284c7SBarry Smith   Level: beginner
4303ccd284c7SBarry Smith 
4304db781477SPatrick Sanan .seealso: `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MATSEQAIJ`, `MATMPIAIJ`, `MATSELL`, `MATSEQSELL`, `MATMPISELL`
4305ccd284c7SBarry Smith M*/
4306ccd284c7SBarry Smith 
4307ccd284c7SBarry Smith /*MC
4308ccd284c7SBarry Smith    MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.
4309ccd284c7SBarry Smith 
431011a5261eSBarry Smith    This matrix type is identical to `MATSEQAIJCRL` when constructed with a single process communicator,
431111a5261eSBarry Smith    and `MATMPIAIJCRL` otherwise.  As a result, for single process communicators,
431211a5261eSBarry Smith    `MatSeqAIJSetPreallocation()` is supported, and similarly `MatMPIAIJSetPreallocation()` is supported
4313ccd284c7SBarry Smith    for communicators controlling multiple processes.  It is recommended that you call both of
4314ccd284c7SBarry Smith    the above preallocation routines for simplicity.
4315ccd284c7SBarry Smith 
4316ccd284c7SBarry Smith    Options Database Keys:
431711a5261eSBarry Smith . -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to `MatSetFromOptions()`
4318ccd284c7SBarry Smith 
4319ccd284c7SBarry Smith   Level: beginner
4320ccd284c7SBarry Smith 
4321c2e3fba1SPatrick Sanan .seealso: `MatCreateMPIAIJCRL`, `MATSEQAIJCRL`, `MATMPIAIJCRL`
4322ccd284c7SBarry Smith M*/
4323ccd284c7SBarry Smith 
43247906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat, MatType, MatReuse, Mat *);
43257906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
43267906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat, MatType, MatReuse, Mat *);
43277906f579SHong Zhang #endif
4328d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
4329d24d4204SJose E. Roman PETSC_INTERN PetscErrorCode MatConvert_AIJ_ScaLAPACK(Mat, MatType, MatReuse, Mat *);
4330d24d4204SJose E. Roman #endif
43317906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
43327906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A, MatType, MatReuse, Mat *);
43337906f579SHong Zhang #endif
43347906f579SHong Zhang 
4335d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat, MatType, MatReuse, Mat *);
4336c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat, MatType, MatReuse, Mat *);
43374222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
43387906f579SHong Zhang 
43398c778c55SBarry Smith /*@C
434011a5261eSBarry Smith    MatSeqAIJGetArray - gives read/write access to the array where the data for a `MATSEQAIJ` matrix is stored
43418c778c55SBarry Smith 
43428c778c55SBarry Smith    Not Collective
43438c778c55SBarry Smith 
43448c778c55SBarry Smith    Input Parameter:
434511a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
43468c778c55SBarry Smith 
43478c778c55SBarry Smith    Output Parameter:
43488c778c55SBarry Smith .   array - pointer to the data
43498c778c55SBarry Smith 
43508c778c55SBarry Smith    Level: intermediate
43518c778c55SBarry Smith 
4352db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
43538c778c55SBarry Smith @*/
4354d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArray(Mat A, PetscScalar **array)
4355d71ae5a4SJacob Faibussowitsch {
4356d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
43578c778c55SBarry Smith 
43588c778c55SBarry Smith   PetscFunctionBegin;
4359d67d9f35SJunchao Zhang   if (aij->ops->getarray) {
43609566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarray)(A, array));
4361d67d9f35SJunchao Zhang   } else {
4362d67d9f35SJunchao Zhang     *array = aij->a;
4363d67d9f35SJunchao Zhang   }
4364d67d9f35SJunchao Zhang   PetscFunctionReturn(0);
4365d67d9f35SJunchao Zhang }
4366d67d9f35SJunchao Zhang 
4367d67d9f35SJunchao Zhang /*@C
436811a5261eSBarry Smith    MatSeqAIJRestoreArray - returns access to the array where the data for a `MATSEQAIJ` matrix is stored obtained by `MatSeqAIJGetArray()`
4369d67d9f35SJunchao Zhang 
4370d67d9f35SJunchao Zhang    Not Collective
4371d67d9f35SJunchao Zhang 
4372d67d9f35SJunchao Zhang    Input Parameters:
437311a5261eSBarry Smith +  mat - a `MATSEQAIJ` matrix
4374d67d9f35SJunchao Zhang -  array - pointer to the data
4375d67d9f35SJunchao Zhang 
4376d67d9f35SJunchao Zhang    Level: intermediate
4377d67d9f35SJunchao Zhang 
4378db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayF90()`
4379d67d9f35SJunchao Zhang @*/
4380d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArray(Mat A, PetscScalar **array)
4381d71ae5a4SJacob Faibussowitsch {
4382d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4383d67d9f35SJunchao Zhang 
4384d67d9f35SJunchao Zhang   PetscFunctionBegin;
4385d67d9f35SJunchao Zhang   if (aij->ops->restorearray) {
43869566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearray)(A, array));
4387d67d9f35SJunchao Zhang   } else {
4388d67d9f35SJunchao Zhang     *array = NULL;
4389d67d9f35SJunchao Zhang   }
43909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
43919566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
43928c778c55SBarry Smith   PetscFunctionReturn(0);
43938c778c55SBarry Smith }
43948c778c55SBarry Smith 
439521e72a00SBarry Smith /*@C
439611a5261eSBarry Smith    MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a `MATSEQAIJ` matrix is stored
43978f1ea47aSStefano Zampini 
43988f1ea47aSStefano Zampini    Not Collective
43998f1ea47aSStefano Zampini 
44008f1ea47aSStefano Zampini    Input Parameter:
440111a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
44028f1ea47aSStefano Zampini 
44038f1ea47aSStefano Zampini    Output Parameter:
44048f1ea47aSStefano Zampini .   array - pointer to the data
44058f1ea47aSStefano Zampini 
44068f1ea47aSStefano Zampini    Level: intermediate
44078f1ea47aSStefano Zampini 
4408db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayRead()`
44098f1ea47aSStefano Zampini @*/
4410d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayRead(Mat A, const PetscScalar **array)
4411d71ae5a4SJacob Faibussowitsch {
4412d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44138f1ea47aSStefano Zampini 
44148f1ea47aSStefano Zampini   PetscFunctionBegin;
4415d67d9f35SJunchao Zhang   if (aij->ops->getarrayread) {
44169566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarrayread)(A, array));
4417d67d9f35SJunchao Zhang   } else {
4418d67d9f35SJunchao Zhang     *array = aij->a;
4419d67d9f35SJunchao Zhang   }
44208f1ea47aSStefano Zampini   PetscFunctionReturn(0);
44218f1ea47aSStefano Zampini }
44228f1ea47aSStefano Zampini 
44238f1ea47aSStefano Zampini /*@C
442411a5261eSBarry Smith    MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from `MatSeqAIJGetArrayRead()`
44258f1ea47aSStefano Zampini 
44268f1ea47aSStefano Zampini    Not Collective
44278f1ea47aSStefano Zampini 
44288f1ea47aSStefano Zampini    Input Parameter:
442911a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
44308f1ea47aSStefano Zampini 
44318f1ea47aSStefano Zampini    Output Parameter:
44328f1ea47aSStefano Zampini .   array - pointer to the data
44338f1ea47aSStefano Zampini 
44348f1ea47aSStefano Zampini    Level: intermediate
44358f1ea47aSStefano Zampini 
4436db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
44378f1ea47aSStefano Zampini @*/
4438d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayRead(Mat A, const PetscScalar **array)
4439d71ae5a4SJacob Faibussowitsch {
4440d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
44418f1ea47aSStefano Zampini 
44428f1ea47aSStefano Zampini   PetscFunctionBegin;
4443d67d9f35SJunchao Zhang   if (aij->ops->restorearrayread) {
44449566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearrayread)(A, array));
4445d67d9f35SJunchao Zhang   } else {
4446d67d9f35SJunchao Zhang     *array = NULL;
4447d67d9f35SJunchao Zhang   }
4448d67d9f35SJunchao Zhang   PetscFunctionReturn(0);
4449d67d9f35SJunchao Zhang }
4450d67d9f35SJunchao Zhang 
4451d67d9f35SJunchao Zhang /*@C
445211a5261eSBarry Smith    MatSeqAIJGetArrayWrite - gives write-only access to the array where the data for a `MATSEQAIJ` matrix is stored
4453d67d9f35SJunchao Zhang 
4454d67d9f35SJunchao Zhang    Not Collective
4455d67d9f35SJunchao Zhang 
4456d67d9f35SJunchao Zhang    Input Parameter:
445711a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
4458d67d9f35SJunchao Zhang 
4459d67d9f35SJunchao Zhang    Output Parameter:
4460d67d9f35SJunchao Zhang .   array - pointer to the data
4461d67d9f35SJunchao Zhang 
4462d67d9f35SJunchao Zhang    Level: intermediate
4463d67d9f35SJunchao Zhang 
4464db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJRestoreArrayWrite()`
4465d67d9f35SJunchao Zhang @*/
4466d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetArrayWrite(Mat A, PetscScalar **array)
4467d71ae5a4SJacob Faibussowitsch {
4468d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4469d67d9f35SJunchao Zhang 
4470d67d9f35SJunchao Zhang   PetscFunctionBegin;
4471d67d9f35SJunchao Zhang   if (aij->ops->getarraywrite) {
44729566063dSJacob Faibussowitsch     PetscCall((*aij->ops->getarraywrite)(A, array));
4473d67d9f35SJunchao Zhang   } else {
4474d67d9f35SJunchao Zhang     *array = aij->a;
4475d67d9f35SJunchao Zhang   }
44769566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal(A));
44779566063dSJacob Faibussowitsch   PetscCall(PetscObjectStateIncrease((PetscObject)A));
4478d67d9f35SJunchao Zhang   PetscFunctionReturn(0);
4479d67d9f35SJunchao Zhang }
4480d67d9f35SJunchao Zhang 
4481d67d9f35SJunchao Zhang /*@C
4482d67d9f35SJunchao Zhang    MatSeqAIJRestoreArrayWrite - restore the write-only access array obtained from `MatSeqAIJGetArrayWrite()`
4483d67d9f35SJunchao Zhang 
4484d67d9f35SJunchao Zhang    Not Collective
4485d67d9f35SJunchao Zhang 
4486d67d9f35SJunchao Zhang    Input Parameter:
4487d67d9f35SJunchao Zhang .  mat - a MATSEQAIJ matrix
4488d67d9f35SJunchao Zhang 
4489d67d9f35SJunchao Zhang    Output Parameter:
4490d67d9f35SJunchao Zhang .   array - pointer to the data
4491d67d9f35SJunchao Zhang 
4492d67d9f35SJunchao Zhang    Level: intermediate
4493d67d9f35SJunchao Zhang 
4494db781477SPatrick Sanan .seealso: `MatSeqAIJGetArrayWrite()`, `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
4495d67d9f35SJunchao Zhang @*/
4496d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRestoreArrayWrite(Mat A, PetscScalar **array)
4497d71ae5a4SJacob Faibussowitsch {
4498d67d9f35SJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
4499d67d9f35SJunchao Zhang 
4500d67d9f35SJunchao Zhang   PetscFunctionBegin;
4501d67d9f35SJunchao Zhang   if (aij->ops->restorearraywrite) {
45029566063dSJacob Faibussowitsch     PetscCall((*aij->ops->restorearraywrite)(A, array));
4503d67d9f35SJunchao Zhang   } else {
4504d67d9f35SJunchao Zhang     *array = NULL;
4505d67d9f35SJunchao Zhang   }
45068f1ea47aSStefano Zampini   PetscFunctionReturn(0);
45078f1ea47aSStefano Zampini }
45088f1ea47aSStefano Zampini 
45098f1ea47aSStefano Zampini /*@C
451011a5261eSBarry Smith    MatSeqAIJGetCSRAndMemType - Get the CSR arrays and the memory type of the `MATSEQAIJ` matrix
45117ee59b9bSJunchao Zhang 
45127ee59b9bSJunchao Zhang    Not Collective
45137ee59b9bSJunchao Zhang 
45147ee59b9bSJunchao Zhang    Input Parameter:
451511a5261eSBarry Smith .  mat - a matrix of type `MATSEQAIJ` or its subclasses
45167ee59b9bSJunchao Zhang 
45177ee59b9bSJunchao Zhang    Output Parameters:
45187ee59b9bSJunchao Zhang +  i - row map array of the matrix
45197ee59b9bSJunchao Zhang .  j - column index array of the matrix
45207ee59b9bSJunchao Zhang .  a - data array of the matrix
45217ee59b9bSJunchao Zhang -  mtype - memory type of the arrays
45227ee59b9bSJunchao Zhang 
45237ee59b9bSJunchao Zhang   Notes:
45247ee59b9bSJunchao Zhang    Any of the output parameters can be NULL, in which case the corresponding value is not returned.
45257ee59b9bSJunchao Zhang    If mat is a device matrix, the arrays are on the device. Otherwise, they are on the host.
45267ee59b9bSJunchao Zhang 
45277ee59b9bSJunchao Zhang    One can call this routine on a preallocated but not assembled matrix to just get the memory of the CSR underneath the matrix.
45287ee59b9bSJunchao Zhang    If the matrix is assembled, the data array 'a' is guaranteed to have the latest values of the matrix.
45297ee59b9bSJunchao Zhang 
45307ee59b9bSJunchao Zhang    Level: Developer
45317ee59b9bSJunchao Zhang 
4532db781477SPatrick Sanan .seealso: `MatSeqAIJGetArray()`, `MatSeqAIJGetArrayRead()`
45337ee59b9bSJunchao Zhang @*/
4534d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetCSRAndMemType(Mat mat, const PetscInt **i, const PetscInt **j, PetscScalar **a, PetscMemType *mtype)
4535d71ae5a4SJacob Faibussowitsch {
45367ee59b9bSJunchao Zhang   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)mat->data;
45377ee59b9bSJunchao Zhang 
45387ee59b9bSJunchao Zhang   PetscFunctionBegin;
45397ee59b9bSJunchao Zhang   PetscCheck(mat->preallocated, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "matrix is not preallocated");
45407ee59b9bSJunchao Zhang   if (aij->ops->getcsrandmemtype) {
45417ee59b9bSJunchao Zhang     PetscCall((*aij->ops->getcsrandmemtype)(mat, i, j, a, mtype));
45427ee59b9bSJunchao Zhang   } else {
45437ee59b9bSJunchao Zhang     if (i) *i = aij->i;
45447ee59b9bSJunchao Zhang     if (j) *j = aij->j;
45457ee59b9bSJunchao Zhang     if (a) *a = aij->a;
45467ee59b9bSJunchao Zhang     if (mtype) *mtype = PETSC_MEMTYPE_HOST;
45477ee59b9bSJunchao Zhang   }
45487ee59b9bSJunchao Zhang   PetscFunctionReturn(0);
45497ee59b9bSJunchao Zhang }
45507ee59b9bSJunchao Zhang 
45517ee59b9bSJunchao Zhang /*@C
455221e72a00SBarry Smith    MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
455321e72a00SBarry Smith 
455421e72a00SBarry Smith    Not Collective
455521e72a00SBarry Smith 
455621e72a00SBarry Smith    Input Parameter:
455711a5261eSBarry Smith .  mat - a `MATSEQAIJ` matrix
455821e72a00SBarry Smith 
455921e72a00SBarry Smith    Output Parameter:
456021e72a00SBarry Smith .   nz - the maximum number of nonzeros in any row
456121e72a00SBarry Smith 
456221e72a00SBarry Smith    Level: intermediate
456321e72a00SBarry Smith 
4564db781477SPatrick Sanan .seealso: `MatSeqAIJRestoreArray()`, `MatSeqAIJGetArrayF90()`
456521e72a00SBarry Smith @*/
4566d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJGetMaxRowNonzeros(Mat A, PetscInt *nz)
4567d71ae5a4SJacob Faibussowitsch {
456821e72a00SBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ *)A->data;
456921e72a00SBarry Smith 
457021e72a00SBarry Smith   PetscFunctionBegin;
457121e72a00SBarry Smith   *nz = aij->rmax;
457221e72a00SBarry Smith   PetscFunctionReturn(0);
457321e72a00SBarry Smith }
457421e72a00SBarry Smith 
4575d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetPreallocationCOO_SeqAIJ(Mat mat, PetscCount coo_n, PetscInt coo_i[], PetscInt coo_j[])
4576d71ae5a4SJacob Faibussowitsch {
4577394ed5ebSJunchao Zhang   MPI_Comm     comm;
4578394ed5ebSJunchao Zhang   PetscInt    *i, *j;
4579394ed5ebSJunchao Zhang   PetscInt     M, N, row;
4580394ed5ebSJunchao Zhang   PetscCount   k, p, q, nneg, nnz, start, end; /* Index the coo array, so use PetscCount as their type */
4581394ed5ebSJunchao Zhang   PetscInt    *Ai;                             /* Change to PetscCount once we use it for row pointers */
4582394ed5ebSJunchao Zhang   PetscInt    *Aj;
4583394ed5ebSJunchao Zhang   PetscScalar *Aa;
4584cbc6b225SStefano Zampini   Mat_SeqAIJ  *seqaij = (Mat_SeqAIJ *)(mat->data);
4585cbc6b225SStefano Zampini   MatType      rtype;
4586394ed5ebSJunchao Zhang   PetscCount  *perm, *jmap;
4587394ed5ebSJunchao Zhang 
4588394ed5ebSJunchao Zhang   PetscFunctionBegin;
45899566063dSJacob Faibussowitsch   PetscCall(MatResetPreallocationCOO_SeqAIJ(mat));
45909566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)mat, &comm));
45919566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &M, &N));
4592e8729f6fSJunchao Zhang   i = coo_i;
4593e8729f6fSJunchao Zhang   j = coo_j;
45949566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n, &perm));
4595394ed5ebSJunchao Zhang   for (k = 0; k < coo_n; k++) { /* Ignore entries with negative row or col indices */
4596394ed5ebSJunchao Zhang     if (j[k] < 0) i[k] = -1;
4597394ed5ebSJunchao Zhang     perm[k] = k;
4598394ed5ebSJunchao Zhang   }
4599394ed5ebSJunchao Zhang 
4600394ed5ebSJunchao Zhang   /* Sort by row */
46019566063dSJacob Faibussowitsch   PetscCall(PetscSortIntWithIntCountArrayPair(coo_n, i, j, perm));
46029371c9d4SSatish Balay   for (k = 0; k < coo_n; k++) {
46039371c9d4SSatish Balay     if (i[k] >= 0) break;
46049371c9d4SSatish Balay   } /* Advance k to the first row with a non-negative index */
4605394ed5ebSJunchao Zhang   nneg = k;
46069566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg + 1, &jmap)); /* +1 to make a CSR-like data structure. jmap[i] originally is the number of repeats for i-th nonzero */
4607394ed5ebSJunchao Zhang   nnz = 0;                                          /* Total number of unique nonzeros to be counted */
4608394ed5ebSJunchao Zhang   jmap++;                                           /* Inc jmap by 1 for convinience */
4609394ed5ebSJunchao Zhang 
46109566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(M + 1, &Ai));        /* CSR of A */
46119566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(coo_n - nneg, &Aj)); /* We have at most coo_n-nneg unique nonzeros */
4612394ed5ebSJunchao Zhang 
4613394ed5ebSJunchao Zhang   /* In each row, sort by column, then unique column indices to get row length */
4614394ed5ebSJunchao Zhang   Ai++;  /* Inc by 1 for convinience */
4615394ed5ebSJunchao Zhang   q = 0; /* q-th unique nonzero, with q starting from 0 */
4616394ed5ebSJunchao Zhang   while (k < coo_n) {
4617394ed5ebSJunchao Zhang     row   = i[k];
4618394ed5ebSJunchao Zhang     start = k; /* [start,end) indices for this row */
4619394ed5ebSJunchao Zhang     while (k < coo_n && i[k] == row) k++;
4620394ed5ebSJunchao Zhang     end = k;
46219566063dSJacob Faibussowitsch     PetscCall(PetscSortIntWithCountArray(end - start, j + start, perm + start));
4622394ed5ebSJunchao Zhang     /* Find number of unique col entries in this row */
4623394ed5ebSJunchao Zhang     Aj[q]   = j[start]; /* Log the first nonzero in this row */
4624394ed5ebSJunchao Zhang     jmap[q] = 1;        /* Number of repeats of this nozero entry */
4625394ed5ebSJunchao Zhang     Ai[row] = 1;
4626394ed5ebSJunchao Zhang     nnz++;
4627394ed5ebSJunchao Zhang 
4628394ed5ebSJunchao Zhang     for (p = start + 1; p < end; p++) { /* Scan remaining nonzero in this row */
4629394ed5ebSJunchao Zhang       if (j[p] != j[p - 1]) {           /* Meet a new nonzero */
4630394ed5ebSJunchao Zhang         q++;
4631394ed5ebSJunchao Zhang         jmap[q] = 1;
4632394ed5ebSJunchao Zhang         Aj[q]   = j[p];
4633394ed5ebSJunchao Zhang         Ai[row]++;
4634394ed5ebSJunchao Zhang         nnz++;
4635394ed5ebSJunchao Zhang       } else {
4636394ed5ebSJunchao Zhang         jmap[q]++;
4637394ed5ebSJunchao Zhang       }
4638394ed5ebSJunchao Zhang     }
4639394ed5ebSJunchao Zhang     q++; /* Move to next row and thus next unique nonzero */
4640394ed5ebSJunchao Zhang   }
4641394ed5ebSJunchao Zhang 
4642394ed5ebSJunchao Zhang   Ai--; /* Back to the beginning of Ai[] */
4643394ed5ebSJunchao Zhang   for (k = 0; k < M; k++) Ai[k + 1] += Ai[k];
4644394ed5ebSJunchao Zhang   jmap--; /* Back to the beginning of jmap[] */
4645394ed5ebSJunchao Zhang   jmap[0] = 0;
4646394ed5ebSJunchao Zhang   for (k = 0; k < nnz; k++) jmap[k + 1] += jmap[k];
4647394ed5ebSJunchao Zhang   if (nnz < coo_n - nneg) { /* Realloc with actual number of unique nonzeros */
4648394ed5ebSJunchao Zhang     PetscCount *jmap_new;
4649394ed5ebSJunchao Zhang     PetscInt   *Aj_new;
4650394ed5ebSJunchao Zhang 
46519566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz + 1, &jmap_new));
46529566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(jmap_new, jmap, nnz + 1));
46539566063dSJacob Faibussowitsch     PetscCall(PetscFree(jmap));
4654394ed5ebSJunchao Zhang     jmap = jmap_new;
4655394ed5ebSJunchao Zhang 
46569566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(nnz, &Aj_new));
46579566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(Aj_new, Aj, nnz));
46589566063dSJacob Faibussowitsch     PetscCall(PetscFree(Aj));
4659394ed5ebSJunchao Zhang     Aj = Aj_new;
4660394ed5ebSJunchao Zhang   }
4661394ed5ebSJunchao Zhang 
4662394ed5ebSJunchao Zhang   if (nneg) { /* Discard heading entries with negative indices in perm[], as we'll access it from index 0 in MatSetValuesCOO */
4663394ed5ebSJunchao Zhang     PetscCount *perm_new;
4664cbc6b225SStefano Zampini 
46659566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(coo_n - nneg, &perm_new));
46669566063dSJacob Faibussowitsch     PetscCall(PetscArraycpy(perm_new, perm + nneg, coo_n - nneg));
46679566063dSJacob Faibussowitsch     PetscCall(PetscFree(perm));
4668394ed5ebSJunchao Zhang     perm = perm_new;
4669394ed5ebSJunchao Zhang   }
4670394ed5ebSJunchao Zhang 
46719566063dSJacob Faibussowitsch   PetscCall(MatGetRootType_Private(mat, &rtype));
46729566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(nnz, &Aa)); /* Zero the matrix */
46739566063dSJacob Faibussowitsch   PetscCall(MatSetSeqAIJWithArrays_private(PETSC_COMM_SELF, M, N, Ai, Aj, Aa, rtype, mat));
4674394ed5ebSJunchao Zhang 
4675394ed5ebSJunchao Zhang   seqaij->singlemalloc = PETSC_FALSE;            /* Ai, Aj and Aa are not allocated in one big malloc */
4676394ed5ebSJunchao Zhang   seqaij->free_a = seqaij->free_ij = PETSC_TRUE; /* Let newmat own Ai, Aj and Aa */
4677394ed5ebSJunchao Zhang   /* Record COO fields */
4678394ed5ebSJunchao Zhang   seqaij->coo_n = coo_n;
4679394ed5ebSJunchao Zhang   seqaij->Atot  = coo_n - nneg; /* Annz is seqaij->nz, so no need to record that again */
4680394ed5ebSJunchao Zhang   seqaij->jmap  = jmap;         /* of length nnz+1 */
4681394ed5ebSJunchao Zhang   seqaij->perm  = perm;
4682394ed5ebSJunchao Zhang   PetscFunctionReturn(0);
4683394ed5ebSJunchao Zhang }
4684394ed5ebSJunchao Zhang 
4685d71ae5a4SJacob Faibussowitsch static PetscErrorCode MatSetValuesCOO_SeqAIJ(Mat A, const PetscScalar v[], InsertMode imode)
4686d71ae5a4SJacob Faibussowitsch {
4687394ed5ebSJunchao Zhang   Mat_SeqAIJ  *aseq = (Mat_SeqAIJ *)A->data;
4688394ed5ebSJunchao Zhang   PetscCount   i, j, Annz = aseq->nz;
4689394ed5ebSJunchao Zhang   PetscCount  *perm = aseq->perm, *jmap = aseq->jmap;
4690394ed5ebSJunchao Zhang   PetscScalar *Aa;
4691394ed5ebSJunchao Zhang 
4692394ed5ebSJunchao Zhang   PetscFunctionBegin;
46939566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArray(A, &Aa));
4694394ed5ebSJunchao Zhang   for (i = 0; i < Annz; i++) {
4695b6c38306SJunchao Zhang     PetscScalar sum = 0.0;
4696b6c38306SJunchao Zhang     for (j = jmap[i]; j < jmap[i + 1]; j++) sum += v[perm[j]];
4697b6c38306SJunchao Zhang     Aa[i] = (imode == INSERT_VALUES ? 0.0 : Aa[i]) + sum;
4698394ed5ebSJunchao Zhang   }
46999566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArray(A, &Aa));
4700394ed5ebSJunchao Zhang   PetscFunctionReturn(0);
4701394ed5ebSJunchao Zhang }
4702394ed5ebSJunchao Zhang 
470334b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
47045063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat, MatType, MatReuse, Mat *);
470502fe1965SBarry Smith #endif
47063d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
47075063d097SStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJKokkos(Mat, MatType, MatReuse, Mat *);
47083d0639e7SStefano Zampini #endif
470902fe1965SBarry Smith 
4710d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4711d71ae5a4SJacob Faibussowitsch {
4712273d9f13SBarry Smith   Mat_SeqAIJ *b;
471338baddfdSBarry Smith   PetscMPIInt size;
4714273d9f13SBarry Smith 
4715273d9f13SBarry Smith   PetscFunctionBegin;
47169566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PetscObjectComm((PetscObject)B), &size));
471708401ef6SPierre Jolivet   PetscCheck(size <= 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Comm must be of size 1");
4718273d9f13SBarry Smith 
47194dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&b));
47202205254eSKarl Rupp 
4721b0a32e0cSBarry Smith   B->data = (void *)b;
47222205254eSKarl Rupp 
47239566063dSJacob Faibussowitsch   PetscCall(PetscMemcpy(B->ops, &MatOps_Values, sizeof(struct _MatOps)));
4724071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
47252205254eSKarl Rupp 
4726f4259b30SLisandro Dalcin   b->row                = NULL;
4727f4259b30SLisandro Dalcin   b->col                = NULL;
4728f4259b30SLisandro Dalcin   b->icol               = NULL;
4729b810aeb4SBarry Smith   b->reallocs           = 0;
473036db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4731f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4732416022c9SBarry Smith   b->nonew              = 0;
4733f4259b30SLisandro Dalcin   b->diag               = NULL;
4734f4259b30SLisandro Dalcin   b->solve_work         = NULL;
4735f4259b30SLisandro Dalcin   B->spptr              = NULL;
4736f4259b30SLisandro Dalcin   b->saved_values       = NULL;
4737f4259b30SLisandro Dalcin   b->idiag              = NULL;
4738f4259b30SLisandro Dalcin   b->mdiag              = NULL;
4739f4259b30SLisandro Dalcin   b->ssor_work          = NULL;
474071f1c65dSBarry Smith   b->omega              = 1.0;
474171f1c65dSBarry Smith   b->fshift             = 0.0;
474271f1c65dSBarry Smith   b->idiagvalid         = PETSC_FALSE;
4743bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4744a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
474517ab2063SBarry Smith 
47469566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
4747d1e78c4fSBarry Smith #if defined(PETSC_HAVE_MATLAB)
47489566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEnginePut_C", MatlabEnginePut_SeqAIJ));
47499566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "PetscMatlabEngineGet_C", MatlabEngineGet_SeqAIJ));
4750b3866ffcSBarry Smith #endif
47519566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetColumnIndices_C", MatSeqAIJSetColumnIndices_SeqAIJ));
47529566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatStoreValues_C", MatStoreValues_SeqAIJ));
47539566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatRetrieveValues_C", MatRetrieveValues_SeqAIJ));
47549566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsbaij_C", MatConvert_SeqAIJ_SeqSBAIJ));
47559566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqbaij_C", MatConvert_SeqAIJ_SeqBAIJ));
47569566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijperm_C", MatConvert_SeqAIJ_SeqAIJPERM));
47579566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijsell_C", MatConvert_SeqAIJ_SeqAIJSELL));
47589779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
47599566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijmkl_C", MatConvert_SeqAIJ_SeqAIJMKL));
4760191b95cbSRichard Tran Mills #endif
476134b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
47629566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcusparse_C", MatConvert_SeqAIJ_SeqAIJCUSPARSE));
47639566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaijcusparse_seqaij_C", MatProductSetFromOptions_SeqAIJ));
47649566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaijcusparse_C", MatProductSetFromOptions_SeqAIJ));
476502fe1965SBarry Smith #endif
47663d0639e7SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
47679566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijkokkos_C", MatConvert_SeqAIJ_SeqAIJKokkos));
47683d0639e7SStefano Zampini #endif
47699566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqaijcrl_C", MatConvert_SeqAIJ_SeqAIJCRL));
4770af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
47719566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_elemental_C", MatConvert_SeqAIJ_Elemental));
4772af8000cdSHong Zhang #endif
4773d24d4204SJose E. Roman #if defined(PETSC_HAVE_SCALAPACK)
47749566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_scalapack_C", MatConvert_AIJ_ScaLAPACK));
4775d24d4204SJose E. Roman #endif
477663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
47779566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_hypre_C", MatConvert_AIJ_HYPRE));
47789566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_transpose_seqaij_seqaij_C", MatProductSetFromOptions_Transpose_AIJ_AIJ));
477963c07aadSStefano Zampini #endif
47809566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqdense_C", MatConvert_SeqAIJ_SeqDense));
47819566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_seqsell_C", MatConvert_SeqAIJ_SeqSELL));
47829566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatConvert_seqaij_is_C", MatConvert_XAIJ_IS));
47839566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsTranspose_C", MatIsTranspose_SeqAIJ));
47849566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatIsHermitianTranspose_C", MatIsTranspose_SeqAIJ));
47859566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocation_C", MatSeqAIJSetPreallocation_SeqAIJ));
47869566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatResetPreallocation_C", MatResetPreallocation_SeqAIJ));
47879566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJSetPreallocationCSR_C", MatSeqAIJSetPreallocationCSR_SeqAIJ));
47889566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatReorderForNonzeroDiagonal_C", MatReorderForNonzeroDiagonal_SeqAIJ));
47899566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_is_seqaij_C", MatProductSetFromOptions_IS_XAIJ));
47909566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqdense_seqaij_C", MatProductSetFromOptions_SeqDense_SeqAIJ));
47919566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatProductSetFromOptions_seqaij_seqaij_C", MatProductSetFromOptions_SeqAIJ));
47929566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSeqAIJKron_C", MatSeqAIJKron_SeqAIJ));
47939566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetPreallocationCOO_C", MatSetPreallocationCOO_SeqAIJ));
47949566063dSJacob Faibussowitsch   PetscCall(PetscObjectComposeFunction((PetscObject)B, "MatSetValuesCOO_C", MatSetValuesCOO_SeqAIJ));
47959566063dSJacob Faibussowitsch   PetscCall(MatCreate_SeqAIJ_Inode(B));
47969566063dSJacob Faibussowitsch   PetscCall(PetscObjectChangeTypeName((PetscObject)B, MATSEQAIJ));
47979566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetTypeFromOptions(B)); /* this allows changing the matrix subtype to say MATSEQAIJPERM */
47983a40ed3dSBarry Smith   PetscFunctionReturn(0);
479917ab2063SBarry Smith }
480017ab2063SBarry Smith 
4801b24902e0SBarry Smith /*
48023893b582SJunchao Zhang     Given a matrix generated with MatGetFactor() duplicates all the information in A into C
4803b24902e0SBarry Smith */
4804d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C, Mat A, MatDuplicateOption cpvalues, PetscBool mallocmatspace)
4805d71ae5a4SJacob Faibussowitsch {
48062a350339SBarry Smith   Mat_SeqAIJ *c = (Mat_SeqAIJ *)C->data, *a = (Mat_SeqAIJ *)A->data;
4807071fcb05SBarry Smith   PetscInt    m = A->rmap->n, i;
480817ab2063SBarry Smith 
48093a40ed3dSBarry Smith   PetscFunctionBegin;
4810aed4548fSBarry Smith   PetscCheck(A->assembled || cpvalues == MAT_DO_NOT_COPY_VALUES, PETSC_COMM_SELF, PETSC_ERR_ARG_WRONGSTATE, "Cannot duplicate unassembled matrix");
4811273d9f13SBarry Smith 
4812d5f3da31SBarry Smith   C->factortype = A->factortype;
4813f4259b30SLisandro Dalcin   c->row        = NULL;
4814f4259b30SLisandro Dalcin   c->col        = NULL;
4815f4259b30SLisandro Dalcin   c->icol       = NULL;
48166ad4291fSHong Zhang   c->reallocs   = 0;
481717ab2063SBarry Smith 
481869272f91SPierre Jolivet   C->assembled    = A->assembled;
481969272f91SPierre Jolivet   C->preallocated = A->preallocated;
482017ab2063SBarry Smith 
482169272f91SPierre Jolivet   if (A->preallocated) {
48229566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->rmap, &C->rmap));
48239566063dSJacob Faibussowitsch     PetscCall(PetscLayoutReference(A->cmap, &C->cmap));
4824eec197d1SBarry Smith 
48259566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &c->imax));
48269566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(c->imax, a->imax, m * sizeof(PetscInt)));
48279566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(m, &c->ilen));
48289566063dSJacob Faibussowitsch     PetscCall(PetscMemcpy(c->ilen, a->ilen, m * sizeof(PetscInt)));
482917ab2063SBarry Smith 
483017ab2063SBarry Smith     /* allocate the matrix space */
4831f77e22a1SHong Zhang     if (mallocmatspace) {
48329566063dSJacob Faibussowitsch       PetscCall(PetscMalloc3(a->i[m], &c->a, a->i[m], &c->j, m + 1, &c->i));
48332205254eSKarl Rupp 
4834f1e2ffcdSBarry Smith       c->singlemalloc = PETSC_TRUE;
48352205254eSKarl Rupp 
48369566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->i, a->i, m + 1));
483717ab2063SBarry Smith       if (m > 0) {
48389566063dSJacob Faibussowitsch         PetscCall(PetscArraycpy(c->j, a->j, a->i[m]));
4839be6bf707SBarry Smith         if (cpvalues == MAT_COPY_VALUES) {
48402e5835c6SStefano Zampini           const PetscScalar *aa;
48412e5835c6SStefano Zampini 
48429566063dSJacob Faibussowitsch           PetscCall(MatSeqAIJGetArrayRead(A, &aa));
48439566063dSJacob Faibussowitsch           PetscCall(PetscArraycpy(c->a, aa, a->i[m]));
48449566063dSJacob Faibussowitsch           PetscCall(MatSeqAIJGetArrayRead(A, &aa));
4845be6bf707SBarry Smith         } else {
48469566063dSJacob Faibussowitsch           PetscCall(PetscArrayzero(c->a, a->i[m]));
484717ab2063SBarry Smith         }
484808480c60SBarry Smith       }
4849f77e22a1SHong Zhang     }
485017ab2063SBarry Smith 
48516ad4291fSHong Zhang     c->ignorezeroentries = a->ignorezeroentries;
4852416022c9SBarry Smith     c->roworiented       = a->roworiented;
4853416022c9SBarry Smith     c->nonew             = a->nonew;
4854416022c9SBarry Smith     if (a->diag) {
48559566063dSJacob Faibussowitsch       PetscCall(PetscMalloc1(m + 1, &c->diag));
48569566063dSJacob Faibussowitsch       PetscCall(PetscMemcpy(c->diag, a->diag, m * sizeof(PetscInt)));
4857071fcb05SBarry Smith     } else c->diag = NULL;
48582205254eSKarl Rupp 
4859f4259b30SLisandro Dalcin     c->solve_work         = NULL;
4860f4259b30SLisandro Dalcin     c->saved_values       = NULL;
4861f4259b30SLisandro Dalcin     c->idiag              = NULL;
4862f4259b30SLisandro Dalcin     c->ssor_work          = NULL;
4863a9817697SBarry Smith     c->keepnonzeropattern = a->keepnonzeropattern;
4864e6b907acSBarry Smith     c->free_a             = PETSC_TRUE;
4865e6b907acSBarry Smith     c->free_ij            = PETSC_TRUE;
48666ad4291fSHong Zhang 
4867893ad86cSHong Zhang     c->rmax  = a->rmax;
4868416022c9SBarry Smith     c->nz    = a->nz;
48698ed568f8SMatthew G Knepley     c->maxnz = a->nz; /* Since we allocate exactly the right amount */
4870754ec7b1SSatish Balay 
48716ad4291fSHong Zhang     c->compressedrow.use   = a->compressedrow.use;
48726ad4291fSHong Zhang     c->compressedrow.nrows = a->compressedrow.nrows;
4873cd6b891eSBarry Smith     if (a->compressedrow.use) {
48746ad4291fSHong Zhang       i = a->compressedrow.nrows;
48759566063dSJacob Faibussowitsch       PetscCall(PetscMalloc2(i + 1, &c->compressedrow.i, i, &c->compressedrow.rindex));
48769566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.i, a->compressedrow.i, i + 1));
48779566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(c->compressedrow.rindex, a->compressedrow.rindex, i));
487827ea64f8SHong Zhang     } else {
487927ea64f8SHong Zhang       c->compressedrow.use    = PETSC_FALSE;
48800298fd71SBarry Smith       c->compressedrow.i      = NULL;
48810298fd71SBarry Smith       c->compressedrow.rindex = NULL;
48826ad4291fSHong Zhang     }
4883ea632784SBarry Smith     c->nonzerorowcnt = a->nonzerorowcnt;
4884e56f5c9eSBarry Smith     C->nonzerostate  = A->nonzerostate;
48854846f1f5SKris Buschelman 
48869566063dSJacob Faibussowitsch     PetscCall(MatDuplicate_SeqAIJ_Inode(A, cpvalues, &C));
488769272f91SPierre Jolivet   }
48889566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListDuplicate(((PetscObject)A)->qlist, &((PetscObject)C)->qlist));
48893a40ed3dSBarry Smith   PetscFunctionReturn(0);
489017ab2063SBarry Smith }
489117ab2063SBarry Smith 
4892d71ae5a4SJacob Faibussowitsch PetscErrorCode MatDuplicate_SeqAIJ(Mat A, MatDuplicateOption cpvalues, Mat *B)
4893d71ae5a4SJacob Faibussowitsch {
4894b24902e0SBarry Smith   PetscFunctionBegin;
48959566063dSJacob Faibussowitsch   PetscCall(MatCreate(PetscObjectComm((PetscObject)A), B));
48969566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*B, A->rmap->n, A->cmap->n, A->rmap->n, A->cmap->n));
489748a46eb9SPierre Jolivet   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) PetscCall(MatSetBlockSizesFromMats(*B, A, A));
48989566063dSJacob Faibussowitsch   PetscCall(MatSetType(*B, ((PetscObject)A)->type_name));
48999566063dSJacob Faibussowitsch   PetscCall(MatDuplicateNoCreate_SeqAIJ(*B, A, cpvalues, PETSC_TRUE));
4900b24902e0SBarry Smith   PetscFunctionReturn(0);
4901b24902e0SBarry Smith }
4902b24902e0SBarry Smith 
4903d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
4904d71ae5a4SJacob Faibussowitsch {
490552f91c60SVaclav Hapla   PetscBool isbinary, ishdf5;
490652f91c60SVaclav Hapla 
490752f91c60SVaclav Hapla   PetscFunctionBegin;
490852f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat, MAT_CLASSID, 1);
490952f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer, PETSC_VIEWER_CLASSID, 2);
4910c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
49119566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
49129566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERBINARY, &isbinary));
49139566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERHDF5, &ishdf5));
491452f91c60SVaclav Hapla   if (isbinary) {
49159566063dSJacob Faibussowitsch     PetscCall(MatLoad_SeqAIJ_Binary(newMat, viewer));
491652f91c60SVaclav Hapla   } else if (ishdf5) {
491752f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
49189566063dSJacob Faibussowitsch     PetscCall(MatLoad_AIJ_HDF5(newMat, viewer));
491952f91c60SVaclav Hapla #else
492052f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
492152f91c60SVaclav Hapla #endif
492252f91c60SVaclav Hapla   } else {
492398921bdaSJacob Faibussowitsch     SETERRQ(PetscObjectComm((PetscObject)newMat), PETSC_ERR_SUP, "Viewer type %s not yet supported for reading %s matrices", ((PetscObject)viewer)->type_name, ((PetscObject)newMat)->type_name);
492452f91c60SVaclav Hapla   }
492552f91c60SVaclav Hapla   PetscFunctionReturn(0);
492652f91c60SVaclav Hapla }
492752f91c60SVaclav Hapla 
4928d71ae5a4SJacob Faibussowitsch PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
4929d71ae5a4SJacob Faibussowitsch {
49303ea6fe3dSLisandro Dalcin   Mat_SeqAIJ *a = (Mat_SeqAIJ *)mat->data;
49313ea6fe3dSLisandro Dalcin   PetscInt    header[4], *rowlens, M, N, nz, sum, rows, cols, i;
4932fbdbba38SShri Abhyankar 
4933fbdbba38SShri Abhyankar   PetscFunctionBegin;
49349566063dSJacob Faibussowitsch   PetscCall(PetscViewerSetUp(viewer));
4935bbead8a2SBarry Smith 
49363ea6fe3dSLisandro Dalcin   /* read in matrix header */
49379566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, header, 4, NULL, PETSC_INT));
493808401ef6SPierre Jolivet   PetscCheck(header[0] == MAT_FILE_CLASSID, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Not a matrix object in file");
49399371c9d4SSatish Balay   M  = header[1];
49409371c9d4SSatish Balay   N  = header[2];
49419371c9d4SSatish Balay   nz = header[3];
494208401ef6SPierre Jolivet   PetscCheck(M >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix row size (%" PetscInt_FMT ") in file is negative", M);
494308401ef6SPierre Jolivet   PetscCheck(N >= 0, PetscObjectComm((PetscObject)viewer), PETSC_ERR_FILE_UNEXPECTED, "Matrix column size (%" PetscInt_FMT ") in file is negative", N);
494408401ef6SPierre Jolivet   PetscCheck(nz >= 0, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix stored in special format on disk, cannot load as SeqAIJ");
4945fbdbba38SShri Abhyankar 
49463ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
49479566063dSJacob Faibussowitsch   PetscCall(MatLoad_Binary_BlockSizes(mat, viewer));
49483ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
49493ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
49503ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
49513ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
49523ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
49539566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->rmap));
49549566063dSJacob Faibussowitsch   PetscCall(PetscLayoutSetUp(mat->cmap));
49553ea6fe3dSLisandro Dalcin 
49563ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
49579566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
4958aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
49593ea6fe3dSLisandro Dalcin 
4960fbdbba38SShri Abhyankar   /* read in row lengths */
49619566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(M, &rowlens));
49629566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, rowlens, M, NULL, PETSC_INT));
49633ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
49649371c9d4SSatish Balay   sum = 0;
49659371c9d4SSatish Balay   for (i = 0; i < M; i++) sum += rowlens[i];
496608401ef6SPierre Jolivet   PetscCheck(sum == nz, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Inconsistent matrix data in file: nonzeros = %" PetscInt_FMT ", sum-row-lengths = %" PetscInt_FMT, nz, sum);
49673ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
49689566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(mat, 0, rowlens));
49699566063dSJacob Faibussowitsch   PetscCall(MatGetSize(mat, &rows, &cols));
4970aed4548fSBarry Smith   PetscCheck(M == rows && N == cols, PETSC_COMM_SELF, PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%" PetscInt_FMT ", %" PetscInt_FMT ") than the input matrix (%" PetscInt_FMT ", %" PetscInt_FMT ")", M, N, rows, cols);
49713ea6fe3dSLisandro Dalcin   /* store row lengths */
49729566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(a->ilen, rowlens, M));
49739566063dSJacob Faibussowitsch   PetscCall(PetscFree(rowlens));
4974fbdbba38SShri Abhyankar 
49753ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
49769371c9d4SSatish Balay   a->i[0] = 0;
49779371c9d4SSatish Balay   for (i = 0; i < M; i++) a->i[i + 1] = a->i[i] + a->ilen[i];
49783ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
49799566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->j, nz, NULL, PETSC_INT));
49803ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
49819566063dSJacob Faibussowitsch   PetscCall(PetscViewerBinaryRead(viewer, a->a, nz, NULL, PETSC_SCALAR));
4982fbdbba38SShri Abhyankar 
49839566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(mat, MAT_FINAL_ASSEMBLY));
49849566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(mat, MAT_FINAL_ASSEMBLY));
4985fbdbba38SShri Abhyankar   PetscFunctionReturn(0);
4986fbdbba38SShri Abhyankar }
4987fbdbba38SShri Abhyankar 
4988d71ae5a4SJacob Faibussowitsch PetscErrorCode MatEqual_SeqAIJ(Mat A, Mat B, PetscBool *flg)
4989d71ae5a4SJacob Faibussowitsch {
49907264ac53SSatish Balay   Mat_SeqAIJ        *a = (Mat_SeqAIJ *)A->data, *b = (Mat_SeqAIJ *)B->data;
4991fff043a9SJunchao Zhang   const PetscScalar *aa, *ba;
4992eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
4993eeffb40dSHong Zhang   PetscInt k;
4994eeffb40dSHong Zhang #endif
49957264ac53SSatish Balay 
49963a40ed3dSBarry Smith   PetscFunctionBegin;
4997bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
4998d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) || (a->nz != b->nz)) {
4999ca44d042SBarry Smith     *flg = PETSC_FALSE;
5000ca44d042SBarry Smith     PetscFunctionReturn(0);
5001bcd2baecSBarry Smith   }
50027264ac53SSatish Balay 
50037264ac53SSatish Balay   /* if the a->i are the same */
50049566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->i, b->i, A->rmap->n + 1, flg));
5005abc0a331SBarry Smith   if (!*flg) PetscFunctionReturn(0);
50067264ac53SSatish Balay 
50077264ac53SSatish Balay   /* if a->j are the same */
50089566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(a->j, b->j, a->nz, flg));
5009abc0a331SBarry Smith   if (!*flg) PetscFunctionReturn(0);
5010bcd2baecSBarry Smith 
50119566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(A, &aa));
50129566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJGetArrayRead(B, &ba));
5013bcd2baecSBarry Smith   /* if a->a are the same */
5014eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
5015eeffb40dSHong Zhang   for (k = 0; k < a->nz; k++) {
5016fff043a9SJunchao Zhang     if (PetscRealPart(aa[k]) != PetscRealPart(ba[k]) || PetscImaginaryPart(aa[k]) != PetscImaginaryPart(ba[k])) {
5017eeffb40dSHong Zhang       *flg = PETSC_FALSE;
50183a40ed3dSBarry Smith       PetscFunctionReturn(0);
5019eeffb40dSHong Zhang     }
5020eeffb40dSHong Zhang   }
5021eeffb40dSHong Zhang #else
50229566063dSJacob Faibussowitsch   PetscCall(PetscArraycmp(aa, ba, a->nz, flg));
5023eeffb40dSHong Zhang #endif
50249566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(A, &aa));
50259566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRestoreArrayRead(B, &ba));
5026eeffb40dSHong Zhang   PetscFunctionReturn(0);
50277264ac53SSatish Balay }
502836db0b34SBarry Smith 
502905869f15SSatish Balay /*@
503011a5261eSBarry Smith      MatCreateSeqAIJWithArrays - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in CSR format)
503136db0b34SBarry Smith               provided by the user.
503236db0b34SBarry Smith 
5033d083f849SBarry Smith       Collective
503436db0b34SBarry Smith 
503536db0b34SBarry Smith    Input Parameters:
503636db0b34SBarry Smith +   comm - must be an MPI communicator of size 1
503736db0b34SBarry Smith .   m - number of rows
503836db0b34SBarry Smith .   n - number of columns
5039483a2f95SBarry Smith .   i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
504036db0b34SBarry Smith .   j - column indices
504136db0b34SBarry Smith -   a - matrix values
504236db0b34SBarry Smith 
504336db0b34SBarry Smith    Output Parameter:
504436db0b34SBarry Smith .   mat - the matrix
504536db0b34SBarry Smith 
504636db0b34SBarry Smith    Level: intermediate
504736db0b34SBarry Smith 
504836db0b34SBarry Smith    Notes:
50490551d7c0SBarry Smith        The i, j, and a arrays are not copied by this routine, the user must free these arrays
5050292fb18eSBarry Smith     once the matrix is destroyed and not before
505136db0b34SBarry Smith 
505236db0b34SBarry Smith        You cannot set new nonzero locations into this matrix, that will generate an error.
505336db0b34SBarry Smith 
5054bfeeae90SHong Zhang        The i and j indices are 0 based
505536db0b34SBarry Smith 
5056a4552177SSatish Balay        The format which is used for the sparse matrix input, is equivalent to a
5057a4552177SSatish Balay     row-major ordering.. i.e for the following matrix, the input data expected is
50588eef79e4SBarry Smith     as shown
5059a4552177SSatish Balay 
50608eef79e4SBarry Smith $        1 0 0
50618eef79e4SBarry Smith $        2 0 3
50628eef79e4SBarry Smith $        4 5 6
50638eef79e4SBarry Smith $
50648eef79e4SBarry Smith $        i =  {0,1,3,6}  [size = nrow+1  = 3+1]
50658eef79e4SBarry Smith $        j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
50668eef79e4SBarry Smith $        v =  {1,2,3,4,5,6}  [size = 6]
5067a4552177SSatish Balay 
5068db781477SPatrick Sanan .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateMPIAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`
506936db0b34SBarry Smith @*/
5070d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJWithArrays(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat)
5071d71ae5a4SJacob Faibussowitsch {
5072cbcfb4deSHong Zhang   PetscInt    ii;
507336db0b34SBarry Smith   Mat_SeqAIJ *aij;
5074cbcfb4deSHong Zhang   PetscInt    jj;
507536db0b34SBarry Smith 
507636db0b34SBarry Smith   PetscFunctionBegin;
5077aed4548fSBarry Smith   PetscCheck(m <= 0 || i[0] == 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "i (row indices) must start with 0");
50789566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
50799566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
50809566063dSJacob Faibussowitsch   /* PetscCall(MatSetBlockSizes(*mat,,)); */
50819566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
50829566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, MAT_SKIP_ALLOCATION, NULL));
5083ab93d7beSBarry Smith   aij = (Mat_SeqAIJ *)(*mat)->data;
50849566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->imax));
50859566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(m, &aij->ilen));
5086ab93d7beSBarry Smith 
508736db0b34SBarry Smith   aij->i            = i;
508836db0b34SBarry Smith   aij->j            = j;
508936db0b34SBarry Smith   aij->a            = a;
509036db0b34SBarry Smith   aij->singlemalloc = PETSC_FALSE;
509136db0b34SBarry Smith   aij->nonew        = -1; /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
5092e6b907acSBarry Smith   aij->free_a       = PETSC_FALSE;
5093e6b907acSBarry Smith   aij->free_ij      = PETSC_FALSE;
509436db0b34SBarry Smith 
5095cbc6b225SStefano Zampini   for (ii = 0, aij->nonzerorowcnt = 0, aij->rmax = 0; ii < m; ii++) {
509636db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii + 1] - i[ii];
509776bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
5098aed4548fSBarry Smith       PetscCheck(i[ii + 1] - i[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative row length in i (row indices) row = %" PetscInt_FMT " length = %" PetscInt_FMT, ii, i[ii + 1] - i[ii]);
50999985e31cSBarry Smith       for (jj = i[ii] + 1; jj < i[ii + 1]; jj++) {
510008401ef6SPierre Jolivet         PetscCheck(j[jj] >= j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is not sorted", jj - i[ii], j[jj], ii);
510108401ef6SPierre Jolivet         PetscCheck(j[jj] != j[jj - 1], PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column entry number %" PetscInt_FMT " (actual column %" PetscInt_FMT ") in row %" PetscInt_FMT " is identical to previous entry", jj - i[ii], j[jj], ii);
51029985e31cSBarry Smith       }
510336db0b34SBarry Smith     }
510476bd3646SJed Brown   }
510576bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
510636db0b34SBarry Smith     for (ii = 0; ii < aij->i[m]; ii++) {
510708401ef6SPierre Jolivet       PetscCheck(j[ii] >= 0, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Negative column index at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
5108aed4548fSBarry Smith       PetscCheck(j[ii] <= n - 1, PETSC_COMM_SELF, PETSC_ERR_ARG_OUTOFRANGE, "Column index to large at location = %" PetscInt_FMT " index = %" PetscInt_FMT, ii, j[ii]);
510936db0b34SBarry Smith     }
511076bd3646SJed Brown   }
511136db0b34SBarry Smith 
51129566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
51139566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
511436db0b34SBarry Smith   PetscFunctionReturn(0);
511536db0b34SBarry Smith }
5116cbc6b225SStefano Zampini 
5117f62e3866SBarry Smith /*@
511811a5261eSBarry Smith      MatCreateSeqAIJFromTriple - Creates an sequential `MATSEQAIJ` matrix using matrix elements (in COO format)
51198a0b0e6bSVictor Minden               provided by the user.
51208a0b0e6bSVictor Minden 
5121d083f849SBarry Smith       Collective
51228a0b0e6bSVictor Minden 
51238a0b0e6bSVictor Minden    Input Parameters:
51248a0b0e6bSVictor Minden +   comm - must be an MPI communicator of size 1
51258a0b0e6bSVictor Minden .   m   - number of rows
51268a0b0e6bSVictor Minden .   n   - number of columns
51278a0b0e6bSVictor Minden .   i   - row indices
51288a0b0e6bSVictor Minden .   j   - column indices
51291230e6d1SVictor Minden .   a   - matrix values
51301230e6d1SVictor Minden .   nz  - number of nonzeros
513111a5261eSBarry Smith -   idx - if the i and j indices start with 1 use `PETSC_TRUE` otherwise use `PETSC_FALSE`
51328a0b0e6bSVictor Minden 
51338a0b0e6bSVictor Minden    Output Parameter:
51348a0b0e6bSVictor Minden .   mat - the matrix
51358a0b0e6bSVictor Minden 
51368a0b0e6bSVictor Minden    Level: intermediate
51378a0b0e6bSVictor Minden 
5138f62e3866SBarry Smith    Example:
5139f62e3866SBarry Smith        For the following matrix, the input data expected is as shown (using 0 based indexing)
51409e99939fSJunchao Zhang .vb
51418a0b0e6bSVictor Minden         1 0 0
51428a0b0e6bSVictor Minden         2 0 3
51438a0b0e6bSVictor Minden         4 5 6
51448a0b0e6bSVictor Minden 
51458a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
51468a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
51478a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
51489e99939fSJunchao Zhang .ve
5149*d7547e51SJunchao Zhang   Notes:
5150*d7547e51SJunchao Zhang     Instead of using this function, users should also consider `MatSetPreallocationCOO()` and `MatSetValuesCOO()`, which allow repeated or remote entries,
5151*d7547e51SJunchao Zhang     and are particularly useful in iterative applications.
51528a0b0e6bSVictor Minden 
5153*d7547e51SJunchao Zhang .seealso: `MatCreate()`, `MatCreateAIJ()`, `MatCreateSeqAIJ()`, `MatCreateSeqAIJWithArrays()`, `MatMPIAIJSetPreallocationCSR()`, `MatSetValuesCOO()`, `MatSetPreallocationCOO()`
51548a0b0e6bSVictor Minden @*/
5155d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateSeqAIJFromTriple(MPI_Comm comm, PetscInt m, PetscInt n, PetscInt i[], PetscInt j[], PetscScalar a[], Mat *mat, PetscInt nz, PetscBool idx)
5156d71ae5a4SJacob Faibussowitsch {
5157d021a1c5SVictor Minden   PetscInt ii, *nnz, one = 1, row, col;
51588a0b0e6bSVictor Minden 
51598a0b0e6bSVictor Minden   PetscFunctionBegin;
51609566063dSJacob Faibussowitsch   PetscCall(PetscCalloc1(m, &nnz));
5161ad540459SPierre Jolivet   for (ii = 0; ii < nz; ii++) nnz[i[ii] - !!idx] += 1;
51629566063dSJacob Faibussowitsch   PetscCall(MatCreate(comm, mat));
51639566063dSJacob Faibussowitsch   PetscCall(MatSetSizes(*mat, m, n, m, n));
51649566063dSJacob Faibussowitsch   PetscCall(MatSetType(*mat, MATSEQAIJ));
51659566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJSetPreallocation_SeqAIJ(*mat, 0, nnz));
51661230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
51671230e6d1SVictor Minden     if (idx) {
51681230e6d1SVictor Minden       row = i[ii] - 1;
51691230e6d1SVictor Minden       col = j[ii] - 1;
51701230e6d1SVictor Minden     } else {
51711230e6d1SVictor Minden       row = i[ii];
51721230e6d1SVictor Minden       col = j[ii];
51738a0b0e6bSVictor Minden     }
51749566063dSJacob Faibussowitsch     PetscCall(MatSetValues(*mat, one, &row, one, &col, &a[ii], ADD_VALUES));
51758a0b0e6bSVictor Minden   }
51769566063dSJacob Faibussowitsch   PetscCall(MatAssemblyBegin(*mat, MAT_FINAL_ASSEMBLY));
51779566063dSJacob Faibussowitsch   PetscCall(MatAssemblyEnd(*mat, MAT_FINAL_ASSEMBLY));
51789566063dSJacob Faibussowitsch   PetscCall(PetscFree(nnz));
51798a0b0e6bSVictor Minden   PetscFunctionReturn(0);
51808a0b0e6bSVictor Minden }
518136db0b34SBarry Smith 
5182d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A)
5183d71ae5a4SJacob Faibussowitsch {
5184acf2f550SJed Brown   Mat_SeqAIJ *a = (Mat_SeqAIJ *)A->data;
5185acf2f550SJed Brown 
5186acf2f550SJed Brown   PetscFunctionBegin;
5187acf2f550SJed Brown   a->idiagvalid  = PETSC_FALSE;
5188acf2f550SJed Brown   a->ibdiagvalid = PETSC_FALSE;
51892205254eSKarl Rupp 
51909566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJInvalidateDiagonal_Inode(A));
5191acf2f550SJed Brown   PetscFunctionReturn(0);
5192acf2f550SJed Brown }
5193acf2f550SJed Brown 
5194d71ae5a4SJacob Faibussowitsch PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm, Mat inmat, PetscInt n, MatReuse scall, Mat *outmat)
5195d71ae5a4SJacob Faibussowitsch {
51969c8f2541SHong Zhang   PetscFunctionBegin;
51979566063dSJacob Faibussowitsch   PetscCall(MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm, inmat, n, scall, outmat));
51989c8f2541SHong Zhang   PetscFunctionReturn(0);
51999c8f2541SHong Zhang }
52009c8f2541SHong Zhang 
520181824310SBarry Smith /*
520253dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
520353dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
520453dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
520553dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
520653dd7562SDmitry Karpeev  */
5207d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C, IS rowemb, IS colemb, MatStructure pattern, Mat B)
5208d71ae5a4SJacob Faibussowitsch {
520953dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
521053dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
521153dd7562SDmitry Karpeev   PetscBool       seqaij;
521253dd7562SDmitry Karpeev   PetscInt        m, n, *nz, i, j, count;
521353dd7562SDmitry Karpeev   PetscScalar     v;
521453dd7562SDmitry Karpeev   const PetscInt *rowindices, *colindices;
521553dd7562SDmitry Karpeev 
521653dd7562SDmitry Karpeev   PetscFunctionBegin;
521753dd7562SDmitry Karpeev   if (!B) PetscFunctionReturn(0);
521853dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
52199566063dSJacob Faibussowitsch   PetscCall(PetscObjectBaseTypeCompare((PetscObject)B, MATSEQAIJ, &seqaij));
522028b400f6SJacob Faibussowitsch   PetscCheck(seqaij, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is of wrong type");
522153dd7562SDmitry Karpeev   if (rowemb) {
52229566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(rowemb, &m));
522308401ef6SPierre Jolivet     PetscCheck(m == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Row IS of size %" PetscInt_FMT " is incompatible with matrix row size %" PetscInt_FMT, m, B->rmap->n);
522453dd7562SDmitry Karpeev   } else {
522508401ef6SPierre Jolivet     PetscCheck(C->rmap->n == B->rmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is row-incompatible with the target matrix");
522653dd7562SDmitry Karpeev   }
522753dd7562SDmitry Karpeev   if (colemb) {
52289566063dSJacob Faibussowitsch     PetscCall(ISGetLocalSize(colemb, &n));
522908401ef6SPierre Jolivet     PetscCheck(n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Diag col IS of size %" PetscInt_FMT " is incompatible with input matrix col size %" PetscInt_FMT, n, B->cmap->n);
523053dd7562SDmitry Karpeev   } else {
523108401ef6SPierre Jolivet     PetscCheck(C->cmap->n == B->cmap->n, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Input matrix is col-incompatible with the target matrix");
523253dd7562SDmitry Karpeev   }
523353dd7562SDmitry Karpeev 
523453dd7562SDmitry Karpeev   Baij = (Mat_SeqAIJ *)(B->data);
523553dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
52369566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(B->rmap->n, &nz));
5237ad540459SPierre Jolivet     for (i = 0; i < B->rmap->n; i++) nz[i] = Baij->i[i + 1] - Baij->i[i];
52389566063dSJacob Faibussowitsch     PetscCall(MatSeqAIJSetPreallocation(C, 0, nz));
52399566063dSJacob Faibussowitsch     PetscCall(PetscFree(nz));
524053dd7562SDmitry Karpeev   }
524148a46eb9SPierre Jolivet   if (pattern == SUBSET_NONZERO_PATTERN) PetscCall(MatZeroEntries(C));
524253dd7562SDmitry Karpeev   count      = 0;
524353dd7562SDmitry Karpeev   rowindices = NULL;
524453dd7562SDmitry Karpeev   colindices = NULL;
524548a46eb9SPierre Jolivet   if (rowemb) PetscCall(ISGetIndices(rowemb, &rowindices));
524648a46eb9SPierre Jolivet   if (colemb) PetscCall(ISGetIndices(colemb, &colindices));
524753dd7562SDmitry Karpeev   for (i = 0; i < B->rmap->n; i++) {
524853dd7562SDmitry Karpeev     PetscInt row;
524953dd7562SDmitry Karpeev     row = i;
525053dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
525153dd7562SDmitry Karpeev     for (j = Baij->i[i]; j < Baij->i[i + 1]; j++) {
525253dd7562SDmitry Karpeev       PetscInt col;
525353dd7562SDmitry Karpeev       col = Baij->j[count];
525453dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
525553dd7562SDmitry Karpeev       v = Baij->a[count];
52569566063dSJacob Faibussowitsch       PetscCall(MatSetValues(C, 1, &row, 1, &col, &v, INSERT_VALUES));
525753dd7562SDmitry Karpeev       ++count;
525853dd7562SDmitry Karpeev     }
525953dd7562SDmitry Karpeev   }
526053dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
526153dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
526253dd7562SDmitry Karpeev   C->preallocated  = PETSC_TRUE;
526353dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
526453dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
526553dd7562SDmitry Karpeev   PetscFunctionReturn(0);
526653dd7562SDmitry Karpeev }
526753dd7562SDmitry Karpeev 
52684099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
52694099cc6bSBarry Smith 
52704099cc6bSBarry Smith /*@C
527111a5261eSBarry Smith    MatSeqAIJSetType - Converts a `MATSEQAIJ` matrix to a subtype
52724099cc6bSBarry Smith 
527311a5261eSBarry Smith    Collective on mat
52744099cc6bSBarry Smith 
52754099cc6bSBarry Smith    Input Parameters:
52764099cc6bSBarry Smith +  mat      - the matrix object
52774099cc6bSBarry Smith -  matype   - matrix type
52784099cc6bSBarry Smith 
52794099cc6bSBarry Smith    Options Database Key:
52804099cc6bSBarry Smith .  -mat_seqai_type  <method> - for example seqaijcrl
52814099cc6bSBarry Smith 
52824099cc6bSBarry Smith   Level: intermediate
52834099cc6bSBarry Smith 
5284db781477SPatrick Sanan .seealso: `PCSetType()`, `VecSetType()`, `MatCreate()`, `MatType`, `Mat`
52854099cc6bSBarry Smith @*/
5286d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJSetType(Mat mat, MatType matype)
5287d71ae5a4SJacob Faibussowitsch {
52884099cc6bSBarry Smith   PetscBool sametype;
52895f80ce2aSJacob Faibussowitsch   PetscErrorCode (*r)(Mat, MatType, MatReuse, Mat *);
52904099cc6bSBarry Smith 
52914099cc6bSBarry Smith   PetscFunctionBegin;
52924099cc6bSBarry Smith   PetscValidHeaderSpecific(mat, MAT_CLASSID, 1);
52939566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)mat, matype, &sametype));
52944099cc6bSBarry Smith   if (sametype) PetscFunctionReturn(0);
52954099cc6bSBarry Smith 
52969566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListFind(MatSeqAIJList, matype, &r));
52975f80ce2aSJacob Faibussowitsch   PetscCheck(r, PETSC_COMM_SELF, PETSC_ERR_ARG_UNKNOWN_TYPE, "Unknown Mat type given: %s", matype);
52989566063dSJacob Faibussowitsch   PetscCall((*r)(mat, matype, MAT_INPLACE_MATRIX, &mat));
52994099cc6bSBarry Smith   PetscFunctionReturn(0);
53004099cc6bSBarry Smith }
53014099cc6bSBarry Smith 
53024099cc6bSBarry Smith /*@C
530311a5261eSBarry Smith   MatSeqAIJRegister -  - Adds a new sub-matrix type for sequential `MATSEQAIJ` matrices
53044099cc6bSBarry Smith 
53054099cc6bSBarry Smith    Not Collective
53064099cc6bSBarry Smith 
53074099cc6bSBarry Smith    Input Parameters:
530811a5261eSBarry Smith +  name - name of a new user-defined matrix type, for example `MATSEQAIJCRL`
53094099cc6bSBarry Smith -  function - routine to convert to subtype
53104099cc6bSBarry Smith 
53114099cc6bSBarry Smith    Notes:
531211a5261eSBarry Smith    `MatSeqAIJRegister()` may be called multiple times to add several user-defined solvers.
53134099cc6bSBarry Smith 
53144099cc6bSBarry Smith    Then, your matrix can be chosen with the procedural interface at runtime via the option
53154099cc6bSBarry Smith $     -mat_seqaij_type my_mat
53164099cc6bSBarry Smith 
53174099cc6bSBarry Smith    Level: advanced
53184099cc6bSBarry Smith 
5319db781477SPatrick Sanan .seealso: `MatSeqAIJRegisterAll()`
53204099cc6bSBarry Smith @*/
5321d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegister(const char sname[], PetscErrorCode (*function)(Mat, MatType, MatReuse, Mat *))
5322d71ae5a4SJacob Faibussowitsch {
53234099cc6bSBarry Smith   PetscFunctionBegin;
53249566063dSJacob Faibussowitsch   PetscCall(MatInitializePackage());
53259566063dSJacob Faibussowitsch   PetscCall(PetscFunctionListAdd(&MatSeqAIJList, sname, function));
53264099cc6bSBarry Smith   PetscFunctionReturn(0);
53274099cc6bSBarry Smith }
53284099cc6bSBarry Smith 
53294099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
53304099cc6bSBarry Smith 
53314099cc6bSBarry Smith /*@C
533211a5261eSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of `MATSSEQAIJ`
53334099cc6bSBarry Smith 
53344099cc6bSBarry Smith   Not Collective
53354099cc6bSBarry Smith 
53364099cc6bSBarry Smith   Level: advanced
53374099cc6bSBarry Smith 
5338db781477SPatrick Sanan .seealso: `MatRegisterAll()`, `MatSeqAIJRegister()`
53394099cc6bSBarry Smith @*/
5340d71ae5a4SJacob Faibussowitsch PetscErrorCode MatSeqAIJRegisterAll(void)
5341d71ae5a4SJacob Faibussowitsch {
53424099cc6bSBarry Smith   PetscFunctionBegin;
53434099cc6bSBarry Smith   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0);
53444099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
53454099cc6bSBarry Smith 
53469566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCRL, MatConvert_SeqAIJ_SeqAIJCRL));
53479566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJPERM, MatConvert_SeqAIJ_SeqAIJPERM));
53489566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJSELL, MatConvert_SeqAIJ_SeqAIJSELL));
53499779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
53509566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJMKL, MatConvert_SeqAIJ_SeqAIJMKL));
5351485f9817SRichard Tran Mills #endif
53525063d097SStefano Zampini #if defined(PETSC_HAVE_CUDA)
53539566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJCUSPARSE, MatConvert_SeqAIJ_SeqAIJCUSPARSE));
53545063d097SStefano Zampini #endif
53555063d097SStefano Zampini #if defined(PETSC_HAVE_KOKKOS_KERNELS)
53569566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATSEQAIJKOKKOS, MatConvert_SeqAIJ_SeqAIJKokkos));
53575063d097SStefano Zampini #endif
53584099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
53599566063dSJacob Faibussowitsch   PetscCall(MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL));
53604099cc6bSBarry Smith #endif
53614099cc6bSBarry Smith   PetscFunctionReturn(0);
53624099cc6bSBarry Smith }
536353dd7562SDmitry Karpeev 
536453dd7562SDmitry Karpeev /*
536581824310SBarry Smith     Special version for direct calls from Fortran
536681824310SBarry Smith */
5367af0996ceSBarry Smith #include <petsc/private/fortranimpl.h>
536881824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS)
536981824310SBarry Smith   #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
537081824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
537181824310SBarry Smith   #define matsetvaluesseqaij_ matsetvaluesseqaij
537281824310SBarry Smith #endif
537381824310SBarry Smith 
537481824310SBarry Smith /* Change these macros so can be used in void function */
537598921bdaSJacob Faibussowitsch 
537698921bdaSJacob Faibussowitsch /* Change these macros so can be used in void function */
53779566063dSJacob Faibussowitsch /* Identical to PetscCallVoid, except it assigns to *_ierr */
53789566063dSJacob Faibussowitsch #undef PetscCall
53799371c9d4SSatish Balay #define PetscCall(...) \
53809371c9d4SSatish Balay   do { \
53815f80ce2aSJacob Faibussowitsch     PetscErrorCode ierr_msv_mpiaij = __VA_ARGS__; \
538298921bdaSJacob Faibussowitsch     if (PetscUnlikely(ierr_msv_mpiaij)) { \
538398921bdaSJacob Faibussowitsch       *_ierr = PetscError(PETSC_COMM_SELF, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr_msv_mpiaij, PETSC_ERROR_REPEAT, " "); \
538498921bdaSJacob Faibussowitsch       return; \
538598921bdaSJacob Faibussowitsch     } \
538698921bdaSJacob Faibussowitsch   } while (0)
538798921bdaSJacob Faibussowitsch 
538898921bdaSJacob Faibussowitsch #undef SETERRQ
53899371c9d4SSatish Balay #define SETERRQ(comm, ierr, ...) \
53909371c9d4SSatish Balay   do { \
539198921bdaSJacob Faibussowitsch     *_ierr = PetscError(comm, __LINE__, PETSC_FUNCTION_NAME, __FILE__, ierr, PETSC_ERROR_INITIAL, __VA_ARGS__); \
539298921bdaSJacob Faibussowitsch     return; \
539398921bdaSJacob Faibussowitsch   } while (0)
539481824310SBarry Smith 
/*
   matsetvaluesseqaij_ - Fortran-callable routine that inserts or adds an m by n block of values
   into a SeqAIJ matrix, working directly on the matrix's CSR arrays.

   Input Parameters:
+  AA   - pointer to the matrix
.  mm   - pointer to the number of rows in the block
.  im   - row indices; negative entries are skipped
.  nn   - pointer to the number of columns in the block
.  in   - column indices; negative entries are skipped
.  v    - the values, read as v[l + k*n] when the matrix is row oriented and v[k + l*m] otherwise
-  isis - pointer to the insert mode; ADD_VALUES accumulates, any other mode overwrites

   Output Parameter:
.  _ierr - receives the error code when a call wrapped in PetscCall() fails or SETERRQ() is raised
           (both are redefined just above this routine to store into *_ierr and return);
           NOTE(review): the PetscCheck() calls presumably report through the same path - confirm.
           It is not written on the successful path in the code visible here.

   NOTE(review): MatSeqXAIJReallocateAIJ is a macro defined outside this file section; it is passed
   the local arrays by name and presumably enlarges the row storage when the row is full - confirm
   against its definition before renaming or reordering any local variable here.
*/
5395d71ae5a4SJacob Faibussowitsch PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA, PetscInt *mm, const PetscInt im[], PetscInt *nn, const PetscInt in[], const PetscScalar v[], InsertMode *isis, PetscErrorCode *_ierr)
5396d71ae5a4SJacob Faibussowitsch {
539781824310SBarry Smith   Mat         A = *AA;
539881824310SBarry Smith   PetscInt    m = *mm, n = *nn;
539981824310SBarry Smith   InsertMode  is = *isis;
540081824310SBarry Smith   Mat_SeqAIJ *a  = (Mat_SeqAIJ *)A->data;
540181824310SBarry Smith   PetscInt   *rp, k, low, high, t, ii, row, nrow, i, col, l, rmax, N;
540281824310SBarry Smith   PetscInt   *imax, *ai, *ailen;
540381824310SBarry Smith   PetscInt   *aj, nonew = a->nonew, lastcol = -1;
540454f21887SBarry Smith   MatScalar  *ap, value, *aa;
5405ace3abfcSBarry Smith   PetscBool   ignorezeroentries = a->ignorezeroentries;
5406ace3abfcSBarry Smith   PetscBool   roworiented       = a->roworiented;
540781824310SBarry Smith 
540881824310SBarry Smith   PetscFunctionBegin;
54094994cf47SJed Brown   MatCheckPreallocated(A, 1);
/* local aliases for the CSR arrays and the per-row allocated (imax) and used (ilen) lengths */
541081824310SBarry Smith   imax  = a->imax;
541181824310SBarry Smith   ai    = a->i;
541281824310SBarry Smith   ailen = a->ilen;
541381824310SBarry Smith   aj    = a->j;
541481824310SBarry Smith   aa    = a->a;
541581824310SBarry Smith 
541681824310SBarry Smith   for (k = 0; k < m; k++) { /* loop over added rows */
541781824310SBarry Smith     row = im[k];
541881824310SBarry Smith     if (row < 0) continue;
54195f80ce2aSJacob Faibussowitsch     PetscCheck(row < A->rmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Row too large");
/* rp/ap: start of this row's column indices and values; rmax: allocated length; nrow: used length */
54209371c9d4SSatish Balay     rp   = aj + ai[row];
54219371c9d4SSatish Balay     ap   = aa + ai[row];
54229371c9d4SSatish Balay     rmax = imax[row];
54239371c9d4SSatish Balay     nrow = ailen[row];
/* [low, high) is the search window inside the row; it starts as the whole used part */
542481824310SBarry Smith     low  = 0;
542581824310SBarry Smith     high = nrow;
542681824310SBarry Smith     for (l = 0; l < n; l++) { /* loop over added columns */
542781824310SBarry Smith       if (in[l] < 0) continue;
54285f80ce2aSJacob Faibussowitsch       PetscCheck(in[l] < A->cmap->n, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Column too large");
542981824310SBarry Smith       col = in[l];
54302205254eSKarl Rupp       if (roworiented) value = v[l + k * n];
54312205254eSKarl Rupp       else value = v[k + l * m];
54322205254eSKarl Rupp 
/* adding an exact zero changes nothing, so it is skipped when zero entries are being ignored */
543381824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
543481824310SBarry Smith 
/* when the column did not increase, search again from the row start; otherwise keep low and reset high */
54352205254eSKarl Rupp       if (col <= lastcol) low = 0;
54362205254eSKarl Rupp       else high = nrow;
543781824310SBarry Smith       lastcol = col;
/* bisection narrows the window until at most 5 candidates remain */
543881824310SBarry Smith       while (high - low > 5) {
543981824310SBarry Smith         t = (low + high) / 2;
544081824310SBarry Smith         if (rp[t] > col) high = t;
544181824310SBarry Smith         else low = t;
544281824310SBarry Smith       }
/* linear scan of the remaining window: stops at the matching entry or at the insertion position i */
544381824310SBarry Smith       for (i = low; i < high; i++) {
544481824310SBarry Smith         if (rp[i] > col) break;
544581824310SBarry Smith         if (rp[i] == col) {
544681824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
544781824310SBarry Smith           else ap[i] = value;
544881824310SBarry Smith           goto noinsert;
544981824310SBarry Smith         }
545081824310SBarry Smith       }
/* the column is not stored yet: nonew == 1 drops the value silently, nonew == -1 raises an error */
545181824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
545281824310SBarry Smith       if (nonew == 1) goto noinsert;
54535f80ce2aSJacob Faibussowitsch       PetscCheck(nonew != -1, PetscObjectComm((PetscObject)A), PETSC_ERR_ARG_OUTOFRANGE, "Inserting a new nonzero in the matrix");
5454fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A, A->rmap->n, 1, nrow, row, col, rmax, aa, ai, aj, rp, ap, imax, nonew, MatScalar);
/* N is the index of the last used slot before the insertion; nrow, a->nz and high grow by one */
54559371c9d4SSatish Balay       N = nrow++ - 1;
54569371c9d4SSatish Balay       a->nz++;
54579371c9d4SSatish Balay       high++;
545881824310SBarry Smith       /* shift up all the later entries in this row */
545981824310SBarry Smith       for (ii = N; ii >= i; ii--) {
546081824310SBarry Smith         rp[ii + 1] = rp[ii];
546181824310SBarry Smith         ap[ii + 1] = ap[ii];
546281824310SBarry Smith       }
546381824310SBarry Smith       rp[i] = col;
546481824310SBarry Smith       ap[i] = value;
/* a new nonzero location was created, so the nonzero state of the matrix is advanced */
5465e56f5c9eSBarry Smith       A->nonzerostate++;
546681824310SBarry Smith     noinsert:;
/* the next search in this row starts just after the position that was found or filled */
546781824310SBarry Smith       low = i + 1;
546881824310SBarry Smith     }
/* store the possibly increased used length of the row */
546981824310SBarry Smith     ailen[row] = nrow;
547081824310SBarry Smith   }
547181824310SBarry Smith   PetscFunctionReturnVoid();
547281824310SBarry Smith }
547398921bdaSJacob Faibussowitsch /* Undefining these here since they were redefined from their original definition above! No
547498921bdaSJacob Faibussowitsch  * other PETSc functions should be defined past this point, as it is impossible to recover the
547598921bdaSJacob Faibussowitsch  * original definitions */
54769566063dSJacob Faibussowitsch #undef PetscCall
547798921bdaSJacob Faibussowitsch #undef SETERRQ
5478