xref: /petsc/src/mat/impls/aij/seq/aij.c (revision 6718818e67c4802797f2feae43fc3d52878b6955)
/*
    Defines the basic matrix operations for the AIJ (compressed row)
  matrix storage format.
*/
53369ce9aSBarry Smith 
67c4f633dSBarry Smith 
7c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/aij.h>          /*I "petscmat.h" I*/
8c6db04a5SJed Brown #include <petscblaslapack.h>
9c6db04a5SJed Brown #include <petscbt.h>
10af0996ceSBarry Smith #include <petsc/private/kernels/blocktranspose.h>
110716a85fSBarry Smith 
124099cc6bSBarry Smith PetscErrorCode MatSeqAIJSetTypeFromOptions(Mat A)
134099cc6bSBarry Smith {
144099cc6bSBarry Smith   PetscErrorCode       ierr;
154099cc6bSBarry Smith   PetscBool            flg;
164099cc6bSBarry Smith   char                 type[256];
174099cc6bSBarry Smith 
184099cc6bSBarry Smith   PetscFunctionBegin;
194099cc6bSBarry Smith   ierr = PetscObjectOptionsBegin((PetscObject)A);
204099cc6bSBarry Smith   ierr = PetscOptionsFList("-mat_seqaij_type","Matrix SeqAIJ type","MatSeqAIJSetType",MatSeqAIJList,"seqaij",type,256,&flg);CHKERRQ(ierr);
214099cc6bSBarry Smith   if (flg) {
224099cc6bSBarry Smith     ierr = MatSeqAIJSetType(A,type);CHKERRQ(ierr);
234099cc6bSBarry Smith   }
244099cc6bSBarry Smith   ierr = PetscOptionsEnd();CHKERRQ(ierr);
254099cc6bSBarry Smith   PetscFunctionReturn(0);
264099cc6bSBarry Smith }
274099cc6bSBarry Smith 
280716a85fSBarry Smith PetscErrorCode MatGetColumnNorms_SeqAIJ(Mat A,NormType type,PetscReal *norms)
290716a85fSBarry Smith {
300716a85fSBarry Smith   PetscErrorCode ierr;
310716a85fSBarry Smith   PetscInt       i,m,n;
320716a85fSBarry Smith   Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)A->data;
330716a85fSBarry Smith 
340716a85fSBarry Smith   PetscFunctionBegin;
350716a85fSBarry Smith   ierr = MatGetSize(A,&m,&n);CHKERRQ(ierr);
36580bdb30SBarry Smith   ierr = PetscArrayzero(norms,n);CHKERRQ(ierr);
370716a85fSBarry Smith   if (type == NORM_2) {
380716a85fSBarry Smith     for (i=0; i<aij->i[m]; i++) {
390716a85fSBarry Smith       norms[aij->j[i]] += PetscAbsScalar(aij->a[i]*aij->a[i]);
400716a85fSBarry Smith     }
410716a85fSBarry Smith   } else if (type == NORM_1) {
420716a85fSBarry Smith     for (i=0; i<aij->i[m]; i++) {
430716a85fSBarry Smith       norms[aij->j[i]] += PetscAbsScalar(aij->a[i]);
440716a85fSBarry Smith     }
450716a85fSBarry Smith   } else if (type == NORM_INFINITY) {
460716a85fSBarry Smith     for (i=0; i<aij->i[m]; i++) {
470716a85fSBarry Smith       norms[aij->j[i]] = PetscMax(PetscAbsScalar(aij->a[i]),norms[aij->j[i]]);
480716a85fSBarry Smith     }
490716a85fSBarry Smith   } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Unknown NormType");
500716a85fSBarry Smith 
510716a85fSBarry Smith   if (type == NORM_2) {
528f1a2a5eSBarry Smith     for (i=0; i<n; i++) norms[i] = PetscSqrtReal(norms[i]);
530716a85fSBarry Smith   }
540716a85fSBarry Smith   PetscFunctionReturn(0);
550716a85fSBarry Smith }
560716a85fSBarry Smith 
573a062f41SBarry Smith PetscErrorCode MatFindOffBlockDiagonalEntries_SeqAIJ(Mat A,IS *is)
583a062f41SBarry Smith {
593a062f41SBarry Smith   Mat_SeqAIJ      *a  = (Mat_SeqAIJ*)A->data;
603a062f41SBarry Smith   PetscInt        i,m=A->rmap->n,cnt = 0, bs = A->rmap->bs;
613a062f41SBarry Smith   const PetscInt  *jj = a->j,*ii = a->i;
623a062f41SBarry Smith   PetscInt        *rows;
633a062f41SBarry Smith   PetscErrorCode  ierr;
643a062f41SBarry Smith 
653a062f41SBarry Smith   PetscFunctionBegin;
663a062f41SBarry Smith   for (i=0; i<m; i++) {
673a062f41SBarry Smith     if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) {
683a062f41SBarry Smith       cnt++;
693a062f41SBarry Smith     }
703a062f41SBarry Smith   }
713a062f41SBarry Smith   ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr);
723a062f41SBarry Smith   cnt  = 0;
733a062f41SBarry Smith   for (i=0; i<m; i++) {
743a062f41SBarry Smith     if ((ii[i] != ii[i+1]) && ((jj[ii[i]] < bs*(i/bs)) || (jj[ii[i+1]-1] > bs*((i+bs)/bs)-1))) {
753a062f41SBarry Smith       rows[cnt] = i;
763a062f41SBarry Smith       cnt++;
773a062f41SBarry Smith     }
783a062f41SBarry Smith   }
793a062f41SBarry Smith   ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,is);CHKERRQ(ierr);
803a062f41SBarry Smith   PetscFunctionReturn(0);
813a062f41SBarry Smith }
823a062f41SBarry Smith 
83f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ_Private(Mat A,PetscInt *nrows,PetscInt **zrows)
846ce1633cSBarry Smith {
856ce1633cSBarry Smith   Mat_SeqAIJ      *a  = (Mat_SeqAIJ*)A->data;
866ce1633cSBarry Smith   const MatScalar *aa = a->a;
876ce1633cSBarry Smith   PetscInt        i,m=A->rmap->n,cnt = 0;
88b2db7409Sstefano_zampini   const PetscInt  *ii = a->i,*jj = a->j,*diag;
896ce1633cSBarry Smith   PetscInt        *rows;
906ce1633cSBarry Smith   PetscErrorCode  ierr;
916ce1633cSBarry Smith 
926ce1633cSBarry Smith   PetscFunctionBegin;
936ce1633cSBarry Smith   ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr);
946ce1633cSBarry Smith   diag = a->diag;
956ce1633cSBarry Smith   for (i=0; i<m; i++) {
96b2db7409Sstefano_zampini     if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) {
976ce1633cSBarry Smith       cnt++;
986ce1633cSBarry Smith     }
996ce1633cSBarry Smith   }
100785e854fSJed Brown   ierr = PetscMalloc1(cnt,&rows);CHKERRQ(ierr);
1016ce1633cSBarry Smith   cnt  = 0;
1026ce1633cSBarry Smith   for (i=0; i<m; i++) {
103b2db7409Sstefano_zampini     if ((diag[i] >= ii[i+1]) || (jj[diag[i]] != i) || (aa[diag[i]] == 0.0)) {
1046ce1633cSBarry Smith       rows[cnt++] = i;
1056ce1633cSBarry Smith     }
1066ce1633cSBarry Smith   }
107f1f41ecbSJed Brown   *nrows = cnt;
108f1f41ecbSJed Brown   *zrows = rows;
109f1f41ecbSJed Brown   PetscFunctionReturn(0);
110f1f41ecbSJed Brown }
111f1f41ecbSJed Brown 
112f1f41ecbSJed Brown PetscErrorCode MatFindZeroDiagonals_SeqAIJ(Mat A,IS *zrows)
113f1f41ecbSJed Brown {
114f1f41ecbSJed Brown   PetscInt       nrows,*rows;
115f1f41ecbSJed Brown   PetscErrorCode ierr;
116f1f41ecbSJed Brown 
117f1f41ecbSJed Brown   PetscFunctionBegin;
1180298fd71SBarry Smith   *zrows = NULL;
119f1f41ecbSJed Brown   ierr   = MatFindZeroDiagonals_SeqAIJ_Private(A,&nrows,&rows);CHKERRQ(ierr);
120ce94432eSBarry Smith   ierr   = ISCreateGeneral(PetscObjectComm((PetscObject)A),nrows,rows,PETSC_OWN_POINTER,zrows);CHKERRQ(ierr);
1216ce1633cSBarry Smith   PetscFunctionReturn(0);
1226ce1633cSBarry Smith }
1236ce1633cSBarry Smith 
124b3a44c85SBarry Smith PetscErrorCode MatFindNonzeroRows_SeqAIJ(Mat A,IS *keptrows)
125b3a44c85SBarry Smith {
126b3a44c85SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ*)A->data;
127b3a44c85SBarry Smith   const MatScalar *aa;
128b3a44c85SBarry Smith   PetscInt        m=A->rmap->n,cnt = 0;
129b3a44c85SBarry Smith   const PetscInt  *ii;
130b3a44c85SBarry Smith   PetscInt        n,i,j,*rows;
131b3a44c85SBarry Smith   PetscErrorCode  ierr;
132b3a44c85SBarry Smith 
133b3a44c85SBarry Smith   PetscFunctionBegin;
134b3a44c85SBarry Smith   *keptrows = 0;
135b3a44c85SBarry Smith   ii        = a->i;
136b3a44c85SBarry Smith   for (i=0; i<m; i++) {
137b3a44c85SBarry Smith     n = ii[i+1] - ii[i];
138b3a44c85SBarry Smith     if (!n) {
139b3a44c85SBarry Smith       cnt++;
140b3a44c85SBarry Smith       goto ok1;
141b3a44c85SBarry Smith     }
142b3a44c85SBarry Smith     aa = a->a + ii[i];
143b3a44c85SBarry Smith     for (j=0; j<n; j++) {
144b3a44c85SBarry Smith       if (aa[j] != 0.0) goto ok1;
145b3a44c85SBarry Smith     }
146b3a44c85SBarry Smith     cnt++;
147b3a44c85SBarry Smith ok1:;
148b3a44c85SBarry Smith   }
149b3a44c85SBarry Smith   if (!cnt) PetscFunctionReturn(0);
150854ce69bSBarry Smith   ierr = PetscMalloc1(A->rmap->n-cnt,&rows);CHKERRQ(ierr);
151b3a44c85SBarry Smith   cnt  = 0;
152b3a44c85SBarry Smith   for (i=0; i<m; i++) {
153b3a44c85SBarry Smith     n = ii[i+1] - ii[i];
154b3a44c85SBarry Smith     if (!n) continue;
155b3a44c85SBarry Smith     aa = a->a + ii[i];
156b3a44c85SBarry Smith     for (j=0; j<n; j++) {
157b3a44c85SBarry Smith       if (aa[j] != 0.0) {
158b3a44c85SBarry Smith         rows[cnt++] = i;
159b3a44c85SBarry Smith         break;
160b3a44c85SBarry Smith       }
161b3a44c85SBarry Smith     }
162b3a44c85SBarry Smith   }
163b3a44c85SBarry Smith   ierr = ISCreateGeneral(PETSC_COMM_SELF,cnt,rows,PETSC_OWN_POINTER,keptrows);CHKERRQ(ierr);
164b3a44c85SBarry Smith   PetscFunctionReturn(0);
165b3a44c85SBarry Smith }
166b3a44c85SBarry Smith 
1677087cfbeSBarry Smith PetscErrorCode  MatDiagonalSet_SeqAIJ(Mat Y,Vec D,InsertMode is)
16879299369SBarry Smith {
16979299369SBarry Smith   PetscErrorCode    ierr;
17079299369SBarry Smith   Mat_SeqAIJ        *aij = (Mat_SeqAIJ*) Y->data;
17199e65526SBarry Smith   PetscInt          i,m = Y->rmap->n;
17299e65526SBarry Smith   const PetscInt    *diag;
17354f21887SBarry Smith   MatScalar         *aa = aij->a;
17499e65526SBarry Smith   const PetscScalar *v;
175ace3abfcSBarry Smith   PetscBool         missing;
176837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
177837a59e1SRichard Tran Mills   PetscBool         inserted = PETSC_FALSE;
178837a59e1SRichard Tran Mills #endif
17979299369SBarry Smith 
18079299369SBarry Smith   PetscFunctionBegin;
18109f38230SBarry Smith   if (Y->assembled) {
1820298fd71SBarry Smith     ierr = MatMissingDiagonal_SeqAIJ(Y,&missing,NULL);CHKERRQ(ierr);
18309f38230SBarry Smith     if (!missing) {
18479299369SBarry Smith       diag = aij->diag;
18599e65526SBarry Smith       ierr = VecGetArrayRead(D,&v);CHKERRQ(ierr);
18679299369SBarry Smith       if (is == INSERT_VALUES) {
187837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
188837a59e1SRichard Tran Mills         inserted = PETSC_TRUE;
189837a59e1SRichard Tran Mills #endif
19079299369SBarry Smith         for (i=0; i<m; i++) {
19179299369SBarry Smith           aa[diag[i]] = v[i];
19279299369SBarry Smith         }
19379299369SBarry Smith       } else {
19479299369SBarry Smith         for (i=0; i<m; i++) {
195837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
196837a59e1SRichard Tran Mills           if (v[i] != 0.0) inserted = PETSC_TRUE;
197837a59e1SRichard Tran Mills #endif
19879299369SBarry Smith           aa[diag[i]] += v[i];
19979299369SBarry Smith         }
20079299369SBarry Smith       }
201837a59e1SRichard Tran Mills #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
202837a59e1SRichard Tran Mills       if (inserted) Y->offloadmask = PETSC_OFFLOAD_CPU;
203837a59e1SRichard Tran Mills #endif
20499e65526SBarry Smith       ierr = VecRestoreArrayRead(D,&v);CHKERRQ(ierr);
20579299369SBarry Smith       PetscFunctionReturn(0);
20679299369SBarry Smith     }
207acf2f550SJed Brown     ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr);
20809f38230SBarry Smith   }
20909f38230SBarry Smith   ierr = MatDiagonalSet_Default(Y,D,is);CHKERRQ(ierr);
21009f38230SBarry Smith   PetscFunctionReturn(0);
21109f38230SBarry Smith }
21279299369SBarry Smith 
2131a83f524SJed Brown PetscErrorCode MatGetRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *m,const PetscInt *ia[],const PetscInt *ja[],PetscBool  *done)
21417ab2063SBarry Smith {
215416022c9SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
216dfbe8321SBarry Smith   PetscErrorCode ierr;
21797f1f81fSBarry Smith   PetscInt       i,ishift;
21817ab2063SBarry Smith 
2193a40ed3dSBarry Smith   PetscFunctionBegin;
220d0f46423SBarry Smith   *m = A->rmap->n;
2213a40ed3dSBarry Smith   if (!ia) PetscFunctionReturn(0);
222bfeeae90SHong Zhang   ishift = 0;
22353e63a63SBarry Smith   if (symmetric && !A->structurally_symmetric) {
2242462f5fdSStefano Zampini     ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,ishift,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr);
225bfeeae90SHong Zhang   } else if (oshift == 1) {
2261a83f524SJed Brown     PetscInt *tia;
227d0f46423SBarry Smith     PetscInt nz = a->i[A->rmap->n];
2283b2fbd54SBarry Smith     /* malloc space and  add 1 to i and j indices */
229854ce69bSBarry Smith     ierr = PetscMalloc1(A->rmap->n+1,&tia);CHKERRQ(ierr);
2301a83f524SJed Brown     for (i=0; i<A->rmap->n+1; i++) tia[i] = a->i[i] + 1;
2311a83f524SJed Brown     *ia = tia;
232ecc77c7aSBarry Smith     if (ja) {
2331a83f524SJed Brown       PetscInt *tja;
234854ce69bSBarry Smith       ierr = PetscMalloc1(nz+1,&tja);CHKERRQ(ierr);
2351a83f524SJed Brown       for (i=0; i<nz; i++) tja[i] = a->j[i] + 1;
2361a83f524SJed Brown       *ja = tja;
237ecc77c7aSBarry Smith     }
2386945ee14SBarry Smith   } else {
239ecc77c7aSBarry Smith     *ia = a->i;
240ecc77c7aSBarry Smith     if (ja) *ja = a->j;
241a2ce50c7SBarry Smith   }
2423a40ed3dSBarry Smith   PetscFunctionReturn(0);
243a2744918SBarry Smith }
244a2744918SBarry Smith 
2451a83f524SJed Brown PetscErrorCode MatRestoreRowIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool  *done)
2466945ee14SBarry Smith {
247dfbe8321SBarry Smith   PetscErrorCode ierr;
2486945ee14SBarry Smith 
2493a40ed3dSBarry Smith   PetscFunctionBegin;
2503a40ed3dSBarry Smith   if (!ia) PetscFunctionReturn(0);
251bfeeae90SHong Zhang   if ((symmetric && !A->structurally_symmetric) || oshift == 1) {
252606d414cSSatish Balay     ierr = PetscFree(*ia);CHKERRQ(ierr);
253ecc77c7aSBarry Smith     if (ja) {ierr = PetscFree(*ja);CHKERRQ(ierr);}
254bcd2baecSBarry Smith   }
2553a40ed3dSBarry Smith   PetscFunctionReturn(0);
25617ab2063SBarry Smith }
25717ab2063SBarry Smith 
2581a83f524SJed Brown PetscErrorCode MatGetColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscBool  *done)
2593b2fbd54SBarry Smith {
2603b2fbd54SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
261dfbe8321SBarry Smith   PetscErrorCode ierr;
262d0f46423SBarry Smith   PetscInt       i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n;
26397f1f81fSBarry Smith   PetscInt       nz = a->i[m],row,*jj,mr,col;
2643b2fbd54SBarry Smith 
2653a40ed3dSBarry Smith   PetscFunctionBegin;
266899cda47SBarry Smith   *nn = n;
2673a40ed3dSBarry Smith   if (!ia) PetscFunctionReturn(0);
2683b2fbd54SBarry Smith   if (symmetric) {
2692462f5fdSStefano Zampini     ierr = MatToSymmetricIJ_SeqAIJ(A->rmap->n,a->i,a->j,PETSC_TRUE,0,oshift,(PetscInt**)ia,(PetscInt**)ja);CHKERRQ(ierr);
2703b2fbd54SBarry Smith   } else {
271b9e7e5c1SBarry Smith     ierr = PetscCalloc1(n,&collengths);CHKERRQ(ierr);
272854ce69bSBarry Smith     ierr = PetscMalloc1(n+1,&cia);CHKERRQ(ierr);
273b9e7e5c1SBarry Smith     ierr = PetscMalloc1(nz,&cja);CHKERRQ(ierr);
2743b2fbd54SBarry Smith     jj   = a->j;
2753b2fbd54SBarry Smith     for (i=0; i<nz; i++) {
276bfeeae90SHong Zhang       collengths[jj[i]]++;
2773b2fbd54SBarry Smith     }
2783b2fbd54SBarry Smith     cia[0] = oshift;
2793b2fbd54SBarry Smith     for (i=0; i<n; i++) {
2803b2fbd54SBarry Smith       cia[i+1] = cia[i] + collengths[i];
2813b2fbd54SBarry Smith     }
282580bdb30SBarry Smith     ierr = PetscArrayzero(collengths,n);CHKERRQ(ierr);
2833b2fbd54SBarry Smith     jj   = a->j;
284a93ec695SBarry Smith     for (row=0; row<m; row++) {
285a93ec695SBarry Smith       mr = a->i[row+1] - a->i[row];
286a93ec695SBarry Smith       for (i=0; i<mr; i++) {
287bfeeae90SHong Zhang         col = *jj++;
2882205254eSKarl Rupp 
2893b2fbd54SBarry Smith         cja[cia[col] + collengths[col]++ - oshift] = row + oshift;
2903b2fbd54SBarry Smith       }
2913b2fbd54SBarry Smith     }
292606d414cSSatish Balay     ierr = PetscFree(collengths);CHKERRQ(ierr);
2933b2fbd54SBarry Smith     *ia  = cia; *ja = cja;
2943b2fbd54SBarry Smith   }
2953a40ed3dSBarry Smith   PetscFunctionReturn(0);
2963b2fbd54SBarry Smith }
2973b2fbd54SBarry Smith 
2981a83f524SJed Brown PetscErrorCode MatRestoreColumnIJ_SeqAIJ(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscBool  *done)
2993b2fbd54SBarry Smith {
300dfbe8321SBarry Smith   PetscErrorCode ierr;
301606d414cSSatish Balay 
3023a40ed3dSBarry Smith   PetscFunctionBegin;
3033a40ed3dSBarry Smith   if (!ia) PetscFunctionReturn(0);
3043b2fbd54SBarry Smith 
305606d414cSSatish Balay   ierr = PetscFree(*ia);CHKERRQ(ierr);
306606d414cSSatish Balay   ierr = PetscFree(*ja);CHKERRQ(ierr);
3073a40ed3dSBarry Smith   PetscFunctionReturn(0);
3083b2fbd54SBarry Smith }
3093b2fbd54SBarry Smith 
/*
 MatGetColumnIJ_SeqAIJ_Color() and MatRestoreColumnIJ_SeqAIJ_Color() are customized versions of
 MatGetColumnIJ_SeqAIJ() and MatRestoreColumnIJ_SeqAIJ(). They add one output, spidx[], which
 gives for every entry of the column-oriented structure its index into a->a; it is used in
 MatTransposeColoringCreate_SeqAIJ() and MatFDColoringCreate_SeqXAIJ().
*/
3157cee066cSHong Zhang PetscErrorCode MatGetColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *nn,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool  *done)
3167cee066cSHong Zhang {
3177cee066cSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
3187cee066cSHong Zhang   PetscErrorCode ierr;
3197cee066cSHong Zhang   PetscInt       i,*collengths,*cia,*cja,n = A->cmap->n,m = A->rmap->n;
320071fcb05SBarry Smith   PetscInt       nz = a->i[m],row,mr,col,tmp;
3217cee066cSHong Zhang   PetscInt       *cspidx;
322071fcb05SBarry Smith   const PetscInt *jj;
3237cee066cSHong Zhang 
3247cee066cSHong Zhang   PetscFunctionBegin;
3257cee066cSHong Zhang   *nn = n;
3267cee066cSHong Zhang   if (!ia) PetscFunctionReturn(0);
327625f6d37SHong Zhang 
328b9e7e5c1SBarry Smith   ierr = PetscCalloc1(n,&collengths);CHKERRQ(ierr);
329854ce69bSBarry Smith   ierr = PetscMalloc1(n+1,&cia);CHKERRQ(ierr);
330b9e7e5c1SBarry Smith   ierr = PetscMalloc1(nz,&cja);CHKERRQ(ierr);
331b9e7e5c1SBarry Smith   ierr = PetscMalloc1(nz,&cspidx);CHKERRQ(ierr);
3327cee066cSHong Zhang   jj   = a->j;
3337cee066cSHong Zhang   for (i=0; i<nz; i++) {
3347cee066cSHong Zhang     collengths[jj[i]]++;
3357cee066cSHong Zhang   }
3367cee066cSHong Zhang   cia[0] = oshift;
3377cee066cSHong Zhang   for (i=0; i<n; i++) {
3387cee066cSHong Zhang     cia[i+1] = cia[i] + collengths[i];
3397cee066cSHong Zhang   }
340580bdb30SBarry Smith   ierr = PetscArrayzero(collengths,n);CHKERRQ(ierr);
3417cee066cSHong Zhang   jj   = a->j;
3427cee066cSHong Zhang   for (row=0; row<m; row++) {
3437cee066cSHong Zhang     mr = a->i[row+1] - a->i[row];
3447cee066cSHong Zhang     for (i=0; i<mr; i++) {
3457cee066cSHong Zhang       col         = *jj++;
346071fcb05SBarry Smith       tmp         = cia[col] + collengths[col]++ - oshift;
347071fcb05SBarry Smith       cspidx[tmp] = a->i[row] + i; /* index of a->j */
348071fcb05SBarry Smith       cja[tmp]    = row + oshift;
3497cee066cSHong Zhang     }
3507cee066cSHong Zhang   }
3517cee066cSHong Zhang   ierr   = PetscFree(collengths);CHKERRQ(ierr);
352071fcb05SBarry Smith   *ia    = cia;
353071fcb05SBarry Smith   *ja    = cja;
3547cee066cSHong Zhang   *spidx = cspidx;
3557cee066cSHong Zhang   PetscFunctionReturn(0);
3567cee066cSHong Zhang }
3577cee066cSHong Zhang 
3587cee066cSHong Zhang PetscErrorCode MatRestoreColumnIJ_SeqAIJ_Color(Mat A,PetscInt oshift,PetscBool symmetric,PetscBool inodecompressed,PetscInt *n,const PetscInt *ia[],const PetscInt *ja[],PetscInt *spidx[],PetscBool  *done)
3597cee066cSHong Zhang {
3607cee066cSHong Zhang   PetscErrorCode ierr;
3617cee066cSHong Zhang 
3627cee066cSHong Zhang   PetscFunctionBegin;
3635243ef75SHong Zhang   ierr = MatRestoreColumnIJ_SeqAIJ(A,oshift,symmetric,inodecompressed,n,ia,ja,done);CHKERRQ(ierr);
3647cee066cSHong Zhang   ierr = PetscFree(*spidx);CHKERRQ(ierr);
3657cee066cSHong Zhang   PetscFunctionReturn(0);
3667cee066cSHong Zhang }
3677cee066cSHong Zhang 
36887d4246cSBarry Smith PetscErrorCode MatSetValuesRow_SeqAIJ(Mat A,PetscInt row,const PetscScalar v[])
36987d4246cSBarry Smith {
37087d4246cSBarry Smith   Mat_SeqAIJ     *a  = (Mat_SeqAIJ*)A->data;
37187d4246cSBarry Smith   PetscInt       *ai = a->i;
37287d4246cSBarry Smith   PetscErrorCode ierr;
37387d4246cSBarry Smith 
37487d4246cSBarry Smith   PetscFunctionBegin;
375580bdb30SBarry Smith   ierr = PetscArraycpy(a->a+ai[row],v,ai[row+1]-ai[row]);CHKERRQ(ierr);
376e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
377c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && ai[row+1]-ai[row]) A->offloadmask = PETSC_OFFLOAD_CPU;
378e2cf4d64SStefano Zampini #endif
37987d4246cSBarry Smith   PetscFunctionReturn(0);
38087d4246cSBarry Smith }
38187d4246cSBarry Smith 
/*
    MatSeqAIJSetValuesLocalFast - An optimized version of MatSetValuesLocal() for SeqAIJ matrices
    that relies on the following assumptions:

      -   a single row of values is set with each call
      -   no row or column index is negative or (in error) larger than the number of rows or columns
      -   the values are always added to the matrix, never inserted
      -   no new locations are introduced in the nonzero structure of the matrix

     This does NOT assume that the global column indices are sorted.

*/
393bd04181cSBarry Smith 
394af0996ceSBarry Smith #include <petsc/private/isimpl.h>
395189e4007SBarry Smith PetscErrorCode MatSeqAIJSetValuesLocalFast(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)
396189e4007SBarry Smith {
397189e4007SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
3981f763a69SBarry Smith   PetscInt       low,high,t,row,nrow,i,col,l;
3991f763a69SBarry Smith   const PetscInt *rp,*ai = a->i,*ailen = a->ilen,*aj = a->j;
4001f763a69SBarry Smith   PetscInt       lastcol = -1;
401189e4007SBarry Smith   MatScalar      *ap,value,*aa = a->a;
402189e4007SBarry Smith   const PetscInt *ridx = A->rmap->mapping->indices,*cidx = A->cmap->mapping->indices;
403189e4007SBarry Smith 
404f38dd0b8SBarry Smith   row  = ridx[im[0]];
4051f763a69SBarry Smith   rp   = aj + ai[row];
4061f763a69SBarry Smith   ap   = aa + ai[row];
4071f763a69SBarry Smith   nrow = ailen[row];
408189e4007SBarry Smith   low  = 0;
409189e4007SBarry Smith   high = nrow;
410189e4007SBarry Smith   for (l=0; l<n; l++) { /* loop over added columns */
411189e4007SBarry Smith     col = cidx[in[l]];
412f38dd0b8SBarry Smith     value = v[l];
413189e4007SBarry Smith 
414189e4007SBarry Smith     if (col <= lastcol) low = 0;
415189e4007SBarry Smith     else high = nrow;
416189e4007SBarry Smith     lastcol = col;
417189e4007SBarry Smith     while (high-low > 5) {
418189e4007SBarry Smith       t = (low+high)/2;
419189e4007SBarry Smith       if (rp[t] > col) high = t;
420189e4007SBarry Smith       else low = t;
421189e4007SBarry Smith     }
422189e4007SBarry Smith     for (i=low; i<high; i++) {
423189e4007SBarry Smith       if (rp[i] == col) {
4241f763a69SBarry Smith         ap[i] += value;
425189e4007SBarry Smith         low = i + 1;
4261f763a69SBarry Smith         break;
427189e4007SBarry Smith       }
428189e4007SBarry Smith     }
429189e4007SBarry Smith   }
430e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
431c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && m && n) A->offloadmask = PETSC_OFFLOAD_CPU;
432e2cf4d64SStefano Zampini #endif
433f38dd0b8SBarry Smith   return 0;
434189e4007SBarry Smith }
435189e4007SBarry Smith 
43697f1f81fSBarry Smith PetscErrorCode MatSetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)
43717ab2063SBarry Smith {
438416022c9SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
439e2ee6c50SBarry Smith   PetscInt       *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N;
44097f1f81fSBarry Smith   PetscInt       *imax = a->imax,*ai = a->i,*ailen = a->ilen;
4416849ba73SBarry Smith   PetscErrorCode ierr;
442e2ee6c50SBarry Smith   PetscInt       *aj = a->j,nonew = a->nonew,lastcol = -1;
443d8cdefa3SHong Zhang   MatScalar      *ap=NULL,value=0.0,*aa = a->a;
444ace3abfcSBarry Smith   PetscBool      ignorezeroentries = a->ignorezeroentries;
445ace3abfcSBarry Smith   PetscBool      roworiented       = a->roworiented;
446e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
447e2cf4d64SStefano Zampini   PetscBool      inserted          = PETSC_FALSE;
448e2cf4d64SStefano Zampini #endif
44917ab2063SBarry Smith 
4503a40ed3dSBarry Smith   PetscFunctionBegin;
45117ab2063SBarry Smith   for (k=0; k<m; k++) { /* loop over added rows */
452416022c9SBarry Smith     row = im[k];
4535ef9f2a5SBarry Smith     if (row < 0) continue;
454cf9c20a2SJed Brown     if (PetscUnlikelyDebug(row >= A->rmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1);
455720833daSHong Zhang     rp   = aj + ai[row];
456876c6284SHong Zhang     if (!A->structure_only) ap = aa + ai[row];
45717ab2063SBarry Smith     rmax = imax[row]; nrow = ailen[row];
458416022c9SBarry Smith     low  = 0;
459c71e6ed7SBarry Smith     high = nrow;
46017ab2063SBarry Smith     for (l=0; l<n; l++) { /* loop over added columns */
4615ef9f2a5SBarry Smith       if (in[l] < 0) continue;
462cf9c20a2SJed Brown       if (PetscUnlikelyDebug(in[l] >= A->cmap->n)) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1);
463bfeeae90SHong Zhang       col = in[l];
464071fcb05SBarry Smith       if (v && !A->structure_only) value = roworiented ? v[l + k*n] : v[k + l*m];
465071fcb05SBarry Smith       if (!A->structure_only && value == 0.0 && ignorezeroentries && is == ADD_VALUES && row != col) continue;
46636db0b34SBarry Smith 
4672205254eSKarl Rupp       if (col <= lastcol) low = 0;
4682205254eSKarl Rupp       else high = nrow;
469e2ee6c50SBarry Smith       lastcol = col;
470416022c9SBarry Smith       while (high-low > 5) {
471416022c9SBarry Smith         t = (low+high)/2;
472416022c9SBarry Smith         if (rp[t] > col) high = t;
473416022c9SBarry Smith         else low = t;
47417ab2063SBarry Smith       }
475416022c9SBarry Smith       for (i=low; i<high; i++) {
47617ab2063SBarry Smith         if (rp[i] > col) break;
47717ab2063SBarry Smith         if (rp[i] == col) {
478876c6284SHong Zhang           if (!A->structure_only) {
4790c0d7e18SFande Kong             if (is == ADD_VALUES) {
4800c0d7e18SFande Kong               ap[i] += value;
4810c0d7e18SFande Kong               (void)PetscLogFlops(1.0);
4820c0d7e18SFande Kong             }
48317ab2063SBarry Smith             else ap[i] = value;
484e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
485e2cf4d64SStefano Zampini             inserted = PETSC_TRUE;
486e2cf4d64SStefano Zampini #endif
487720833daSHong Zhang           }
488e44c0bd4SBarry Smith           low = i + 1;
48917ab2063SBarry Smith           goto noinsert;
49017ab2063SBarry Smith         }
49117ab2063SBarry Smith       }
492dcd36c23SBarry Smith       if (value == 0.0 && ignorezeroentries && row != col) goto noinsert;
493c2653b3dSLois Curfman McInnes       if (nonew == 1) goto noinsert;
494e32f2f54SBarry Smith       if (nonew == -1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero at (%D,%D) in the matrix",row,col);
495720833daSHong Zhang       if (A->structure_only) {
496876c6284SHong Zhang         MatSeqXAIJReallocateAIJ_structure_only(A,A->rmap->n,1,nrow,row,col,rmax,ai,aj,rp,imax,nonew,MatScalar);
497720833daSHong Zhang       } else {
498fef13f97SBarry Smith         MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar);
499720833daSHong Zhang       }
500c03d1d03SSatish Balay       N = nrow++ - 1; a->nz++; high++;
501416022c9SBarry Smith       /* shift up all the later entries in this row */
502580bdb30SBarry Smith       ierr  = PetscArraymove(rp+i+1,rp+i,N-i+1);CHKERRQ(ierr);
50317ab2063SBarry Smith       rp[i] = col;
504580bdb30SBarry Smith       if (!A->structure_only){
505580bdb30SBarry Smith         ierr  = PetscArraymove(ap+i+1,ap+i,N-i+1);CHKERRQ(ierr);
506580bdb30SBarry Smith         ap[i] = value;
507580bdb30SBarry Smith       }
508416022c9SBarry Smith       low = i + 1;
509e56f5c9eSBarry Smith       A->nonzerostate++;
510e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
511e2cf4d64SStefano Zampini       inserted = PETSC_TRUE;
512e2cf4d64SStefano Zampini #endif
513e44c0bd4SBarry Smith noinsert:;
51417ab2063SBarry Smith     }
51517ab2063SBarry Smith     ailen[row] = nrow;
51617ab2063SBarry Smith   }
517e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
518c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && inserted) A->offloadmask = PETSC_OFFLOAD_CPU;
519e2cf4d64SStefano Zampini #endif
5203a40ed3dSBarry Smith   PetscFunctionReturn(0);
52117ab2063SBarry Smith }
52217ab2063SBarry Smith 
523071fcb05SBarry Smith PetscErrorCode MatSetValues_SeqAIJ_SortedFull(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],const PetscScalar v[],InsertMode is)
524071fcb05SBarry Smith {
525071fcb05SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
526071fcb05SBarry Smith   PetscInt       *rp,k,row;
527071fcb05SBarry Smith   PetscInt       *ai = a->i,*ailen = a->ilen;
528071fcb05SBarry Smith   PetscErrorCode ierr;
529071fcb05SBarry Smith   PetscInt       *aj = a->j;
530071fcb05SBarry Smith   MatScalar      *aa = a->a,*ap;
531071fcb05SBarry Smith 
532071fcb05SBarry Smith   PetscFunctionBegin;
533071fcb05SBarry Smith   for (k=0; k<m; k++) { /* loop over added rows */
534071fcb05SBarry Smith     row  = im[k];
535071fcb05SBarry Smith     rp   = aj + ai[row];
536071fcb05SBarry Smith     ap   = aa + ai[row];
537071fcb05SBarry Smith     if (!A->was_assembled) {
538071fcb05SBarry Smith       ierr = PetscMemcpy(rp,in,n*sizeof(PetscInt));CHKERRQ(ierr);
539071fcb05SBarry Smith     }
540071fcb05SBarry Smith     if (!A->structure_only) {
541071fcb05SBarry Smith       if (v) {
542071fcb05SBarry Smith         ierr = PetscMemcpy(ap,v,n*sizeof(PetscScalar));CHKERRQ(ierr);
543071fcb05SBarry Smith         v   += n;
544071fcb05SBarry Smith       } else {
545071fcb05SBarry Smith         ierr = PetscMemzero(ap,n*sizeof(PetscScalar));CHKERRQ(ierr);
546071fcb05SBarry Smith       }
547071fcb05SBarry Smith     }
548071fcb05SBarry Smith     ailen[row] = n;
549071fcb05SBarry Smith     a->nz      += n;
550071fcb05SBarry Smith   }
551e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
552c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED && m && n) A->offloadmask = PETSC_OFFLOAD_CPU;
553e2cf4d64SStefano Zampini #endif
554071fcb05SBarry Smith   PetscFunctionReturn(0);
555071fcb05SBarry Smith }
556071fcb05SBarry Smith 
55781824310SBarry Smith 
558a77337e4SBarry Smith PetscErrorCode MatGetValues_SeqAIJ(Mat A,PetscInt m,const PetscInt im[],PetscInt n,const PetscInt in[],PetscScalar v[])
5597eb43aa7SLois Curfman McInnes {
5607eb43aa7SLois Curfman McInnes   Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data;
56197f1f81fSBarry Smith   PetscInt   *rp,k,low,high,t,row,nrow,i,col,l,*aj = a->j;
56297f1f81fSBarry Smith   PetscInt   *ai = a->i,*ailen = a->ilen;
56354f21887SBarry Smith   MatScalar  *ap,*aa = a->a;
5647eb43aa7SLois Curfman McInnes 
5653a40ed3dSBarry Smith   PetscFunctionBegin;
5667eb43aa7SLois Curfman McInnes   for (k=0; k<m; k++) { /* loop over rows */
5677eb43aa7SLois Curfman McInnes     row = im[k];
568e32f2f54SBarry Smith     if (row < 0) {v += n; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row: %D",row); */
569e32f2f54SBarry Smith     if (row >= A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row too large: row %D max %D",row,A->rmap->n-1);
570bfeeae90SHong Zhang     rp   = aj + ai[row]; ap = aa + ai[row];
5717eb43aa7SLois Curfman McInnes     nrow = ailen[row];
5727eb43aa7SLois Curfman McInnes     for (l=0; l<n; l++) { /* loop over columns */
573e32f2f54SBarry Smith       if (in[l] < 0) {v++; continue;} /* SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column: %D",in[l]); */
574e32f2f54SBarry Smith       if (in[l] >= A->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column too large: col %D max %D",in[l],A->cmap->n-1);
575bfeeae90SHong Zhang       col  = in[l];
5767eb43aa7SLois Curfman McInnes       high = nrow; low = 0; /* assume unsorted */
5777eb43aa7SLois Curfman McInnes       while (high-low > 5) {
5787eb43aa7SLois Curfman McInnes         t = (low+high)/2;
5797eb43aa7SLois Curfman McInnes         if (rp[t] > col) high = t;
5807eb43aa7SLois Curfman McInnes         else low = t;
5817eb43aa7SLois Curfman McInnes       }
5827eb43aa7SLois Curfman McInnes       for (i=low; i<high; i++) {
5837eb43aa7SLois Curfman McInnes         if (rp[i] > col) break;
5847eb43aa7SLois Curfman McInnes         if (rp[i] == col) {
585b49de8d1SLois Curfman McInnes           *v++ = ap[i];
5867eb43aa7SLois Curfman McInnes           goto finished;
5877eb43aa7SLois Curfman McInnes         }
5887eb43aa7SLois Curfman McInnes       }
58997e567efSBarry Smith       *v++ = 0.0;
5907eb43aa7SLois Curfman McInnes finished:;
5917eb43aa7SLois Curfman McInnes     }
5927eb43aa7SLois Curfman McInnes   }
5933a40ed3dSBarry Smith   PetscFunctionReturn(0);
5947eb43aa7SLois Curfman McInnes }
5957eb43aa7SLois Curfman McInnes 
5963ea6fe3dSLisandro Dalcin PetscErrorCode MatView_SeqAIJ_Binary(Mat mat,PetscViewer viewer)
59717ab2063SBarry Smith {
5983ea6fe3dSLisandro Dalcin   Mat_SeqAIJ     *A = (Mat_SeqAIJ*)mat->data;
5993ea6fe3dSLisandro Dalcin   PetscInt       header[4],M,N,m,nz,i;
6003ea6fe3dSLisandro Dalcin   PetscInt       *rowlens;
6016849ba73SBarry Smith   PetscErrorCode ierr;
60217ab2063SBarry Smith 
6033a40ed3dSBarry Smith   PetscFunctionBegin;
6043ea6fe3dSLisandro Dalcin   ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr);
6052205254eSKarl Rupp 
6063ea6fe3dSLisandro Dalcin   M  = mat->rmap->N;
6073ea6fe3dSLisandro Dalcin   N  = mat->cmap->N;
6083ea6fe3dSLisandro Dalcin   m  = mat->rmap->n;
6093ea6fe3dSLisandro Dalcin   nz = A->nz;
610416022c9SBarry Smith 
6113ea6fe3dSLisandro Dalcin   /* write matrix header */
6123ea6fe3dSLisandro Dalcin   header[0] = MAT_FILE_CLASSID;
6133ea6fe3dSLisandro Dalcin   header[1] = M; header[2] = N; header[3] = nz;
6143ea6fe3dSLisandro Dalcin   ierr = PetscViewerBinaryWrite(viewer,header,4,PETSC_INT);CHKERRQ(ierr);
615416022c9SBarry Smith 
6163ea6fe3dSLisandro Dalcin   /* fill in and store row lengths */
6173ea6fe3dSLisandro Dalcin   ierr = PetscMalloc1(m,&rowlens);CHKERRQ(ierr);
6183ea6fe3dSLisandro Dalcin   for (i=0; i<m; i++) rowlens[i] = A->i[i+1] - A->i[i];
6193ea6fe3dSLisandro Dalcin   ierr = PetscViewerBinaryWrite(viewer,rowlens,m,PETSC_INT);CHKERRQ(ierr);
6203ea6fe3dSLisandro Dalcin   ierr = PetscFree(rowlens);CHKERRQ(ierr);
6213ea6fe3dSLisandro Dalcin   /* store column indices */
6223ea6fe3dSLisandro Dalcin   ierr = PetscViewerBinaryWrite(viewer,A->j,nz,PETSC_INT);CHKERRQ(ierr);
623416022c9SBarry Smith   /* store nonzero values */
6243ea6fe3dSLisandro Dalcin   ierr = PetscViewerBinaryWrite(viewer,A->a,nz,PETSC_SCALAR);CHKERRQ(ierr);
625b37d52dbSMark F. Adams 
6263ea6fe3dSLisandro Dalcin   /* write block size option to the viewer's .info file */
6273ea6fe3dSLisandro Dalcin   ierr = MatView_Binary_BlockSizes(mat,viewer);CHKERRQ(ierr);
6283a40ed3dSBarry Smith   PetscFunctionReturn(0);
62917ab2063SBarry Smith }
630416022c9SBarry Smith 
6317dc0baabSHong Zhang static PetscErrorCode MatView_SeqAIJ_ASCII_structonly(Mat A,PetscViewer viewer)
6327dc0baabSHong Zhang {
6337dc0baabSHong Zhang   PetscErrorCode ierr;
6347dc0baabSHong Zhang   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
6357dc0baabSHong Zhang   PetscInt       i,k,m=A->rmap->N;
6367dc0baabSHong Zhang 
6377dc0baabSHong Zhang   PetscFunctionBegin;
6387dc0baabSHong Zhang   ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
6397dc0baabSHong Zhang   for (i=0; i<m; i++) {
6407dc0baabSHong Zhang     ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr);
6417dc0baabSHong Zhang     for (k=a->i[i]; k<a->i[i+1]; k++) {
6427dc0baabSHong Zhang       ierr = PetscViewerASCIIPrintf(viewer," (%D) ",a->j[k]);CHKERRQ(ierr);
6437dc0baabSHong Zhang     }
6447dc0baabSHong Zhang     ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
6457dc0baabSHong Zhang   }
6467dc0baabSHong Zhang   ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
6477dc0baabSHong Zhang   PetscFunctionReturn(0);
6487dc0baabSHong Zhang }
6497dc0baabSHong Zhang 
65009573ac7SBarry Smith extern PetscErrorCode MatSeqAIJFactorInfo_Matlab(Mat,PetscViewer);
651cd155464SBarry Smith 
652dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_ASCII(Mat A,PetscViewer viewer)
653416022c9SBarry Smith {
654416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
655dfbe8321SBarry Smith   PetscErrorCode    ierr;
65660e0710aSBarry Smith   PetscInt          i,j,m = A->rmap->n;
657e060cb09SBarry Smith   const char        *name;
658f3ef73ceSBarry Smith   PetscViewerFormat format;
65917ab2063SBarry Smith 
6603a40ed3dSBarry Smith   PetscFunctionBegin;
6617dc0baabSHong Zhang   if (A->structure_only) {
6627dc0baabSHong Zhang     ierr = MatView_SeqAIJ_ASCII_structonly(A,viewer);CHKERRQ(ierr);
6637dc0baabSHong Zhang     PetscFunctionReturn(0);
6647dc0baabSHong Zhang   }
66543e49210SHong Zhang 
666b0a32e0cSBarry Smith   ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr);
66771c2f376SKris Buschelman   if (format == PETSC_VIEWER_ASCII_MATLAB) {
66897f1f81fSBarry Smith     PetscInt nofinalvalue = 0;
66960e0710aSBarry Smith     if (m && ((a->i[m] == a->i[m-1]) || (a->j[a->nz-1] != A->cmap->n-1))) {
670c337ccceSJed Brown       /* Need a dummy value to ensure the dimension of the matrix. */
671d00d2cf4SBarry Smith       nofinalvalue = 1;
672d00d2cf4SBarry Smith     }
673d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
674d0f46423SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"%% Size = %D %D \n",m,A->cmap->n);CHKERRQ(ierr);
67577431f27SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"%% Nonzeros = %D \n",a->nz);CHKERRQ(ierr);
676fbfe6fa7SJed Brown #if defined(PETSC_USE_COMPLEX)
677fbfe6fa7SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,4);\n",a->nz+nofinalvalue);CHKERRQ(ierr);
678fbfe6fa7SJed Brown #else
67977431f27SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"zzz = zeros(%D,3);\n",a->nz+nofinalvalue);CHKERRQ(ierr);
680fbfe6fa7SJed Brown #endif
681b0a32e0cSBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"zzz = [\n");CHKERRQ(ierr);
68217ab2063SBarry Smith 
68317ab2063SBarry Smith     for (i=0; i<m; i++) {
68460e0710aSBarry Smith       for (j=a->i[i]; j<a->i[i+1]; j++) {
685aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
686a9bf72d8SJed Brown         ierr = PetscViewerASCIIPrintf(viewer,"%D %D  %18.16e %18.16e\n",i+1,a->j[j]+1,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
68717ab2063SBarry Smith #else
68860e0710aSBarry Smith         ierr = PetscViewerASCIIPrintf(viewer,"%D %D  %18.16e\n",i+1,a->j[j]+1,(double)a->a[j]);CHKERRQ(ierr);
68917ab2063SBarry Smith #endif
69017ab2063SBarry Smith       }
69117ab2063SBarry Smith     }
692d00d2cf4SBarry Smith     if (nofinalvalue) {
693c337ccceSJed Brown #if defined(PETSC_USE_COMPLEX)
694c337ccceSJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"%D %D  %18.16e %18.16e\n",m,A->cmap->n,0.,0.);CHKERRQ(ierr);
695c337ccceSJed Brown #else
696d0f46423SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"%D %D  %18.16e\n",m,A->cmap->n,0.0);CHKERRQ(ierr);
697c337ccceSJed Brown #endif
698d00d2cf4SBarry Smith     }
699317d6ea6SBarry Smith     ierr = PetscObjectGetName((PetscObject)A,&name);CHKERRQ(ierr);
700fb9695e5SSatish Balay     ierr = PetscViewerASCIIPrintf(viewer,"];\n %s = spconvert(zzz);\n",name);CHKERRQ(ierr);
701d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
7022950ac48SStefano Zampini   } else if (format == PETSC_VIEWER_ASCII_FACTOR_INFO || format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) {
703cd155464SBarry Smith     PetscFunctionReturn(0);
704fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_COMMON) {
705d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
70644cd7ae7SLois Curfman McInnes     for (i=0; i<m; i++) {
70777431f27SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr);
70860e0710aSBarry Smith       for (j=a->i[i]; j<a->i[i+1]; j++) {
709aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
71036db0b34SBarry Smith         if (PetscImaginaryPart(a->a[j]) > 0.0 && PetscRealPart(a->a[j]) != 0.0) {
71160e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
71236db0b34SBarry Smith         } else if (PetscImaginaryPart(a->a[j]) < 0.0 && PetscRealPart(a->a[j]) != 0.0) {
71360e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
71436db0b34SBarry Smith         } else if (PetscRealPart(a->a[j]) != 0.0) {
71560e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr);
7166831982aSBarry Smith         }
71744cd7ae7SLois Curfman McInnes #else
71860e0710aSBarry Smith         if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr);}
71944cd7ae7SLois Curfman McInnes #endif
72044cd7ae7SLois Curfman McInnes       }
721b0a32e0cSBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
72244cd7ae7SLois Curfman McInnes     }
723d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
724fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_SYMMODU) {
72597f1f81fSBarry Smith     PetscInt nzd=0,fshift=1,*sptr;
726d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
727854ce69bSBarry Smith     ierr = PetscMalloc1(m+1,&sptr);CHKERRQ(ierr);
728496be53dSLois Curfman McInnes     for (i=0; i<m; i++) {
729496be53dSLois Curfman McInnes       sptr[i] = nzd+1;
73060e0710aSBarry Smith       for (j=a->i[i]; j<a->i[i+1]; j++) {
731496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
732aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
73336db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) nzd++;
734496be53dSLois Curfman McInnes #else
735496be53dSLois Curfman McInnes           if (a->a[j] != 0.0) nzd++;
736496be53dSLois Curfman McInnes #endif
737496be53dSLois Curfman McInnes         }
738496be53dSLois Curfman McInnes       }
739496be53dSLois Curfman McInnes     }
7402e44a96cSLois Curfman McInnes     sptr[m] = nzd+1;
74177431f27SBarry Smith     ierr    = PetscViewerASCIIPrintf(viewer," %D %D\n\n",m,nzd);CHKERRQ(ierr);
7422e44a96cSLois Curfman McInnes     for (i=0; i<m+1; i+=6) {
7432205254eSKarl Rupp       if (i+4<m) {
7442205254eSKarl Rupp         ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4],sptr[i+5]);CHKERRQ(ierr);
7452205254eSKarl Rupp       } else if (i+3<m) {
7462205254eSKarl Rupp         ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3],sptr[i+4]);CHKERRQ(ierr);
7472205254eSKarl Rupp       } else if (i+2<m) {
7482205254eSKarl Rupp         ierr = PetscViewerASCIIPrintf(viewer," %D %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2],sptr[i+3]);CHKERRQ(ierr);
7492205254eSKarl Rupp       } else if (i+1<m) {
7502205254eSKarl Rupp         ierr = PetscViewerASCIIPrintf(viewer," %D %D %D\n",sptr[i],sptr[i+1],sptr[i+2]);CHKERRQ(ierr);
7512205254eSKarl Rupp       } else if (i<m) {
7522205254eSKarl Rupp         ierr = PetscViewerASCIIPrintf(viewer," %D %D\n",sptr[i],sptr[i+1]);CHKERRQ(ierr);
7532205254eSKarl Rupp       } else {
7542205254eSKarl Rupp         ierr = PetscViewerASCIIPrintf(viewer," %D\n",sptr[i]);CHKERRQ(ierr);
7552205254eSKarl Rupp       }
756496be53dSLois Curfman McInnes     }
757b0a32e0cSBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
758606d414cSSatish Balay     ierr = PetscFree(sptr);CHKERRQ(ierr);
759496be53dSLois Curfman McInnes     for (i=0; i<m; i++) {
76060e0710aSBarry Smith       for (j=a->i[i]; j<a->i[i+1]; j++) {
76177431f27SBarry Smith         if (a->j[j] >= i) {ierr = PetscViewerASCIIPrintf(viewer," %D ",a->j[j]+fshift);CHKERRQ(ierr);}
762496be53dSLois Curfman McInnes       }
763b0a32e0cSBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
764496be53dSLois Curfman McInnes     }
765b0a32e0cSBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
766496be53dSLois Curfman McInnes     for (i=0; i<m; i++) {
76760e0710aSBarry Smith       for (j=a->i[i]; j<a->i[i+1]; j++) {
768496be53dSLois Curfman McInnes         if (a->j[j] >= i) {
769aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
77036db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) != 0.0 || PetscRealPart(a->a[j]) != 0.0) {
77160e0710aSBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," %18.16e %18.16e ",(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
7726831982aSBarry Smith           }
773496be53dSLois Curfman McInnes #else
77460e0710aSBarry Smith           if (a->a[j] != 0.0) {ierr = PetscViewerASCIIPrintf(viewer," %18.16e ",(double)a->a[j]);CHKERRQ(ierr);}
775496be53dSLois Curfman McInnes #endif
776496be53dSLois Curfman McInnes         }
777496be53dSLois Curfman McInnes       }
778b0a32e0cSBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
779496be53dSLois Curfman McInnes     }
780d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
781fb9695e5SSatish Balay   } else if (format == PETSC_VIEWER_ASCII_DENSE) {
78297f1f81fSBarry Smith     PetscInt    cnt = 0,jcnt;
78387828ca2SBarry Smith     PetscScalar value;
78468f1ed48SBarry Smith #if defined(PETSC_USE_COMPLEX)
78568f1ed48SBarry Smith     PetscBool   realonly = PETSC_TRUE;
78668f1ed48SBarry Smith 
78768f1ed48SBarry Smith     for (i=0; i<a->i[m]; i++) {
78868f1ed48SBarry Smith       if (PetscImaginaryPart(a->a[i]) != 0.0) {
78968f1ed48SBarry Smith         realonly = PETSC_FALSE;
79068f1ed48SBarry Smith         break;
79168f1ed48SBarry Smith       }
79268f1ed48SBarry Smith     }
79368f1ed48SBarry Smith #endif
79402594712SBarry Smith 
795d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
79602594712SBarry Smith     for (i=0; i<m; i++) {
79702594712SBarry Smith       jcnt = 0;
798d0f46423SBarry Smith       for (j=0; j<A->cmap->n; j++) {
799e24b481bSBarry Smith         if (jcnt < a->i[i+1]-a->i[i] && j == a->j[cnt]) {
80002594712SBarry Smith           value = a->a[cnt++];
801e24b481bSBarry Smith           jcnt++;
80202594712SBarry Smith         } else {
80302594712SBarry Smith           value = 0.0;
80402594712SBarry Smith         }
805aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
80668f1ed48SBarry Smith         if (realonly) {
80760e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)PetscRealPart(value));CHKERRQ(ierr);
80868f1ed48SBarry Smith         } else {
80960e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," %7.5e+%7.5e i ",(double)PetscRealPart(value),(double)PetscImaginaryPart(value));CHKERRQ(ierr);
81068f1ed48SBarry Smith         }
81102594712SBarry Smith #else
81260e0710aSBarry Smith         ierr = PetscViewerASCIIPrintf(viewer," %7.5e ",(double)value);CHKERRQ(ierr);
81302594712SBarry Smith #endif
81402594712SBarry Smith       }
815b0a32e0cSBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
81602594712SBarry Smith     }
817d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
8183c215bfdSMatthew Knepley   } else if (format == PETSC_VIEWER_ASCII_MATRIXMARKET) {
819150b93efSMatthew G. Knepley     PetscInt fshift=1;
820d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
8213c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
82219303e72SJonathan Guyer     ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate complex general\n");CHKERRQ(ierr);
8233c215bfdSMatthew Knepley #else
82419303e72SJonathan Guyer     ierr = PetscViewerASCIIPrintf(viewer,"%%%%MatrixMarket matrix coordinate real general\n");CHKERRQ(ierr);
8253c215bfdSMatthew Knepley #endif
826d0f46423SBarry Smith     ierr = PetscViewerASCIIPrintf(viewer,"%D %D %D\n", m, A->cmap->n, a->nz);CHKERRQ(ierr);
8273c215bfdSMatthew Knepley     for (i=0; i<m; i++) {
82860e0710aSBarry Smith       for (j=a->i[i]; j<a->i[i+1]; j++) {
8293c215bfdSMatthew Knepley #if defined(PETSC_USE_COMPLEX)
830a9a0e077SKarl Rupp         ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g %g\n", i+fshift,a->j[j]+fshift,(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
8313c215bfdSMatthew Knepley #else
832150b93efSMatthew G. Knepley         ierr = PetscViewerASCIIPrintf(viewer,"%D %D %g\n", i+fshift, a->j[j]+fshift, (double)a->a[j]);CHKERRQ(ierr);
8333c215bfdSMatthew Knepley #endif
8343c215bfdSMatthew Knepley       }
8353c215bfdSMatthew Knepley     }
836d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
8373a40ed3dSBarry Smith   } else {
838d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
839d5f3da31SBarry Smith     if (A->factortype) {
84016cd7e1dSShri Abhyankar       for (i=0; i<m; i++) {
84116cd7e1dSShri Abhyankar         ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr);
84216cd7e1dSShri Abhyankar         /* L part */
84360e0710aSBarry Smith         for (j=a->i[i]; j<a->i[i+1]; j++) {
84416cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
84516cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
84660e0710aSBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
84716cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
8486712e2f1SBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr);
84916cd7e1dSShri Abhyankar           } else {
85060e0710aSBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr);
85116cd7e1dSShri Abhyankar           }
85216cd7e1dSShri Abhyankar #else
85360e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr);
85416cd7e1dSShri Abhyankar #endif
85516cd7e1dSShri Abhyankar         }
85616cd7e1dSShri Abhyankar         /* diagonal */
85716cd7e1dSShri Abhyankar         j = a->diag[i];
85816cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
85916cd7e1dSShri Abhyankar         if (PetscImaginaryPart(a->a[j]) > 0.0) {
86060e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)PetscImaginaryPart(1.0/a->a[j]));CHKERRQ(ierr);
86116cd7e1dSShri Abhyankar         } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
8626712e2f1SBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(1.0/a->a[j]),(double)(-PetscImaginaryPart(1.0/a->a[j])));CHKERRQ(ierr);
86316cd7e1dSShri Abhyankar         } else {
86460e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(1.0/a->a[j]));CHKERRQ(ierr);
86516cd7e1dSShri Abhyankar         }
86616cd7e1dSShri Abhyankar #else
86760e0710aSBarry Smith         ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)(1.0/a->a[j]));CHKERRQ(ierr);
86816cd7e1dSShri Abhyankar #endif
86916cd7e1dSShri Abhyankar 
87016cd7e1dSShri Abhyankar         /* U part */
87160e0710aSBarry Smith         for (j=a->diag[i+1]+1; j<a->diag[i]; j++) {
87216cd7e1dSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
87316cd7e1dSShri Abhyankar           if (PetscImaginaryPart(a->a[j]) > 0.0) {
87460e0710aSBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
87516cd7e1dSShri Abhyankar           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
87622ab088eSBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)(-PetscImaginaryPart(a->a[j])));CHKERRQ(ierr);
87716cd7e1dSShri Abhyankar           } else {
87860e0710aSBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr);
87916cd7e1dSShri Abhyankar           }
88016cd7e1dSShri Abhyankar #else
88160e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr);
88216cd7e1dSShri Abhyankar #endif
88316cd7e1dSShri Abhyankar         }
88416cd7e1dSShri Abhyankar         ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
88516cd7e1dSShri Abhyankar       }
88616cd7e1dSShri Abhyankar     } else {
88717ab2063SBarry Smith       for (i=0; i<m; i++) {
88877431f27SBarry Smith         ierr = PetscViewerASCIIPrintf(viewer,"row %D:",i);CHKERRQ(ierr);
88960e0710aSBarry Smith         for (j=a->i[i]; j<a->i[i+1]; j++) {
890aa482453SBarry Smith #if defined(PETSC_USE_COMPLEX)
89136db0b34SBarry Smith           if (PetscImaginaryPart(a->a[j]) > 0.0) {
89260e0710aSBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," (%D, %g + %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
89336db0b34SBarry Smith           } else if (PetscImaginaryPart(a->a[j]) < 0.0) {
89460e0710aSBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," (%D, %g - %g i)",a->j[j],(double)PetscRealPart(a->a[j]),(double)-PetscImaginaryPart(a->a[j]));CHKERRQ(ierr);
8953a40ed3dSBarry Smith           } else {
89660e0710aSBarry Smith             ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)PetscRealPart(a->a[j]));CHKERRQ(ierr);
89717ab2063SBarry Smith           }
89817ab2063SBarry Smith #else
89960e0710aSBarry Smith           ierr = PetscViewerASCIIPrintf(viewer," (%D, %g) ",a->j[j],(double)a->a[j]);CHKERRQ(ierr);
90017ab2063SBarry Smith #endif
90117ab2063SBarry Smith         }
902b0a32e0cSBarry Smith         ierr = PetscViewerASCIIPrintf(viewer,"\n");CHKERRQ(ierr);
90317ab2063SBarry Smith       }
90416cd7e1dSShri Abhyankar     }
905d00279f6SBarry Smith     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
90617ab2063SBarry Smith   }
907b0a32e0cSBarry Smith   ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
9083a40ed3dSBarry Smith   PetscFunctionReturn(0);
909416022c9SBarry Smith }
910416022c9SBarry Smith 
9119804daf3SBarry Smith #include <petscdraw.h>
912dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw_Zoom(PetscDraw draw,void *Aa)
913416022c9SBarry Smith {
914480ef9eaSBarry Smith   Mat               A  = (Mat) Aa;
915416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
916dfbe8321SBarry Smith   PetscErrorCode    ierr;
917383922c3SLisandro Dalcin   PetscInt          i,j,m = A->rmap->n;
918383922c3SLisandro Dalcin   int               color;
919b05fc000SLisandro Dalcin   PetscReal         xl,yl,xr,yr,x_l,x_r,y_l,y_r;
920b0a32e0cSBarry Smith   PetscViewer       viewer;
921f3ef73ceSBarry Smith   PetscViewerFormat format;
922cddf8d76SBarry Smith 
9233a40ed3dSBarry Smith   PetscFunctionBegin;
924480ef9eaSBarry Smith   ierr = PetscObjectQuery((PetscObject)A,"Zoomviewer",(PetscObject*)&viewer);CHKERRQ(ierr);
925b0a32e0cSBarry Smith   ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr);
926b0a32e0cSBarry Smith   ierr = PetscDrawGetCoordinates(draw,&xl,&yl,&xr,&yr);CHKERRQ(ierr);
927383922c3SLisandro Dalcin 
928416022c9SBarry Smith   /* loop over matrix elements drawing boxes */
9290513a670SBarry Smith 
930fb9695e5SSatish Balay   if (format != PETSC_VIEWER_DRAW_CONTOUR) {
931383922c3SLisandro Dalcin     ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr);
9320513a670SBarry Smith     /* Blue for negative, Cyan for zero and  Red for positive */
933b0a32e0cSBarry Smith     color = PETSC_DRAW_BLUE;
934416022c9SBarry Smith     for (i=0; i<m; i++) {
935cddf8d76SBarry Smith       y_l = m - i - 1.0; y_r = y_l + 1.0;
936bfeeae90SHong Zhang       for (j=a->i[i]; j<a->i[i+1]; j++) {
937bfeeae90SHong Zhang         x_l = a->j[j]; x_r = x_l + 1.0;
93836db0b34SBarry Smith         if (PetscRealPart(a->a[j]) >=  0.) continue;
939b0a32e0cSBarry Smith         ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr);
940cddf8d76SBarry Smith       }
941cddf8d76SBarry Smith     }
942b0a32e0cSBarry Smith     color = PETSC_DRAW_CYAN;
943cddf8d76SBarry Smith     for (i=0; i<m; i++) {
944cddf8d76SBarry Smith       y_l = m - i - 1.0; y_r = y_l + 1.0;
945bfeeae90SHong Zhang       for (j=a->i[i]; j<a->i[i+1]; j++) {
946bfeeae90SHong Zhang         x_l = a->j[j]; x_r = x_l + 1.0;
947cddf8d76SBarry Smith         if (a->a[j] !=  0.) continue;
948b0a32e0cSBarry Smith         ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr);
949cddf8d76SBarry Smith       }
950cddf8d76SBarry Smith     }
951b0a32e0cSBarry Smith     color = PETSC_DRAW_RED;
952cddf8d76SBarry Smith     for (i=0; i<m; i++) {
953cddf8d76SBarry Smith       y_l = m - i - 1.0; y_r = y_l + 1.0;
954bfeeae90SHong Zhang       for (j=a->i[i]; j<a->i[i+1]; j++) {
955bfeeae90SHong Zhang         x_l = a->j[j]; x_r = x_l + 1.0;
95636db0b34SBarry Smith         if (PetscRealPart(a->a[j]) <=  0.) continue;
957b0a32e0cSBarry Smith         ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr);
958416022c9SBarry Smith       }
959416022c9SBarry Smith     }
960383922c3SLisandro Dalcin     ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr);
9610513a670SBarry Smith   } else {
9620513a670SBarry Smith     /* use contour shading to indicate magnitude of values */
9630513a670SBarry Smith     /* first determine max of all nonzero values */
964b05fc000SLisandro Dalcin     PetscReal minv = 0.0, maxv = 0.0;
965383922c3SLisandro Dalcin     PetscInt  nz = a->nz, count = 0;
966b0a32e0cSBarry Smith     PetscDraw popup;
9670513a670SBarry Smith 
9680513a670SBarry Smith     for (i=0; i<nz; i++) {
9690513a670SBarry Smith       if (PetscAbsScalar(a->a[i]) > maxv) maxv = PetscAbsScalar(a->a[i]);
9700513a670SBarry Smith     }
971383922c3SLisandro Dalcin     if (minv >= maxv) maxv = minv + PETSC_SMALL;
972b0a32e0cSBarry Smith     ierr = PetscDrawGetPopup(draw,&popup);CHKERRQ(ierr);
97345f3bb6eSLisandro Dalcin     ierr = PetscDrawScalePopup(popup,minv,maxv);CHKERRQ(ierr);
974383922c3SLisandro Dalcin 
975383922c3SLisandro Dalcin     ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr);
9760513a670SBarry Smith     for (i=0; i<m; i++) {
977383922c3SLisandro Dalcin       y_l = m - i - 1.0;
978383922c3SLisandro Dalcin       y_r = y_l + 1.0;
979bfeeae90SHong Zhang       for (j=a->i[i]; j<a->i[i+1]; j++) {
980383922c3SLisandro Dalcin         x_l = a->j[j];
981383922c3SLisandro Dalcin         x_r = x_l + 1.0;
982b05fc000SLisandro Dalcin         color = PetscDrawRealToColor(PetscAbsScalar(a->a[count]),minv,maxv);
983b0a32e0cSBarry Smith         ierr = PetscDrawRectangle(draw,x_l,y_l,x_r,y_r,color,color,color,color);CHKERRQ(ierr);
9840513a670SBarry Smith         count++;
9850513a670SBarry Smith       }
9860513a670SBarry Smith     }
987383922c3SLisandro Dalcin     ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr);
9880513a670SBarry Smith   }
989480ef9eaSBarry Smith   PetscFunctionReturn(0);
990480ef9eaSBarry Smith }
991cddf8d76SBarry Smith 
9929804daf3SBarry Smith #include <petscdraw.h>
993dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ_Draw(Mat A,PetscViewer viewer)
994480ef9eaSBarry Smith {
995dfbe8321SBarry Smith   PetscErrorCode ierr;
996b0a32e0cSBarry Smith   PetscDraw      draw;
99736db0b34SBarry Smith   PetscReal      xr,yr,xl,yl,h,w;
998ace3abfcSBarry Smith   PetscBool      isnull;
999480ef9eaSBarry Smith 
1000480ef9eaSBarry Smith   PetscFunctionBegin;
1001b0a32e0cSBarry Smith   ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr);
1002b0a32e0cSBarry Smith   ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr);
1003480ef9eaSBarry Smith   if (isnull) PetscFunctionReturn(0);
1004480ef9eaSBarry Smith 
1005d0f46423SBarry Smith   xr   = A->cmap->n; yr  = A->rmap->n; h = yr/10.0; w = xr/10.0;
1006480ef9eaSBarry Smith   xr  += w;          yr += h;         xl = -w;     yl = -h;
1007b0a32e0cSBarry Smith   ierr = PetscDrawSetCoordinates(draw,xl,yl,xr,yr);CHKERRQ(ierr);
1008832b7cebSLisandro Dalcin   ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",(PetscObject)viewer);CHKERRQ(ierr);
1009b0a32e0cSBarry Smith   ierr = PetscDrawZoom(draw,MatView_SeqAIJ_Draw_Zoom,A);CHKERRQ(ierr);
10100298fd71SBarry Smith   ierr = PetscObjectCompose((PetscObject)A,"Zoomviewer",NULL);CHKERRQ(ierr);
1011832b7cebSLisandro Dalcin   ierr = PetscDrawSave(draw);CHKERRQ(ierr);
10123a40ed3dSBarry Smith   PetscFunctionReturn(0);
1013416022c9SBarry Smith }
1014416022c9SBarry Smith 
1015dfbe8321SBarry Smith PetscErrorCode MatView_SeqAIJ(Mat A,PetscViewer viewer)
1016416022c9SBarry Smith {
1017dfbe8321SBarry Smith   PetscErrorCode ierr;
1018ace3abfcSBarry Smith   PetscBool      iascii,isbinary,isdraw;
1019416022c9SBarry Smith 
10203a40ed3dSBarry Smith   PetscFunctionBegin;
1021251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr);
1022251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr);
1023251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr);
1024c45a1595SBarry Smith   if (iascii) {
10253a40ed3dSBarry Smith     ierr = MatView_SeqAIJ_ASCII(A,viewer);CHKERRQ(ierr);
10260f5bd95cSBarry Smith   } else if (isbinary) {
10273a40ed3dSBarry Smith     ierr = MatView_SeqAIJ_Binary(A,viewer);CHKERRQ(ierr);
10280f5bd95cSBarry Smith   } else if (isdraw) {
10293a40ed3dSBarry Smith     ierr = MatView_SeqAIJ_Draw(A,viewer);CHKERRQ(ierr);
103011aeaf0aSBarry Smith   }
10314108e4d5SBarry Smith   ierr = MatView_SeqAIJ_Inode(A,viewer);CHKERRQ(ierr);
10323a40ed3dSBarry Smith   PetscFunctionReturn(0);
103317ab2063SBarry Smith }
103419bcc07fSBarry Smith 
1035dfbe8321SBarry Smith PetscErrorCode MatAssemblyEnd_SeqAIJ(Mat A,MatAssemblyType mode)
103617ab2063SBarry Smith {
1037416022c9SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
10386849ba73SBarry Smith   PetscErrorCode ierr;
1039580bdb30SBarry Smith   PetscInt       fshift = 0,i,*ai = a->i,*aj = a->j,*imax = a->imax;
1040d0f46423SBarry Smith   PetscInt       m      = A->rmap->n,*ip,N,*ailen = a->ilen,rmax = 0;
104154f21887SBarry Smith   MatScalar      *aa    = a->a,*ap;
10423447b6efSHong Zhang   PetscReal      ratio  = 0.6;
104317ab2063SBarry Smith 
10443a40ed3dSBarry Smith   PetscFunctionBegin;
10453a40ed3dSBarry Smith   if (mode == MAT_FLUSH_ASSEMBLY) PetscFunctionReturn(0);
1046071fcb05SBarry Smith   ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr);
1047071fcb05SBarry Smith   if (A->was_assembled && A->ass_nonzerostate == A->nonzerostate) PetscFunctionReturn(0);
104817ab2063SBarry Smith 
104943ee02c3SBarry Smith   if (m) rmax = ailen[0]; /* determine row with most nonzeros */
105017ab2063SBarry Smith   for (i=1; i<m; i++) {
1051416022c9SBarry Smith     /* move each row back by the amount of empty slots (fshift) before it*/
105217ab2063SBarry Smith     fshift += imax[i-1] - ailen[i-1];
105394a9d846SBarry Smith     rmax    = PetscMax(rmax,ailen[i]);
105417ab2063SBarry Smith     if (fshift) {
1055bfeeae90SHong Zhang       ip = aj + ai[i];
1056bfeeae90SHong Zhang       ap = aa + ai[i];
105717ab2063SBarry Smith       N  = ailen[i];
1058580bdb30SBarry Smith       ierr = PetscArraymove(ip-fshift,ip,N);CHKERRQ(ierr);
1059580bdb30SBarry Smith       if (!A->structure_only) {
1060580bdb30SBarry Smith         ierr = PetscArraymove(ap-fshift,ap,N);CHKERRQ(ierr);
106117ab2063SBarry Smith       }
106217ab2063SBarry Smith     }
106317ab2063SBarry Smith     ai[i] = ai[i-1] + ailen[i-1];
106417ab2063SBarry Smith   }
106517ab2063SBarry Smith   if (m) {
106617ab2063SBarry Smith     fshift += imax[m-1] - ailen[m-1];
106717ab2063SBarry Smith     ai[m]   = ai[m-1] + ailen[m-1];
106817ab2063SBarry Smith   }
10697b083b7cSBarry Smith 
107017ab2063SBarry Smith   /* reset ilen and imax for each row */
10717b083b7cSBarry Smith   a->nonzerorowcnt = 0;
1072396832f4SHong Zhang   if (A->structure_only) {
1073071fcb05SBarry Smith     ierr = PetscFree(a->imax);CHKERRQ(ierr);
1074071fcb05SBarry Smith     ierr = PetscFree(a->ilen);CHKERRQ(ierr);
1075396832f4SHong Zhang   } else { /* !A->structure_only */
107617ab2063SBarry Smith     for (i=0; i<m; i++) {
107717ab2063SBarry Smith       ailen[i] = imax[i] = ai[i+1] - ai[i];
10787b083b7cSBarry Smith       a->nonzerorowcnt += ((ai[i+1] - ai[i]) > 0);
107917ab2063SBarry Smith     }
1080396832f4SHong Zhang   }
1081bfeeae90SHong Zhang   a->nz = ai[m];
108265e19b50SBarry Smith   if (fshift && a->nounused == -1) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB, "Unused space detected in matrix: %D X %D, %D unneeded", m, A->cmap->n, fshift);
108317ab2063SBarry Smith 
108409f38230SBarry Smith   ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr);
1085d0f46423SBarry Smith   ierr = PetscInfo4(A,"Matrix size: %D X %D; storage space: %D unneeded,%D used\n",m,A->cmap->n,fshift,a->nz);CHKERRQ(ierr);
1086ae15b995SBarry Smith   ierr = PetscInfo1(A,"Number of mallocs during MatSetValues() is %D\n",a->reallocs);CHKERRQ(ierr);
1087ae15b995SBarry Smith   ierr = PetscInfo1(A,"Maximum nonzeros in any row is %D\n",rmax);CHKERRQ(ierr);
10882205254eSKarl Rupp 
10898e58a170SBarry Smith   A->info.mallocs    += a->reallocs;
1090dd5f02e7SSatish Balay   a->reallocs         = 0;
10916712e2f1SBarry Smith   A->info.nz_unneeded = (PetscReal)fshift;
109236db0b34SBarry Smith   a->rmax             = rmax;
10934e220ebcSLois Curfman McInnes 
1094396832f4SHong Zhang   if (!A->structure_only) {
109511e456e1SBarry Smith     ierr = MatCheckCompressedRow(A,a->nonzerorowcnt,&a->compressedrow,a->i,m,ratio);CHKERRQ(ierr);
1096396832f4SHong Zhang   }
10974108e4d5SBarry Smith   ierr = MatAssemblyEnd_SeqAIJ_Inode(A,mode);CHKERRQ(ierr);
10983a40ed3dSBarry Smith   PetscFunctionReturn(0);
109917ab2063SBarry Smith }
110017ab2063SBarry Smith 
110199cafbc1SBarry Smith PetscErrorCode MatRealPart_SeqAIJ(Mat A)
110299cafbc1SBarry Smith {
110399cafbc1SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
110499cafbc1SBarry Smith   PetscInt       i,nz = a->nz;
110554f21887SBarry Smith   MatScalar      *aa = a->a;
1106acf2f550SJed Brown   PetscErrorCode ierr;
110799cafbc1SBarry Smith 
110899cafbc1SBarry Smith   PetscFunctionBegin;
110999cafbc1SBarry Smith   for (i=0; i<nz; i++) aa[i] = PetscRealPart(aa[i]);
1110acf2f550SJed Brown   ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr);
1111e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
1112c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU;
1113e2cf4d64SStefano Zampini #endif
111499cafbc1SBarry Smith   PetscFunctionReturn(0);
111599cafbc1SBarry Smith }
111699cafbc1SBarry Smith 
111799cafbc1SBarry Smith PetscErrorCode MatImaginaryPart_SeqAIJ(Mat A)
111899cafbc1SBarry Smith {
111999cafbc1SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
112099cafbc1SBarry Smith   PetscInt       i,nz = a->nz;
112154f21887SBarry Smith   MatScalar      *aa = a->a;
1122acf2f550SJed Brown   PetscErrorCode ierr;
112399cafbc1SBarry Smith 
112499cafbc1SBarry Smith   PetscFunctionBegin;
112599cafbc1SBarry Smith   for (i=0; i<nz; i++) aa[i] = PetscImaginaryPart(aa[i]);
1126acf2f550SJed Brown   ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr);
1127e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
1128c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU;
1129e2cf4d64SStefano Zampini #endif
113099cafbc1SBarry Smith   PetscFunctionReturn(0);
113199cafbc1SBarry Smith }
113299cafbc1SBarry Smith 
1133dfbe8321SBarry Smith PetscErrorCode MatZeroEntries_SeqAIJ(Mat A)
113417ab2063SBarry Smith {
1135416022c9SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
1136dfbe8321SBarry Smith   PetscErrorCode ierr;
11373a40ed3dSBarry Smith 
11383a40ed3dSBarry Smith   PetscFunctionBegin;
1139580bdb30SBarry Smith   ierr = PetscArrayzero(a->a,a->i[A->rmap->n]);CHKERRQ(ierr);
1140acf2f550SJed Brown   ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr);
1141e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
1142c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU;
1143e2cf4d64SStefano Zampini #endif
11443a40ed3dSBarry Smith   PetscFunctionReturn(0);
114517ab2063SBarry Smith }
1146416022c9SBarry Smith 
1147dfbe8321SBarry Smith PetscErrorCode MatDestroy_SeqAIJ(Mat A)
114817ab2063SBarry Smith {
1149416022c9SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
1150dfbe8321SBarry Smith   PetscErrorCode ierr;
1151d5d45c9bSBarry Smith 
11523a40ed3dSBarry Smith   PetscFunctionBegin;
1153aa482453SBarry Smith #if defined(PETSC_USE_LOG)
1154d0f46423SBarry Smith   PetscLogObjectState((PetscObject)A,"Rows=%D, Cols=%D, NZ=%D",A->rmap->n,A->cmap->n,a->nz);
115517ab2063SBarry Smith #endif
1156e6b907acSBarry Smith   ierr = MatSeqXAIJFreeAIJ(A,&a->a,&a->j,&a->i);CHKERRQ(ierr);
11576bf464f9SBarry Smith   ierr = ISDestroy(&a->row);CHKERRQ(ierr);
11586bf464f9SBarry Smith   ierr = ISDestroy(&a->col);CHKERRQ(ierr);
115905b42c5fSBarry Smith   ierr = PetscFree(a->diag);CHKERRQ(ierr);
1160d48dcb14SBarry Smith   ierr = PetscFree(a->ibdiag);CHKERRQ(ierr);
1161071fcb05SBarry Smith   ierr = PetscFree(a->imax);CHKERRQ(ierr);
1162071fcb05SBarry Smith   ierr = PetscFree(a->ilen);CHKERRQ(ierr);
1163846b4da1SFande Kong   ierr = PetscFree(a->ipre);CHKERRQ(ierr);
116471f1c65dSBarry Smith   ierr = PetscFree3(a->idiag,a->mdiag,a->ssor_work);CHKERRQ(ierr);
116505b42c5fSBarry Smith   ierr = PetscFree(a->solve_work);CHKERRQ(ierr);
11666bf464f9SBarry Smith   ierr = ISDestroy(&a->icol);CHKERRQ(ierr);
116705b42c5fSBarry Smith   ierr = PetscFree(a->saved_values);CHKERRQ(ierr);
1168cd6b891eSBarry Smith   ierr = PetscFree2(a->compressedrow.i,a->compressedrow.rindex);CHKERRQ(ierr);
1169a30b2313SHong Zhang 
11704108e4d5SBarry Smith   ierr = MatDestroy_SeqAIJ_Inode(A);CHKERRQ(ierr);
1171bf0cc555SLisandro Dalcin   ierr = PetscFree(A->data);CHKERRQ(ierr);
1172901853e0SKris Buschelman 
1173*6718818eSStefano Zampini   /* MatMatMultNumeric_SeqAIJ_SeqAIJ_Sorted may allocate this.
1174*6718818eSStefano Zampini      That function is so heavily used (sometimes in an hidden way through multnumeric function pointers)
1175*6718818eSStefano Zampini      that is hard to properly add this data to the MatProduct data. We free it here to avoid
1176*6718818eSStefano Zampini      users reusing the matrix object with different data to incur in obscure segmentation faults
1177*6718818eSStefano Zampini      due to different matrix sizes */
1178*6718818eSStefano Zampini   ierr = PetscObjectCompose((PetscObject)A,"__PETSc__ab_dense",NULL);CHKERRQ(ierr);
1179*6718818eSStefano Zampini 
1180dbd8c25aSHong Zhang   ierr = PetscObjectChangeTypeName((PetscObject)A,0);CHKERRQ(ierr);
1181bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetColumnIndices_C",NULL);CHKERRQ(ierr);
1182bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatStoreValues_C",NULL);CHKERRQ(ierr);
1183bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatRetrieveValues_C",NULL);CHKERRQ(ierr);
1184bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsbaij_C",NULL);CHKERRQ(ierr);
1185bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqbaij_C",NULL);CHKERRQ(ierr);
1186bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijperm_C",NULL);CHKERRQ(ierr);
11874222ddf1SHong Zhang 
11884222ddf1SHong Zhang #if defined(PETSC_HAVE_CUDA)
11894222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcusparse_C",NULL);CHKERRQ(ierr);
11904222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatSetFromOptions_seqaijcusparse_seqaij_C",NULL);CHKERRQ(ierr);
11914222ddf1SHong Zhang #endif
11924222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqaijcrl_C",NULL);CHKERRQ(ierr);
1193af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
1194af8000cdSHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_elemental_C",NULL);CHKERRQ(ierr);
1195af8000cdSHong Zhang #endif
119663c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
119763c07aadSStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_hypre_C",NULL);CHKERRQ(ierr);
11984222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",NULL);CHKERRQ(ierr);
119963c07aadSStefano Zampini #endif
1200b49cda9fSStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqdense_C",NULL);CHKERRQ(ierr);
1201c9225affSStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_seqsell_C",NULL);CHKERRQ(ierr);
1202c9225affSStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)A,"MatConvert_seqaij_is_C",NULL);CHKERRQ(ierr);
1203bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatIsTranspose_C",NULL);CHKERRQ(ierr);
1204bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",NULL);CHKERRQ(ierr);
1205846b4da1SFande Kong   ierr = PetscObjectComposeFunction((PetscObject)A,"MatResetPreallocation_C",NULL);CHKERRQ(ierr);
1206bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatSeqAIJSetPreallocationCSR_C",NULL);CHKERRQ(ierr);
1207bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatReorderForNonzeroDiagonal_C",NULL);CHKERRQ(ierr);
12084222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_is_seqaij_C",NULL);CHKERRQ(ierr);
12094222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqdense_seqaij_C",NULL);CHKERRQ(ierr);
12104222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)A,"MatProductSetFromOptions_seqaij_seqaij_C",NULL);CHKERRQ(ierr);
12113a40ed3dSBarry Smith   PetscFunctionReturn(0);
121217ab2063SBarry Smith }
121317ab2063SBarry Smith 
1214ace3abfcSBarry Smith PetscErrorCode MatSetOption_SeqAIJ(Mat A,MatOption op,PetscBool flg)
121517ab2063SBarry Smith {
1216416022c9SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
12174846f1f5SKris Buschelman   PetscErrorCode ierr;
12183a40ed3dSBarry Smith 
12193a40ed3dSBarry Smith   PetscFunctionBegin;
1220a65d3064SKris Buschelman   switch (op) {
1221a65d3064SKris Buschelman   case MAT_ROW_ORIENTED:
12224e0d8c25SBarry Smith     a->roworiented = flg;
1223a65d3064SKris Buschelman     break;
1224a9817697SBarry Smith   case MAT_KEEP_NONZERO_PATTERN:
1225a9817697SBarry Smith     a->keepnonzeropattern = flg;
1226a65d3064SKris Buschelman     break;
1227512a5fc5SBarry Smith   case MAT_NEW_NONZERO_LOCATIONS:
1228512a5fc5SBarry Smith     a->nonew = (flg ? 0 : 1);
1229a65d3064SKris Buschelman     break;
1230a65d3064SKris Buschelman   case MAT_NEW_NONZERO_LOCATION_ERR:
12314e0d8c25SBarry Smith     a->nonew = (flg ? -1 : 0);
1232a65d3064SKris Buschelman     break;
1233a65d3064SKris Buschelman   case MAT_NEW_NONZERO_ALLOCATION_ERR:
12344e0d8c25SBarry Smith     a->nonew = (flg ? -2 : 0);
1235a65d3064SKris Buschelman     break;
123628b2fa4aSMatthew Knepley   case MAT_UNUSED_NONZERO_LOCATION_ERR:
123728b2fa4aSMatthew Knepley     a->nounused = (flg ? -1 : 0);
123828b2fa4aSMatthew Knepley     break;
1239a65d3064SKris Buschelman   case MAT_IGNORE_ZERO_ENTRIES:
12404e0d8c25SBarry Smith     a->ignorezeroentries = flg;
12410df259c2SBarry Smith     break;
12423d472b54SHong Zhang   case MAT_SPD:
1243b1646e73SJed Brown   case MAT_SYMMETRIC:
1244b1646e73SJed Brown   case MAT_STRUCTURALLY_SYMMETRIC:
1245b1646e73SJed Brown   case MAT_HERMITIAN:
1246b1646e73SJed Brown   case MAT_SYMMETRY_ETERNAL:
1247957cac9fSHong Zhang   case MAT_STRUCTURE_ONLY:
12485021d80fSJed Brown     /* These options are handled directly by MatSetOption() */
12495021d80fSJed Brown     break;
12504e0d8c25SBarry Smith   case MAT_NEW_DIAGONALS:
1251a65d3064SKris Buschelman   case MAT_IGNORE_OFF_PROC_ENTRIES:
1252a65d3064SKris Buschelman   case MAT_USE_HASH_TABLE:
1253290bbb0aSBarry Smith     ierr = PetscInfo1(A,"Option %s ignored\n",MatOptions[op]);CHKERRQ(ierr);
1254a65d3064SKris Buschelman     break;
1255b87ac2d8SJed Brown   case MAT_USE_INODES:
1256b87ac2d8SJed Brown     /* Not an error because MatSetOption_SeqAIJ_Inode handles this one */
1257b87ac2d8SJed Brown     break;
1258c10200c1SHong Zhang   case MAT_SUBMAT_SINGLEIS:
1259c10200c1SHong Zhang     A->submat_singleis = flg;
1260c10200c1SHong Zhang     break;
1261071fcb05SBarry Smith   case MAT_SORTED_FULL:
1262071fcb05SBarry Smith     if (flg) A->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
1263071fcb05SBarry Smith     else     A->ops->setvalues = MatSetValues_SeqAIJ;
1264071fcb05SBarry Smith     break;
1265a65d3064SKris Buschelman   default:
1266e32f2f54SBarry Smith     SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"unknown option %d",op);
1267a65d3064SKris Buschelman   }
12684108e4d5SBarry Smith   ierr = MatSetOption_SeqAIJ_Inode(A,op,flg);CHKERRQ(ierr);
12693a40ed3dSBarry Smith   PetscFunctionReturn(0);
127017ab2063SBarry Smith }
127117ab2063SBarry Smith 
1272dfbe8321SBarry Smith PetscErrorCode MatGetDiagonal_SeqAIJ(Mat A,Vec v)
127317ab2063SBarry Smith {
1274416022c9SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
12756849ba73SBarry Smith   PetscErrorCode ierr;
1276fdc842d1SBarry Smith   PetscInt       i,j,n,*ai=a->i,*aj=a->j;
1277fdc842d1SBarry Smith   PetscScalar    *aa=a->a,*x;
127817ab2063SBarry Smith 
12793a40ed3dSBarry Smith   PetscFunctionBegin;
1280d3e70bfaSHong Zhang   ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr);
1281e32f2f54SBarry Smith   if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector");
128235e7444dSHong Zhang 
1283d5f3da31SBarry Smith   if (A->factortype == MAT_FACTOR_ILU || A->factortype == MAT_FACTOR_LU) {
1284d3e70bfaSHong Zhang     PetscInt *diag=a->diag;
1285fdc842d1SBarry Smith     ierr = VecGetArrayWrite(v,&x);CHKERRQ(ierr);
12862c990fa1SHong Zhang     for (i=0; i<n; i++) x[i] = 1.0/aa[diag[i]];
1287fdc842d1SBarry Smith     ierr = VecRestoreArrayWrite(v,&x);CHKERRQ(ierr);
128835e7444dSHong Zhang     PetscFunctionReturn(0);
128935e7444dSHong Zhang   }
129035e7444dSHong Zhang 
1291fdc842d1SBarry Smith   ierr = VecGetArrayWrite(v,&x);CHKERRQ(ierr);
129235e7444dSHong Zhang   for (i=0; i<n; i++) {
1293fdc842d1SBarry Smith     x[i] = 0.0;
129435e7444dSHong Zhang     for (j=ai[i]; j<ai[i+1]; j++) {
129535e7444dSHong Zhang       if (aj[j] == i) {
129635e7444dSHong Zhang         x[i] = aa[j];
129717ab2063SBarry Smith         break;
129817ab2063SBarry Smith       }
129917ab2063SBarry Smith     }
130017ab2063SBarry Smith   }
1301fdc842d1SBarry Smith   ierr = VecRestoreArrayWrite(v,&x);CHKERRQ(ierr);
13023a40ed3dSBarry Smith   PetscFunctionReturn(0);
130317ab2063SBarry Smith }
130417ab2063SBarry Smith 
1305c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
1306dfbe8321SBarry Smith PetscErrorCode MatMultTransposeAdd_SeqAIJ(Mat A,Vec xx,Vec zz,Vec yy)
130717ab2063SBarry Smith {
1308416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
1309d9ca1df4SBarry Smith   PetscScalar       *y;
1310d9ca1df4SBarry Smith   const PetscScalar *x;
1311dfbe8321SBarry Smith   PetscErrorCode    ierr;
1312d0f46423SBarry Smith   PetscInt          m = A->rmap->n;
13135c897100SBarry Smith #if !defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1314d9ca1df4SBarry Smith   const MatScalar   *v;
1315a77337e4SBarry Smith   PetscScalar       alpha;
1316d9ca1df4SBarry Smith   PetscInt          n,i,j;
1317d9ca1df4SBarry Smith   const PetscInt    *idx,*ii,*ridx=NULL;
13183447b6efSHong Zhang   Mat_CompressedRow cprow    = a->compressedrow;
1319ace3abfcSBarry Smith   PetscBool         usecprow = cprow.use;
13205c897100SBarry Smith #endif
132117ab2063SBarry Smith 
13223a40ed3dSBarry Smith   PetscFunctionBegin;
13232e8a6d31SBarry Smith   if (zz != yy) {ierr = VecCopy(zz,yy);CHKERRQ(ierr);}
1324d9ca1df4SBarry Smith   ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr);
13251ebc52fbSHong Zhang   ierr = VecGetArray(yy,&y);CHKERRQ(ierr);
13265c897100SBarry Smith 
13275c897100SBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTTRANSPOSEAIJ)
1328bfeeae90SHong Zhang   fortranmulttransposeaddaij_(&m,x,a->i,a->j,a->a,y);
13295c897100SBarry Smith #else
13303447b6efSHong Zhang   if (usecprow) {
13313447b6efSHong Zhang     m    = cprow.nrows;
13323447b6efSHong Zhang     ii   = cprow.i;
13337b2bb3b9SHong Zhang     ridx = cprow.rindex;
13343447b6efSHong Zhang   } else {
13353447b6efSHong Zhang     ii = a->i;
13363447b6efSHong Zhang   }
133717ab2063SBarry Smith   for (i=0; i<m; i++) {
13383447b6efSHong Zhang     idx = a->j + ii[i];
13393447b6efSHong Zhang     v   = a->a + ii[i];
13403447b6efSHong Zhang     n   = ii[i+1] - ii[i];
13413447b6efSHong Zhang     if (usecprow) {
13427b2bb3b9SHong Zhang       alpha = x[ridx[i]];
13433447b6efSHong Zhang     } else {
134417ab2063SBarry Smith       alpha = x[i];
13453447b6efSHong Zhang     }
134604fbf559SBarry Smith     for (j=0; j<n; j++) y[idx[j]] += alpha*v[j];
134717ab2063SBarry Smith   }
13485c897100SBarry Smith #endif
1349dc0b31edSSatish Balay   ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr);
1350d9ca1df4SBarry Smith   ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr);
13511ebc52fbSHong Zhang   ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr);
13523a40ed3dSBarry Smith   PetscFunctionReturn(0);
135317ab2063SBarry Smith }
135417ab2063SBarry Smith 
1355dfbe8321SBarry Smith PetscErrorCode MatMultTranspose_SeqAIJ(Mat A,Vec xx,Vec yy)
13565c897100SBarry Smith {
1357dfbe8321SBarry Smith   PetscErrorCode ierr;
13585c897100SBarry Smith 
13595c897100SBarry Smith   PetscFunctionBegin;
1360170fe5c8SBarry Smith   ierr = VecSet(yy,0.0);CHKERRQ(ierr);
13615c897100SBarry Smith   ierr = MatMultTransposeAdd_SeqAIJ(A,xx,yy,yy);CHKERRQ(ierr);
13625c897100SBarry Smith   PetscFunctionReturn(0);
13635c897100SBarry Smith }
13645c897100SBarry Smith 
1365c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmult.h>
136678b84d54SShri Abhyankar 
1367dfbe8321SBarry Smith PetscErrorCode MatMult_SeqAIJ(Mat A,Vec xx,Vec yy)
136817ab2063SBarry Smith {
1369416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
1370d9fead3dSBarry Smith   PetscScalar       *y;
137154f21887SBarry Smith   const PetscScalar *x;
137254f21887SBarry Smith   const MatScalar   *aa;
1373dfbe8321SBarry Smith   PetscErrorCode    ierr;
1374003131ecSBarry Smith   PetscInt          m=A->rmap->n;
13750298fd71SBarry Smith   const PetscInt    *aj,*ii,*ridx=NULL;
13767b083b7cSBarry Smith   PetscInt          n,i;
1377362ced78SSatish Balay   PetscScalar       sum;
1378ace3abfcSBarry Smith   PetscBool         usecprow=a->compressedrow.use;
137917ab2063SBarry Smith 
1380b6410449SSatish Balay #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
138197952fefSHong Zhang #pragma disjoint(*x,*y,*aa)
1382fee21e36SBarry Smith #endif
1383fee21e36SBarry Smith 
13843a40ed3dSBarry Smith   PetscFunctionBegin;
13853649974fSBarry Smith   ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr);
13861ebc52fbSHong Zhang   ierr = VecGetArray(yy,&y);CHKERRQ(ierr);
1387416022c9SBarry Smith   ii   = a->i;
13884eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
1389580bdb30SBarry Smith     ierr = PetscArrayzero(y,m);CHKERRQ(ierr);
139097952fefSHong Zhang     m    = a->compressedrow.nrows;
139197952fefSHong Zhang     ii   = a->compressedrow.i;
139297952fefSHong Zhang     ridx = a->compressedrow.rindex;
139397952fefSHong Zhang     for (i=0; i<m; i++) {
139497952fefSHong Zhang       n           = ii[i+1] - ii[i];
139597952fefSHong Zhang       aj          = a->j + ii[i];
139697952fefSHong Zhang       aa          = a->a + ii[i];
139797952fefSHong Zhang       sum         = 0.0;
1398003131ecSBarry Smith       PetscSparseDensePlusDot(sum,x,aa,aj,n);
1399003131ecSBarry Smith       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
140097952fefSHong Zhang       y[*ridx++] = sum;
140197952fefSHong Zhang     }
140297952fefSHong Zhang   } else { /* do not use compressed row format */
1403b05257ddSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTAIJ)
14043d3eaba7SBarry Smith     aj   = a->j;
14053d3eaba7SBarry Smith     aa   = a->a;
1406b05257ddSBarry Smith     fortranmultaij_(&m,x,ii,aj,aa,y);
1407b05257ddSBarry Smith #else
140817ab2063SBarry Smith     for (i=0; i<m; i++) {
1409003131ecSBarry Smith       n           = ii[i+1] - ii[i];
1410003131ecSBarry Smith       aj          = a->j + ii[i];
1411003131ecSBarry Smith       aa          = a->a + ii[i];
141217ab2063SBarry Smith       sum         = 0.0;
1413003131ecSBarry Smith       PetscSparseDensePlusDot(sum,x,aa,aj,n);
141417ab2063SBarry Smith       y[i] = sum;
141517ab2063SBarry Smith     }
14168d195f9aSBarry Smith #endif
1417b05257ddSBarry Smith   }
14187b083b7cSBarry Smith   ierr = PetscLogFlops(2.0*a->nz - a->nonzerorowcnt);CHKERRQ(ierr);
14193649974fSBarry Smith   ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr);
14201ebc52fbSHong Zhang   ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr);
14213a40ed3dSBarry Smith   PetscFunctionReturn(0);
142217ab2063SBarry Smith }
142317ab2063SBarry Smith 
1424b434eb95SMatthew G. Knepley PetscErrorCode MatMultMax_SeqAIJ(Mat A,Vec xx,Vec yy)
1425b434eb95SMatthew G. Knepley {
1426b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
1427b434eb95SMatthew G. Knepley   PetscScalar       *y;
1428b434eb95SMatthew G. Knepley   const PetscScalar *x;
1429b434eb95SMatthew G. Knepley   const MatScalar   *aa;
1430b434eb95SMatthew G. Knepley   PetscErrorCode    ierr;
1431b434eb95SMatthew G. Knepley   PetscInt          m=A->rmap->n;
1432b434eb95SMatthew G. Knepley   const PetscInt    *aj,*ii,*ridx=NULL;
1433b434eb95SMatthew G. Knepley   PetscInt          n,i,nonzerorow=0;
1434b434eb95SMatthew G. Knepley   PetscScalar       sum;
1435b434eb95SMatthew G. Knepley   PetscBool         usecprow=a->compressedrow.use;
1436b434eb95SMatthew G. Knepley 
1437b434eb95SMatthew G. Knepley #if defined(PETSC_HAVE_PRAGMA_DISJOINT)
1438b434eb95SMatthew G. Knepley #pragma disjoint(*x,*y,*aa)
1439b434eb95SMatthew G. Knepley #endif
1440b434eb95SMatthew G. Knepley 
1441b434eb95SMatthew G. Knepley   PetscFunctionBegin;
1442b434eb95SMatthew G. Knepley   ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr);
1443b434eb95SMatthew G. Knepley   ierr = VecGetArray(yy,&y);CHKERRQ(ierr);
1444b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1445b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1446b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1447b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1448b434eb95SMatthew G. Knepley     for (i=0; i<m; i++) {
1449b434eb95SMatthew G. Knepley       n           = ii[i+1] - ii[i];
1450b434eb95SMatthew G. Knepley       aj          = a->j + ii[i];
1451b434eb95SMatthew G. Knepley       aa          = a->a + ii[i];
1452b434eb95SMatthew G. Knepley       sum         = 0.0;
1453b434eb95SMatthew G. Knepley       nonzerorow += (n>0);
1454b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum,x,aa,aj,n);
1455b434eb95SMatthew G. Knepley       /* for (j=0; j<n; j++) sum += (*aa++)*x[*aj++]; */
1456b434eb95SMatthew G. Knepley       y[*ridx++] = sum;
1457b434eb95SMatthew G. Knepley     }
1458b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
14593d3eaba7SBarry Smith     ii = a->i;
1460b434eb95SMatthew G. Knepley     for (i=0; i<m; i++) {
1461b434eb95SMatthew G. Knepley       n           = ii[i+1] - ii[i];
1462b434eb95SMatthew G. Knepley       aj          = a->j + ii[i];
1463b434eb95SMatthew G. Knepley       aa          = a->a + ii[i];
1464b434eb95SMatthew G. Knepley       sum         = 0.0;
1465b434eb95SMatthew G. Knepley       nonzerorow += (n>0);
1466b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum,x,aa,aj,n);
1467b434eb95SMatthew G. Knepley       y[i] = sum;
1468b434eb95SMatthew G. Knepley     }
1469b434eb95SMatthew G. Knepley   }
1470b434eb95SMatthew G. Knepley   ierr = PetscLogFlops(2.0*a->nz - nonzerorow);CHKERRQ(ierr);
1471b434eb95SMatthew G. Knepley   ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr);
1472b434eb95SMatthew G. Knepley   ierr = VecRestoreArray(yy,&y);CHKERRQ(ierr);
1473b434eb95SMatthew G. Knepley   PetscFunctionReturn(0);
1474b434eb95SMatthew G. Knepley }
1475b434eb95SMatthew G. Knepley 
1476b434eb95SMatthew G. Knepley PetscErrorCode MatMultAddMax_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz)
1477b434eb95SMatthew G. Knepley {
1478b434eb95SMatthew G. Knepley   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
1479b434eb95SMatthew G. Knepley   PetscScalar       *y,*z;
1480b434eb95SMatthew G. Knepley   const PetscScalar *x;
1481b434eb95SMatthew G. Knepley   const MatScalar   *aa;
1482b434eb95SMatthew G. Knepley   PetscErrorCode    ierr;
1483b434eb95SMatthew G. Knepley   PetscInt          m = A->rmap->n,*aj,*ii;
1484b434eb95SMatthew G. Knepley   PetscInt          n,i,*ridx=NULL;
1485b434eb95SMatthew G. Knepley   PetscScalar       sum;
1486b434eb95SMatthew G. Knepley   PetscBool         usecprow=a->compressedrow.use;
1487b434eb95SMatthew G. Knepley 
1488b434eb95SMatthew G. Knepley   PetscFunctionBegin;
1489b434eb95SMatthew G. Knepley   ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr);
1490d9ca1df4SBarry Smith   ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr);
1491b434eb95SMatthew G. Knepley   if (usecprow) { /* use compressed row format */
1492b434eb95SMatthew G. Knepley     if (zz != yy) {
1493580bdb30SBarry Smith       ierr = PetscArraycpy(z,y,m);CHKERRQ(ierr);
1494b434eb95SMatthew G. Knepley     }
1495b434eb95SMatthew G. Knepley     m    = a->compressedrow.nrows;
1496b434eb95SMatthew G. Knepley     ii   = a->compressedrow.i;
1497b434eb95SMatthew G. Knepley     ridx = a->compressedrow.rindex;
1498b434eb95SMatthew G. Knepley     for (i=0; i<m; i++) {
1499b434eb95SMatthew G. Knepley       n   = ii[i+1] - ii[i];
1500b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1501b434eb95SMatthew G. Knepley       aa  = a->a + ii[i];
1502b434eb95SMatthew G. Knepley       sum = y[*ridx];
1503b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum,x,aa,aj,n);
1504b434eb95SMatthew G. Knepley       z[*ridx++] = sum;
1505b434eb95SMatthew G. Knepley     }
1506b434eb95SMatthew G. Knepley   } else { /* do not use compressed row format */
15073d3eaba7SBarry Smith     ii = a->i;
1508b434eb95SMatthew G. Knepley     for (i=0; i<m; i++) {
1509b434eb95SMatthew G. Knepley       n   = ii[i+1] - ii[i];
1510b434eb95SMatthew G. Knepley       aj  = a->j + ii[i];
1511b434eb95SMatthew G. Knepley       aa  = a->a + ii[i];
1512b434eb95SMatthew G. Knepley       sum = y[i];
1513b434eb95SMatthew G. Knepley       PetscSparseDenseMaxDot(sum,x,aa,aj,n);
1514b434eb95SMatthew G. Knepley       z[i] = sum;
1515b434eb95SMatthew G. Knepley     }
1516b434eb95SMatthew G. Knepley   }
1517b434eb95SMatthew G. Knepley   ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr);
1518b434eb95SMatthew G. Knepley   ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr);
1519d9ca1df4SBarry Smith   ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr);
1520b434eb95SMatthew G. Knepley   PetscFunctionReturn(0);
1521b434eb95SMatthew G. Knepley }
1522b434eb95SMatthew G. Knepley 
1523c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/fmultadd.h>
1524dfbe8321SBarry Smith PetscErrorCode MatMultAdd_SeqAIJ(Mat A,Vec xx,Vec yy,Vec zz)
152517ab2063SBarry Smith {
1526416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
1527f15663dcSBarry Smith   PetscScalar       *y,*z;
1528f15663dcSBarry Smith   const PetscScalar *x;
152954f21887SBarry Smith   const MatScalar   *aa;
1530dfbe8321SBarry Smith   PetscErrorCode    ierr;
1531d9ca1df4SBarry Smith   const PetscInt    *aj,*ii,*ridx=NULL;
1532d9ca1df4SBarry Smith   PetscInt          m = A->rmap->n,n,i;
1533362ced78SSatish Balay   PetscScalar       sum;
1534ace3abfcSBarry Smith   PetscBool         usecprow=a->compressedrow.use;
15359ea0dfa2SSatish Balay 
15363a40ed3dSBarry Smith   PetscFunctionBegin;
1537f15663dcSBarry Smith   ierr = VecGetArrayRead(xx,&x);CHKERRQ(ierr);
1538d9ca1df4SBarry Smith   ierr = VecGetArrayPair(yy,zz,&y,&z);CHKERRQ(ierr);
15394eb6d288SHong Zhang   if (usecprow) { /* use compressed row format */
15404eb6d288SHong Zhang     if (zz != yy) {
1541580bdb30SBarry Smith       ierr = PetscArraycpy(z,y,m);CHKERRQ(ierr);
15424eb6d288SHong Zhang     }
154397952fefSHong Zhang     m    = a->compressedrow.nrows;
154497952fefSHong Zhang     ii   = a->compressedrow.i;
154597952fefSHong Zhang     ridx = a->compressedrow.rindex;
154697952fefSHong Zhang     for (i=0; i<m; i++) {
154797952fefSHong Zhang       n   = ii[i+1] - ii[i];
154897952fefSHong Zhang       aj  = a->j + ii[i];
154997952fefSHong Zhang       aa  = a->a + ii[i];
155097952fefSHong Zhang       sum = y[*ridx];
1551f15663dcSBarry Smith       PetscSparseDensePlusDot(sum,x,aa,aj,n);
155297952fefSHong Zhang       z[*ridx++] = sum;
155397952fefSHong Zhang     }
155497952fefSHong Zhang   } else { /* do not use compressed row format */
15553d3eaba7SBarry Smith     ii = a->i;
1556f15663dcSBarry Smith #if defined(PETSC_USE_FORTRAN_KERNEL_MULTADDAIJ)
15573d3eaba7SBarry Smith     aj = a->j;
15583d3eaba7SBarry Smith     aa = a->a;
1559f15663dcSBarry Smith     fortranmultaddaij_(&m,x,ii,aj,aa,y,z);
1560f15663dcSBarry Smith #else
156117ab2063SBarry Smith     for (i=0; i<m; i++) {
1562f15663dcSBarry Smith       n   = ii[i+1] - ii[i];
1563f15663dcSBarry Smith       aj  = a->j + ii[i];
1564f15663dcSBarry Smith       aa  = a->a + ii[i];
156517ab2063SBarry Smith       sum = y[i];
1566f15663dcSBarry Smith       PetscSparseDensePlusDot(sum,x,aa,aj,n);
156717ab2063SBarry Smith       z[i] = sum;
156817ab2063SBarry Smith     }
156902ab625aSSatish Balay #endif
1570f15663dcSBarry Smith   }
1571dc0b31edSSatish Balay   ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr);
1572f15663dcSBarry Smith   ierr = VecRestoreArrayRead(xx,&x);CHKERRQ(ierr);
1573d9ca1df4SBarry Smith   ierr = VecRestoreArrayPair(yy,zz,&y,&z);CHKERRQ(ierr);
15743a40ed3dSBarry Smith   PetscFunctionReturn(0);
157517ab2063SBarry Smith }
157617ab2063SBarry Smith 
157717ab2063SBarry Smith /*
157817ab2063SBarry Smith      Adds diagonal pointers to sparse matrix structure.
157917ab2063SBarry Smith */
1580dfbe8321SBarry Smith PetscErrorCode MatMarkDiagonal_SeqAIJ(Mat A)
158117ab2063SBarry Smith {
1582416022c9SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
15836849ba73SBarry Smith   PetscErrorCode ierr;
1584d0f46423SBarry Smith   PetscInt       i,j,m = A->rmap->n;
158517ab2063SBarry Smith 
15863a40ed3dSBarry Smith   PetscFunctionBegin;
158709f38230SBarry Smith   if (!a->diag) {
1588785e854fSJed Brown     ierr = PetscMalloc1(m,&a->diag);CHKERRQ(ierr);
15893bb1ff40SBarry Smith     ierr = PetscLogObjectMemory((PetscObject)A, m*sizeof(PetscInt));CHKERRQ(ierr);
159009f38230SBarry Smith   }
1591d0f46423SBarry Smith   for (i=0; i<A->rmap->n; i++) {
159209f38230SBarry Smith     a->diag[i] = a->i[i+1];
1593bfeeae90SHong Zhang     for (j=a->i[i]; j<a->i[i+1]; j++) {
1594bfeeae90SHong Zhang       if (a->j[j] == i) {
159509f38230SBarry Smith         a->diag[i] = j;
159617ab2063SBarry Smith         break;
159717ab2063SBarry Smith       }
159817ab2063SBarry Smith     }
159917ab2063SBarry Smith   }
16003a40ed3dSBarry Smith   PetscFunctionReturn(0);
160117ab2063SBarry Smith }
160217ab2063SBarry Smith 
160361ecd0c6SBarry Smith PetscErrorCode MatShift_SeqAIJ(Mat A,PetscScalar v)
160461ecd0c6SBarry Smith {
160561ecd0c6SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
160661ecd0c6SBarry Smith   const PetscInt    *diag = (const PetscInt*)a->diag;
160761ecd0c6SBarry Smith   const PetscInt    *ii = (const PetscInt*) a->i;
160861ecd0c6SBarry Smith   PetscInt          i,*mdiag = NULL;
160961ecd0c6SBarry Smith   PetscErrorCode    ierr;
161061ecd0c6SBarry Smith   PetscInt          cnt = 0; /* how many diagonals are missing */
161161ecd0c6SBarry Smith 
161261ecd0c6SBarry Smith   PetscFunctionBegin;
161361ecd0c6SBarry Smith   if (!A->preallocated || !a->nz) {
161461ecd0c6SBarry Smith     ierr = MatSeqAIJSetPreallocation(A,1,NULL);CHKERRQ(ierr);
161561ecd0c6SBarry Smith     ierr = MatShift_Basic(A,v);CHKERRQ(ierr);
161661ecd0c6SBarry Smith     PetscFunctionReturn(0);
161761ecd0c6SBarry Smith   }
161861ecd0c6SBarry Smith 
161961ecd0c6SBarry Smith   if (a->diagonaldense) {
162061ecd0c6SBarry Smith     cnt = 0;
162161ecd0c6SBarry Smith   } else {
162261ecd0c6SBarry Smith     ierr = PetscCalloc1(A->rmap->n,&mdiag);CHKERRQ(ierr);
162361ecd0c6SBarry Smith     for (i=0; i<A->rmap->n; i++) {
162461ecd0c6SBarry Smith       if (diag[i] >= ii[i+1]) {
162561ecd0c6SBarry Smith         cnt++;
162661ecd0c6SBarry Smith         mdiag[i] = 1;
162761ecd0c6SBarry Smith       }
162861ecd0c6SBarry Smith     }
162961ecd0c6SBarry Smith   }
163061ecd0c6SBarry Smith   if (!cnt) {
163161ecd0c6SBarry Smith     ierr = MatShift_Basic(A,v);CHKERRQ(ierr);
163261ecd0c6SBarry Smith   } else {
1633b6f2aa54SBarry Smith     PetscScalar *olda = a->a;  /* preserve pointers to current matrix nonzeros structure and values */
1634b6f2aa54SBarry Smith     PetscInt    *oldj = a->j, *oldi = a->i;
163561ecd0c6SBarry Smith     PetscBool   singlemalloc = a->singlemalloc,free_a = a->free_a,free_ij = a->free_ij;
163661ecd0c6SBarry Smith 
163761ecd0c6SBarry Smith     a->a = NULL;
163861ecd0c6SBarry Smith     a->j = NULL;
163961ecd0c6SBarry Smith     a->i = NULL;
164061ecd0c6SBarry Smith     /* increase the values in imax for each row where a diagonal is being inserted then reallocate the matrix data structures */
164161ecd0c6SBarry Smith     for (i=0; i<A->rmap->n; i++) {
164261ecd0c6SBarry Smith       a->imax[i] += mdiag[i];
1643447d62f5SStefano Zampini       a->imax[i] = PetscMin(a->imax[i],A->cmap->n);
164461ecd0c6SBarry Smith     }
164561ecd0c6SBarry Smith     ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,0,a->imax);CHKERRQ(ierr);
164661ecd0c6SBarry Smith 
164761ecd0c6SBarry Smith     /* copy old values into new matrix data structure */
164861ecd0c6SBarry Smith     for (i=0; i<A->rmap->n; i++) {
164961ecd0c6SBarry Smith       ierr = MatSetValues(A,1,&i,a->imax[i] - mdiag[i],&oldj[oldi[i]],&olda[oldi[i]],ADD_VALUES);CHKERRQ(ierr);
1650447d62f5SStefano Zampini       if (i < A->cmap->n) {
165161ecd0c6SBarry Smith         ierr = MatSetValue(A,i,i,v,ADD_VALUES);CHKERRQ(ierr);
165261ecd0c6SBarry Smith       }
1653447d62f5SStefano Zampini     }
165461ecd0c6SBarry Smith     ierr = MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
165561ecd0c6SBarry Smith     ierr = MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
165661ecd0c6SBarry Smith     if (singlemalloc) {
165761ecd0c6SBarry Smith       ierr = PetscFree3(olda,oldj,oldi);CHKERRQ(ierr);
165861ecd0c6SBarry Smith     } else {
165961ecd0c6SBarry Smith       if (free_a)  {ierr = PetscFree(olda);CHKERRQ(ierr);}
166061ecd0c6SBarry Smith       if (free_ij) {ierr = PetscFree(oldj);CHKERRQ(ierr);}
166161ecd0c6SBarry Smith       if (free_ij) {ierr = PetscFree(oldi);CHKERRQ(ierr);}
166261ecd0c6SBarry Smith     }
166361ecd0c6SBarry Smith   }
166461ecd0c6SBarry Smith   ierr = PetscFree(mdiag);CHKERRQ(ierr);
166561ecd0c6SBarry Smith   a->diagonaldense = PETSC_TRUE;
166661ecd0c6SBarry Smith   PetscFunctionReturn(0);
166761ecd0c6SBarry Smith }
166861ecd0c6SBarry Smith 
1669be5855fcSBarry Smith /*
1670be5855fcSBarry Smith      Checks for missing diagonals
1671be5855fcSBarry Smith */
1672ace3abfcSBarry Smith PetscErrorCode MatMissingDiagonal_SeqAIJ(Mat A,PetscBool  *missing,PetscInt *d)
1673be5855fcSBarry Smith {
1674be5855fcSBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
16757734d3b5SMatthew G. Knepley   PetscInt       *diag,*ii = a->i,i;
1676994fe344SLisandro Dalcin   PetscErrorCode ierr;
1677be5855fcSBarry Smith 
1678be5855fcSBarry Smith   PetscFunctionBegin;
167909f38230SBarry Smith   *missing = PETSC_FALSE;
16807734d3b5SMatthew G. Knepley   if (A->rmap->n > 0 && !ii) {
168109f38230SBarry Smith     *missing = PETSC_TRUE;
168209f38230SBarry Smith     if (d) *d = 0;
1683994fe344SLisandro Dalcin     ierr = PetscInfo(A,"Matrix has no entries therefore is missing diagonal\n");CHKERRQ(ierr);
168409f38230SBarry Smith   } else {
168501445905SHong Zhang     PetscInt n;
168601445905SHong Zhang     n = PetscMin(A->rmap->n, A->cmap->n);
1687f1e2ffcdSBarry Smith     diag = a->diag;
168801445905SHong Zhang     for (i=0; i<n; i++) {
16897734d3b5SMatthew G. Knepley       if (diag[i] >= ii[i+1]) {
169009f38230SBarry Smith         *missing = PETSC_TRUE;
169109f38230SBarry Smith         if (d) *d = i;
1692994fe344SLisandro Dalcin         ierr = PetscInfo1(A,"Matrix is missing diagonal number %D\n",i);CHKERRQ(ierr);
1693358d2f5dSShri Abhyankar         break;
169409f38230SBarry Smith       }
1695be5855fcSBarry Smith     }
1696be5855fcSBarry Smith   }
1697be5855fcSBarry Smith   PetscFunctionReturn(0);
1698be5855fcSBarry Smith }
1699be5855fcSBarry Smith 
17000da83c2eSBarry Smith #include <petscblaslapack.h>
17010da83c2eSBarry Smith #include <petsc/private/kernels/blockinvert.h>
17020da83c2eSBarry Smith 
17030da83c2eSBarry Smith /*
17040da83c2eSBarry Smith     Note that values is allocated externally by the PC and then passed into this routine
17050da83c2eSBarry Smith */
17060da83c2eSBarry Smith PetscErrorCode MatInvertVariableBlockDiagonal_SeqAIJ(Mat A,PetscInt nblocks,const PetscInt *bsizes,PetscScalar *diag)
17070da83c2eSBarry Smith {
17080da83c2eSBarry Smith   PetscErrorCode  ierr;
17090da83c2eSBarry Smith   PetscInt        n = A->rmap->n, i, ncnt = 0, *indx,j,bsizemax = 0,*v_pivots;
17100da83c2eSBarry Smith   PetscBool       allowzeropivot,zeropivotdetected=PETSC_FALSE;
17110da83c2eSBarry Smith   const PetscReal shift = 0.0;
17120da83c2eSBarry Smith   PetscInt        ipvt[5];
17130da83c2eSBarry Smith   PetscScalar     work[25],*v_work;
17140da83c2eSBarry Smith 
17150da83c2eSBarry Smith   PetscFunctionBegin;
17160da83c2eSBarry Smith   allowzeropivot = PetscNot(A->erroriffailure);
17170da83c2eSBarry Smith   for (i=0; i<nblocks; i++) ncnt += bsizes[i];
17180da83c2eSBarry Smith   if (ncnt != n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Total blocksizes %D doesn't match number matrix rows %D",ncnt,n);
17190da83c2eSBarry Smith   for (i=0; i<nblocks; i++) {
17200da83c2eSBarry Smith     bsizemax = PetscMax(bsizemax,bsizes[i]);
17210da83c2eSBarry Smith   }
17220da83c2eSBarry Smith   ierr = PetscMalloc1(bsizemax,&indx);CHKERRQ(ierr);
17230da83c2eSBarry Smith   if (bsizemax > 7) {
17240da83c2eSBarry Smith     ierr = PetscMalloc2(bsizemax,&v_work,bsizemax,&v_pivots);CHKERRQ(ierr);
17250da83c2eSBarry Smith   }
17260da83c2eSBarry Smith   ncnt = 0;
17270da83c2eSBarry Smith   for (i=0; i<nblocks; i++) {
17280da83c2eSBarry Smith     for (j=0; j<bsizes[i]; j++) indx[j] = ncnt+j;
17290da83c2eSBarry Smith     ierr    = MatGetValues(A,bsizes[i],indx,bsizes[i],indx,diag);CHKERRQ(ierr);
17300da83c2eSBarry Smith     switch (bsizes[i]) {
17310da83c2eSBarry Smith     case 1:
17320da83c2eSBarry Smith       *diag = 1.0/(*diag);
17330da83c2eSBarry Smith       break;
17340da83c2eSBarry Smith     case 2:
17350da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
17360da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17370da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr);
17380da83c2eSBarry Smith       break;
17390da83c2eSBarry Smith     case 3:
17400da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
17410da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17420da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr);
17430da83c2eSBarry Smith       break;
17440da83c2eSBarry Smith     case 4:
17450da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
17460da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17470da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr);
17480da83c2eSBarry Smith       break;
17490da83c2eSBarry Smith     case 5:
17500da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
17510da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17520da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr);
17530da83c2eSBarry Smith       break;
17540da83c2eSBarry Smith     case 6:
17550da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
17560da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17570da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr);
17580da83c2eSBarry Smith       break;
17590da83c2eSBarry Smith     case 7:
17600da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
17610da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17620da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr);
17630da83c2eSBarry Smith       break;
17640da83c2eSBarry Smith     default:
17650da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_inverse_A(bsizes[i],diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
17660da83c2eSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
17670da83c2eSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_N(diag,bsizes[i]);CHKERRQ(ierr);
17680da83c2eSBarry Smith     }
17690da83c2eSBarry Smith     ncnt   += bsizes[i];
17700da83c2eSBarry Smith     diag += bsizes[i]*bsizes[i];
17710da83c2eSBarry Smith   }
17720da83c2eSBarry Smith   if (bsizemax > 7) {
17730da83c2eSBarry Smith     ierr = PetscFree2(v_work,v_pivots);CHKERRQ(ierr);
17740da83c2eSBarry Smith   }
17750da83c2eSBarry Smith   ierr = PetscFree(indx);CHKERRQ(ierr);
17760da83c2eSBarry Smith   PetscFunctionReturn(0);
17770da83c2eSBarry Smith }
17780da83c2eSBarry Smith 
1779422a814eSBarry Smith /*
1780422a814eSBarry Smith    Negative shift indicates do not generate an error if there is a zero diagonal, just invert it anyways
1781422a814eSBarry Smith */
17827087cfbeSBarry Smith PetscErrorCode  MatInvertDiagonal_SeqAIJ(Mat A,PetscScalar omega,PetscScalar fshift)
178371f1c65dSBarry Smith {
178471f1c65dSBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*) A->data;
178571f1c65dSBarry Smith   PetscErrorCode ierr;
1786d0f46423SBarry Smith   PetscInt       i,*diag,m = A->rmap->n;
178754f21887SBarry Smith   MatScalar      *v = a->a;
178854f21887SBarry Smith   PetscScalar    *idiag,*mdiag;
178971f1c65dSBarry Smith 
179071f1c65dSBarry Smith   PetscFunctionBegin;
179171f1c65dSBarry Smith   if (a->idiagvalid) PetscFunctionReturn(0);
179271f1c65dSBarry Smith   ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr);
179371f1c65dSBarry Smith   diag = a->diag;
179471f1c65dSBarry Smith   if (!a->idiag) {
1795dcca6d9dSJed Brown     ierr = PetscMalloc3(m,&a->idiag,m,&a->mdiag,m,&a->ssor_work);CHKERRQ(ierr);
17963bb1ff40SBarry Smith     ierr = PetscLogObjectMemory((PetscObject)A, 3*m*sizeof(PetscScalar));CHKERRQ(ierr);
179771f1c65dSBarry Smith     v    = a->a;
179871f1c65dSBarry Smith   }
179971f1c65dSBarry Smith   mdiag = a->mdiag;
180071f1c65dSBarry Smith   idiag = a->idiag;
180171f1c65dSBarry Smith 
1802422a814eSBarry Smith   if (omega == 1.0 && PetscRealPart(fshift) <= 0.0) {
180371f1c65dSBarry Smith     for (i=0; i<m; i++) {
180471f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
1805899639b0SHong Zhang       if (!PetscAbsScalar(mdiag[i])) { /* zero diagonal */
1806899639b0SHong Zhang         if (PetscRealPart(fshift)) {
1807899639b0SHong Zhang           ierr = PetscInfo1(A,"Zero diagonal on row %D\n",i);CHKERRQ(ierr);
18087b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
18097b6c816cSBarry Smith           A->factorerror_zeropivot_value = 0.0;
18107b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
1811a6fa060aSHong Zhang         } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Zero diagonal on row %D",i);
1812899639b0SHong Zhang       }
181371f1c65dSBarry Smith       idiag[i] = 1.0/v[diag[i]];
181471f1c65dSBarry Smith     }
181571f1c65dSBarry Smith     ierr = PetscLogFlops(m);CHKERRQ(ierr);
181671f1c65dSBarry Smith   } else {
181771f1c65dSBarry Smith     for (i=0; i<m; i++) {
181871f1c65dSBarry Smith       mdiag[i] = v[diag[i]];
181971f1c65dSBarry Smith       idiag[i] = omega/(fshift + v[diag[i]]);
182071f1c65dSBarry Smith     }
1821dc0b31edSSatish Balay     ierr = PetscLogFlops(2.0*m);CHKERRQ(ierr);
182271f1c65dSBarry Smith   }
182371f1c65dSBarry Smith   a->idiagvalid = PETSC_TRUE;
182471f1c65dSBarry Smith   PetscFunctionReturn(0);
182571f1c65dSBarry Smith }
182671f1c65dSBarry Smith 
1827c6db04a5SJed Brown #include <../src/mat/impls/aij/seq/ftn-kernels/frelax.h>
182841f059aeSBarry Smith PetscErrorCode MatSOR_SeqAIJ(Mat A,Vec bb,PetscReal omega,MatSORType flag,PetscReal fshift,PetscInt its,PetscInt lits,Vec xx)
182917ab2063SBarry Smith {
1830416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
1831e6d1f457SBarry Smith   PetscScalar       *x,d,sum,*t,scale;
18323d3eaba7SBarry Smith   const MatScalar   *v,*idiag=0,*mdiag;
183354f21887SBarry Smith   const PetscScalar *b, *bs,*xb, *ts;
1834dfbe8321SBarry Smith   PetscErrorCode    ierr;
18353d3eaba7SBarry Smith   PetscInt          n,m = A->rmap->n,i;
183697f1f81fSBarry Smith   const PetscInt    *idx,*diag;
183717ab2063SBarry Smith 
18383a40ed3dSBarry Smith   PetscFunctionBegin;
1839b965ef7fSBarry Smith   its = its*lits;
184091723122SBarry Smith 
184171f1c65dSBarry Smith   if (fshift != a->fshift || omega != a->omega) a->idiagvalid = PETSC_FALSE; /* must recompute idiag[] */
184271f1c65dSBarry Smith   if (!a->idiagvalid) {ierr = MatInvertDiagonal_SeqAIJ(A,omega,fshift);CHKERRQ(ierr);}
184371f1c65dSBarry Smith   a->fshift = fshift;
184471f1c65dSBarry Smith   a->omega  = omega;
1845ed480e8bSBarry Smith 
184671f1c65dSBarry Smith   diag  = a->diag;
184771f1c65dSBarry Smith   t     = a->ssor_work;
1848ed480e8bSBarry Smith   idiag = a->idiag;
184971f1c65dSBarry Smith   mdiag = a->mdiag;
1850ed480e8bSBarry Smith 
18511ebc52fbSHong Zhang   ierr = VecGetArray(xx,&x);CHKERRQ(ierr);
18523649974fSBarry Smith   ierr = VecGetArrayRead(bb,&b);CHKERRQ(ierr);
1853ed480e8bSBarry Smith   /* We count flops by assuming the upper triangular and lower triangular parts have the same number of nonzeros */
185417ab2063SBarry Smith   if (flag == SOR_APPLY_UPPER) {
185517ab2063SBarry Smith     /* apply (U + D/omega) to the vector */
1856ed480e8bSBarry Smith     bs = b;
185717ab2063SBarry Smith     for (i=0; i<m; i++) {
185871f1c65dSBarry Smith       d   = fshift + mdiag[i];
1859416022c9SBarry Smith       n   = a->i[i+1] - diag[i] - 1;
1860ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
1861ed480e8bSBarry Smith       v   = a->a + diag[i] + 1;
186217ab2063SBarry Smith       sum = b[i]*d/omega;
1863003131ecSBarry Smith       PetscSparseDensePlusDot(sum,bs,v,idx,n);
186417ab2063SBarry Smith       x[i] = sum;
186517ab2063SBarry Smith     }
18661ebc52fbSHong Zhang     ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr);
18673649974fSBarry Smith     ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr);
1868efee365bSSatish Balay     ierr = PetscLogFlops(a->nz);CHKERRQ(ierr);
18693a40ed3dSBarry Smith     PetscFunctionReturn(0);
187017ab2063SBarry Smith   }
1871c783ea89SBarry Smith 
18722205254eSKarl Rupp   if (flag == SOR_APPLY_LOWER) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"SOR_APPLY_LOWER is not implemented");
18732205254eSKarl Rupp   else if (flag & SOR_EISENSTAT) {
18744c500f23SPierre Jolivet     /* Let  A = L + U + D; where L is lower triangular,
1875887ee2caSBarry Smith     U is upper triangular, E = D/omega; This routine applies
187617ab2063SBarry Smith 
187717ab2063SBarry Smith             (L + E)^{-1} A (U + E)^{-1}
187817ab2063SBarry Smith 
1879887ee2caSBarry Smith     to a vector efficiently using Eisenstat's trick.
188017ab2063SBarry Smith     */
188117ab2063SBarry Smith     scale = (2.0/omega) - 1.0;
188217ab2063SBarry Smith 
188317ab2063SBarry Smith     /*  x = (E + U)^{-1} b */
188417ab2063SBarry Smith     for (i=m-1; i>=0; i--) {
1885416022c9SBarry Smith       n   = a->i[i+1] - diag[i] - 1;
1886ed480e8bSBarry Smith       idx = a->j + diag[i] + 1;
1887ed480e8bSBarry Smith       v   = a->a + diag[i] + 1;
188817ab2063SBarry Smith       sum = b[i];
1889e6d1f457SBarry Smith       PetscSparseDenseMinusDot(sum,x,v,idx,n);
1890ed480e8bSBarry Smith       x[i] = sum*idiag[i];
189117ab2063SBarry Smith     }
189217ab2063SBarry Smith 
189317ab2063SBarry Smith     /*  t = b - (2*E - D)x */
1894416022c9SBarry Smith     v = a->a;
18952205254eSKarl Rupp     for (i=0; i<m; i++) t[i] = b[i] - scale*(v[*diag++])*x[i];
189617ab2063SBarry Smith 
189717ab2063SBarry Smith     /*  t = (E + L)^{-1}t */
1898ed480e8bSBarry Smith     ts   = t;
1899416022c9SBarry Smith     diag = a->diag;
190017ab2063SBarry Smith     for (i=0; i<m; i++) {
1901416022c9SBarry Smith       n   = diag[i] - a->i[i];
1902ed480e8bSBarry Smith       idx = a->j + a->i[i];
1903ed480e8bSBarry Smith       v   = a->a + a->i[i];
190417ab2063SBarry Smith       sum = t[i];
1905003131ecSBarry Smith       PetscSparseDenseMinusDot(sum,ts,v,idx,n);
1906ed480e8bSBarry Smith       t[i] = sum*idiag[i];
1907733d66baSBarry Smith       /*  x = x + t */
1908733d66baSBarry Smith       x[i] += t[i];
190917ab2063SBarry Smith     }
191017ab2063SBarry Smith 
1911dc0b31edSSatish Balay     ierr = PetscLogFlops(6.0*m-1 + 2.0*a->nz);CHKERRQ(ierr);
19121ebc52fbSHong Zhang     ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr);
19133649974fSBarry Smith     ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr);
19143a40ed3dSBarry Smith     PetscFunctionReturn(0);
191517ab2063SBarry Smith   }
191617ab2063SBarry Smith   if (flag & SOR_ZERO_INITIAL_GUESS) {
191717ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
191817ab2063SBarry Smith       for (i=0; i<m; i++) {
1919416022c9SBarry Smith         n   = diag[i] - a->i[i];
1920ed480e8bSBarry Smith         idx = a->j + a->i[i];
1921ed480e8bSBarry Smith         v   = a->a + a->i[i];
192217ab2063SBarry Smith         sum = b[i];
1923e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum,x,v,idx,n);
19245c99c7daSBarry Smith         t[i] = sum;
1925ed480e8bSBarry Smith         x[i] = sum*idiag[i];
192617ab2063SBarry Smith       }
19275c99c7daSBarry Smith       xb   = t;
1928efee365bSSatish Balay       ierr = PetscLogFlops(a->nz);CHKERRQ(ierr);
19293a40ed3dSBarry Smith     } else xb = b;
193017ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
193117ab2063SBarry Smith       for (i=m-1; i>=0; i--) {
1932416022c9SBarry Smith         n   = a->i[i+1] - diag[i] - 1;
1933ed480e8bSBarry Smith         idx = a->j + diag[i] + 1;
1934ed480e8bSBarry Smith         v   = a->a + diag[i] + 1;
193517ab2063SBarry Smith         sum = xb[i];
1936e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum,x,v,idx,n);
19375c99c7daSBarry Smith         if (xb == b) {
1938ed480e8bSBarry Smith           x[i] = sum*idiag[i];
19395c99c7daSBarry Smith         } else {
1940b19a5dc2SMark Adams           x[i] = (1-omega)*x[i] + sum*idiag[i];  /* omega in idiag */
194117ab2063SBarry Smith         }
19425c99c7daSBarry Smith       }
1943b19a5dc2SMark Adams       ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */
194417ab2063SBarry Smith     }
194517ab2063SBarry Smith     its--;
194617ab2063SBarry Smith   }
194717ab2063SBarry Smith   while (its--) {
194817ab2063SBarry Smith     if (flag & SOR_FORWARD_SWEEP || flag & SOR_LOCAL_FORWARD_SWEEP) {
194917ab2063SBarry Smith       for (i=0; i<m; i++) {
1950b19a5dc2SMark Adams         /* lower */
1951b19a5dc2SMark Adams         n   = diag[i] - a->i[i];
1952ed480e8bSBarry Smith         idx = a->j + a->i[i];
1953ed480e8bSBarry Smith         v   = a->a + a->i[i];
195417ab2063SBarry Smith         sum = b[i];
1955e6d1f457SBarry Smith         PetscSparseDenseMinusDot(sum,x,v,idx,n);
1956b19a5dc2SMark Adams         t[i] = sum;             /* save application of the lower-triangular part */
1957b19a5dc2SMark Adams         /* upper */
1958b19a5dc2SMark Adams         n   = a->i[i+1] - diag[i] - 1;
1959b19a5dc2SMark Adams         idx = a->j + diag[i] + 1;
1960b19a5dc2SMark Adams         v   = a->a + diag[i] + 1;
1961b19a5dc2SMark Adams         PetscSparseDenseMinusDot(sum,x,v,idx,n);
1962b19a5dc2SMark Adams         x[i] = (1. - omega)*x[i] + sum*idiag[i]; /* omega in idiag */
196317ab2063SBarry Smith       }
1964b19a5dc2SMark Adams       xb   = t;
19659f863219SBarry Smith       ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr);
1966b19a5dc2SMark Adams     } else xb = b;
196717ab2063SBarry Smith     if (flag & SOR_BACKWARD_SWEEP || flag & SOR_LOCAL_BACKWARD_SWEEP) {
196817ab2063SBarry Smith       for (i=m-1; i>=0; i--) {
1969b19a5dc2SMark Adams         sum = xb[i];
1970b19a5dc2SMark Adams         if (xb == b) {
1971b19a5dc2SMark Adams           /* whole matrix (no checkpointing available) */
1972416022c9SBarry Smith           n   = a->i[i+1] - a->i[i];
1973ed480e8bSBarry Smith           idx = a->j + a->i[i];
1974ed480e8bSBarry Smith           v   = a->a + a->i[i];
1975e6d1f457SBarry Smith           PetscSparseDenseMinusDot(sum,x,v,idx,n);
1976ed480e8bSBarry Smith           x[i] = (1. - omega)*x[i] + (sum + mdiag[i]*x[i])*idiag[i];
1977b19a5dc2SMark Adams         } else { /* lower-triangular part has been saved, so only apply upper-triangular */
1978b19a5dc2SMark Adams           n   = a->i[i+1] - diag[i] - 1;
1979b19a5dc2SMark Adams           idx = a->j + diag[i] + 1;
1980b19a5dc2SMark Adams           v   = a->a + diag[i] + 1;
1981b19a5dc2SMark Adams           PetscSparseDenseMinusDot(sum,x,v,idx,n);
1982b19a5dc2SMark Adams           x[i] = (1. - omega)*x[i] + sum*idiag[i];  /* omega in idiag */
198317ab2063SBarry Smith         }
1984b19a5dc2SMark Adams       }
1985b19a5dc2SMark Adams       if (xb == b) {
19869f863219SBarry Smith         ierr = PetscLogFlops(2.0*a->nz);CHKERRQ(ierr);
1987b19a5dc2SMark Adams       } else {
1988b19a5dc2SMark Adams         ierr = PetscLogFlops(a->nz);CHKERRQ(ierr); /* assumes 1/2 in upper */
1989b19a5dc2SMark Adams       }
199017ab2063SBarry Smith     }
199117ab2063SBarry Smith   }
19921ebc52fbSHong Zhang   ierr = VecRestoreArray(xx,&x);CHKERRQ(ierr);
19933649974fSBarry Smith   ierr = VecRestoreArrayRead(bb,&b);CHKERRQ(ierr);
1994365a8a9eSBarry Smith   PetscFunctionReturn(0);
199517ab2063SBarry Smith }
199617ab2063SBarry Smith 
19972af78befSBarry Smith 
1998dfbe8321SBarry Smith PetscErrorCode MatGetInfo_SeqAIJ(Mat A,MatInfoType flag,MatInfo *info)
199917ab2063SBarry Smith {
2000416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data;
20014e220ebcSLois Curfman McInnes 
20023a40ed3dSBarry Smith   PetscFunctionBegin;
20034e220ebcSLois Curfman McInnes   info->block_size   = 1.0;
20043966268fSBarry Smith   info->nz_allocated = a->maxnz;
20053966268fSBarry Smith   info->nz_used      = a->nz;
20063966268fSBarry Smith   info->nz_unneeded  = (a->maxnz - a->nz);
20073966268fSBarry Smith   info->assemblies   = A->num_ass;
20083966268fSBarry Smith   info->mallocs      = A->info.mallocs;
20097adad957SLisandro Dalcin   info->memory       = ((PetscObject)A)->mem;
2010d5f3da31SBarry Smith   if (A->factortype) {
20114e220ebcSLois Curfman McInnes     info->fill_ratio_given  = A->info.fill_ratio_given;
20124e220ebcSLois Curfman McInnes     info->fill_ratio_needed = A->info.fill_ratio_needed;
20134e220ebcSLois Curfman McInnes     info->factor_mallocs    = A->info.factor_mallocs;
20144e220ebcSLois Curfman McInnes   } else {
20154e220ebcSLois Curfman McInnes     info->fill_ratio_given  = 0;
20164e220ebcSLois Curfman McInnes     info->fill_ratio_needed = 0;
20174e220ebcSLois Curfman McInnes     info->factor_mallocs    = 0;
20184e220ebcSLois Curfman McInnes   }
20193a40ed3dSBarry Smith   PetscFunctionReturn(0);
202017ab2063SBarry Smith }
202117ab2063SBarry Smith 
20222b40b63fSBarry Smith PetscErrorCode MatZeroRows_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b)
202317ab2063SBarry Smith {
2024416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
2025c7da8527SEric Chamberland   PetscInt          i,m = A->rmap->n - 1;
20266849ba73SBarry Smith   PetscErrorCode    ierr;
202797b48c8fSBarry Smith   const PetscScalar *xx;
202897b48c8fSBarry Smith   PetscScalar       *bb;
2029c7da8527SEric Chamberland   PetscInt          d = 0;
203017ab2063SBarry Smith 
20313a40ed3dSBarry Smith   PetscFunctionBegin;
203297b48c8fSBarry Smith   if (x && b) {
203397b48c8fSBarry Smith     ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr);
203497b48c8fSBarry Smith     ierr = VecGetArray(b,&bb);CHKERRQ(ierr);
203597b48c8fSBarry Smith     for (i=0; i<N; i++) {
203697b48c8fSBarry Smith       if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]);
2037447d62f5SStefano Zampini       if (rows[i] >= A->cmap->n) continue;
203897b48c8fSBarry Smith       bb[rows[i]] = diag*xx[rows[i]];
203997b48c8fSBarry Smith     }
204097b48c8fSBarry Smith     ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr);
204197b48c8fSBarry Smith     ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr);
204297b48c8fSBarry Smith   }
204397b48c8fSBarry Smith 
2044a9817697SBarry Smith   if (a->keepnonzeropattern) {
2045f1e2ffcdSBarry Smith     for (i=0; i<N; i++) {
2046e32f2f54SBarry Smith       if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]);
2047580bdb30SBarry Smith       ierr = PetscArrayzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]);CHKERRQ(ierr);
2048f1e2ffcdSBarry Smith     }
2049f4df32b1SMatthew Knepley     if (diag != 0.0) {
2050c7da8527SEric Chamberland       for (i=0; i<N; i++) {
2051c7da8527SEric Chamberland         d = rows[i];
2052447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
2053c7da8527SEric Chamberland         if (a->diag[d] >= a->i[d+1]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in the zeroed row %D",d);
2054c7da8527SEric Chamberland       }
2055f1e2ffcdSBarry Smith       for (i=0; i<N; i++) {
2056447d62f5SStefano Zampini         if (rows[i] >= A->cmap->n) continue;
2057f4df32b1SMatthew Knepley         a->a[a->diag[rows[i]]] = diag;
2058f1e2ffcdSBarry Smith       }
2059f1e2ffcdSBarry Smith     }
2060f1e2ffcdSBarry Smith   } else {
2061f4df32b1SMatthew Knepley     if (diag != 0.0) {
206217ab2063SBarry Smith       for (i=0; i<N; i++) {
2063e32f2f54SBarry Smith         if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]);
20647ae801bdSBarry Smith         if (a->ilen[rows[i]] > 0) {
2065447d62f5SStefano Zampini 	  if (rows[i] >= A->cmap->n) {
2066447d62f5SStefano Zampini             a->ilen[rows[i]] = 0;
2067447d62f5SStefano Zampini           } else {
2068416022c9SBarry Smith             a->ilen[rows[i]]    = 1;
2069f4df32b1SMatthew Knepley             a->a[a->i[rows[i]]] = diag;
2070bfeeae90SHong Zhang             a->j[a->i[rows[i]]] = rows[i];
2071447d62f5SStefano Zampini           }
2072447d62f5SStefano Zampini         } else if (rows[i] < A->cmap->n) { /* in case row was completely empty */
2073f4df32b1SMatthew Knepley           ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr);
207417ab2063SBarry Smith         }
207517ab2063SBarry Smith       }
20763a40ed3dSBarry Smith     } else {
207717ab2063SBarry Smith       for (i=0; i<N; i++) {
2078e32f2f54SBarry Smith         if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]);
2079416022c9SBarry Smith         a->ilen[rows[i]] = 0;
208017ab2063SBarry Smith       }
208117ab2063SBarry Smith     }
2082e56f5c9eSBarry Smith     A->nonzerostate++;
2083f1e2ffcdSBarry Smith   }
2084e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
2085c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU;
2086e2cf4d64SStefano Zampini #endif
20874099cc6bSBarry Smith   ierr = (*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20883a40ed3dSBarry Smith   PetscFunctionReturn(0);
208917ab2063SBarry Smith }
209017ab2063SBarry Smith 
20916e169961SBarry Smith PetscErrorCode MatZeroRowsColumns_SeqAIJ(Mat A,PetscInt N,const PetscInt rows[],PetscScalar diag,Vec x,Vec b)
20926e169961SBarry Smith {
20936e169961SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
20946e169961SBarry Smith   PetscInt          i,j,m = A->rmap->n - 1,d = 0;
20956e169961SBarry Smith   PetscErrorCode    ierr;
20962b40b63fSBarry Smith   PetscBool         missing,*zeroed,vecs = PETSC_FALSE;
20976e169961SBarry Smith   const PetscScalar *xx;
20986e169961SBarry Smith   PetscScalar       *bb;
20996e169961SBarry Smith 
21006e169961SBarry Smith   PetscFunctionBegin;
21016e169961SBarry Smith   if (x && b) {
21026e169961SBarry Smith     ierr = VecGetArrayRead(x,&xx);CHKERRQ(ierr);
21036e169961SBarry Smith     ierr = VecGetArray(b,&bb);CHKERRQ(ierr);
21042b40b63fSBarry Smith     vecs = PETSC_TRUE;
21056e169961SBarry Smith   }
21061795a4d1SJed Brown   ierr = PetscCalloc1(A->rmap->n,&zeroed);CHKERRQ(ierr);
21076e169961SBarry Smith   for (i=0; i<N; i++) {
21086e169961SBarry Smith     if (rows[i] < 0 || rows[i] > m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"row %D out of range", rows[i]);
2109580bdb30SBarry Smith     ierr = PetscArrayzero(&a->a[a->i[rows[i]]],a->ilen[rows[i]]);CHKERRQ(ierr);
21102205254eSKarl Rupp 
21116e169961SBarry Smith     zeroed[rows[i]] = PETSC_TRUE;
21126e169961SBarry Smith   }
21136e169961SBarry Smith   for (i=0; i<A->rmap->n; i++) {
21146e169961SBarry Smith     if (!zeroed[i]) {
21156e169961SBarry Smith       for (j=a->i[i]; j<a->i[i+1]; j++) {
21164cf107fdSStefano Zampini         if (a->j[j] < A->rmap->n && zeroed[a->j[j]]) {
21172b40b63fSBarry Smith           if (vecs) bb[i] -= a->a[j]*xx[a->j[j]];
21186e169961SBarry Smith           a->a[j] = 0.0;
21196e169961SBarry Smith         }
21206e169961SBarry Smith       }
21214cf107fdSStefano Zampini     } else if (vecs && i < A->cmap->N) bb[i] = diag*xx[i];
21226e169961SBarry Smith   }
21236e169961SBarry Smith   if (x && b) {
21246e169961SBarry Smith     ierr = VecRestoreArrayRead(x,&xx);CHKERRQ(ierr);
21256e169961SBarry Smith     ierr = VecRestoreArray(b,&bb);CHKERRQ(ierr);
21266e169961SBarry Smith   }
21276e169961SBarry Smith   ierr = PetscFree(zeroed);CHKERRQ(ierr);
21286e169961SBarry Smith   if (diag != 0.0) {
21296e169961SBarry Smith     ierr = MatMissingDiagonal_SeqAIJ(A,&missing,&d);CHKERRQ(ierr);
21301d5a398dSstefano_zampini     if (missing) {
21311d5a398dSstefano_zampini       for (i=0; i<N; i++) {
21324cf107fdSStefano Zampini         if (rows[i] >= A->cmap->N) continue;
21334cf107fdSStefano Zampini         if (a->nonew && rows[i] >= d) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Matrix is missing diagonal entry in row %D (%D)",d,rows[i]);
21341d5a398dSstefano_zampini         ierr = MatSetValues_SeqAIJ(A,1,&rows[i],1,&rows[i],&diag,INSERT_VALUES);CHKERRQ(ierr);
21351d5a398dSstefano_zampini       }
21361d5a398dSstefano_zampini     } else {
21376e169961SBarry Smith       for (i=0; i<N; i++) {
21386e169961SBarry Smith         a->a[a->diag[rows[i]]] = diag;
21396e169961SBarry Smith       }
21406e169961SBarry Smith     }
21411d5a398dSstefano_zampini   }
2142e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
2143c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU;
2144e2cf4d64SStefano Zampini #endif
21454099cc6bSBarry Smith   ierr = (*A->ops->assemblyend)(A,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
21466e169961SBarry Smith   PetscFunctionReturn(0);
21476e169961SBarry Smith }
21486e169961SBarry Smith 
2149a77337e4SBarry Smith PetscErrorCode MatGetRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v)
215017ab2063SBarry Smith {
2151416022c9SBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data;
215297f1f81fSBarry Smith   PetscInt   *itmp;
215317ab2063SBarry Smith 
21543a40ed3dSBarry Smith   PetscFunctionBegin;
2155e32f2f54SBarry Smith   if (row < 0 || row >= A->rmap->n) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Row %D out of range",row);
215617ab2063SBarry Smith 
2157416022c9SBarry Smith   *nz = a->i[row+1] - a->i[row];
2158bfeeae90SHong Zhang   if (v) *v = a->a + a->i[row];
215917ab2063SBarry Smith   if (idx) {
2160bfeeae90SHong Zhang     itmp = a->j + a->i[row];
216126fbe8dcSKarl Rupp     if (*nz) *idx = itmp;
216217ab2063SBarry Smith     else *idx = 0;
216317ab2063SBarry Smith   }
21643a40ed3dSBarry Smith   PetscFunctionReturn(0);
216517ab2063SBarry Smith }
216617ab2063SBarry Smith 
2167bfeeae90SHong Zhang /* remove this function? */
2168a77337e4SBarry Smith PetscErrorCode MatRestoreRow_SeqAIJ(Mat A,PetscInt row,PetscInt *nz,PetscInt **idx,PetscScalar **v)
216917ab2063SBarry Smith {
21703a40ed3dSBarry Smith   PetscFunctionBegin;
21713a40ed3dSBarry Smith   PetscFunctionReturn(0);
217217ab2063SBarry Smith }
217317ab2063SBarry Smith 
2174dfbe8321SBarry Smith PetscErrorCode MatNorm_SeqAIJ(Mat A,NormType type,PetscReal *nrm)
217517ab2063SBarry Smith {
2176416022c9SBarry Smith   Mat_SeqAIJ     *a  = (Mat_SeqAIJ*)A->data;
217754f21887SBarry Smith   MatScalar      *v  = a->a;
217836db0b34SBarry Smith   PetscReal      sum = 0.0;
21796849ba73SBarry Smith   PetscErrorCode ierr;
218097f1f81fSBarry Smith   PetscInt       i,j;
218117ab2063SBarry Smith 
21823a40ed3dSBarry Smith   PetscFunctionBegin;
218317ab2063SBarry Smith   if (type == NORM_FROBENIUS) {
2184570b7f6dSBarry Smith #if defined(PETSC_USE_REAL___FP16)
2185570b7f6dSBarry Smith     PetscBLASInt one = 1,nz = a->nz;
2186570b7f6dSBarry Smith     *nrm = BLASnrm2_(&nz,v,&one);
2187570b7f6dSBarry Smith #else
2188416022c9SBarry Smith     for (i=0; i<a->nz; i++) {
218936db0b34SBarry Smith       sum += PetscRealPart(PetscConj(*v)*(*v)); v++;
219017ab2063SBarry Smith     }
21918f1a2a5eSBarry Smith     *nrm = PetscSqrtReal(sum);
2192570b7f6dSBarry Smith #endif
219351f70360SJed Brown     ierr = PetscLogFlops(2*a->nz);CHKERRQ(ierr);
21943a40ed3dSBarry Smith   } else if (type == NORM_1) {
219536db0b34SBarry Smith     PetscReal *tmp;
219697f1f81fSBarry Smith     PetscInt  *jj = a->j;
21971795a4d1SJed Brown     ierr = PetscCalloc1(A->cmap->n+1,&tmp);CHKERRQ(ierr);
2198064f8208SBarry Smith     *nrm = 0.0;
2199416022c9SBarry Smith     for (j=0; j<a->nz; j++) {
2200bfeeae90SHong Zhang       tmp[*jj++] += PetscAbsScalar(*v);  v++;
220117ab2063SBarry Smith     }
2202d0f46423SBarry Smith     for (j=0; j<A->cmap->n; j++) {
2203064f8208SBarry Smith       if (tmp[j] > *nrm) *nrm = tmp[j];
220417ab2063SBarry Smith     }
2205606d414cSSatish Balay     ierr = PetscFree(tmp);CHKERRQ(ierr);
220651f70360SJed Brown     ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr);
22073a40ed3dSBarry Smith   } else if (type == NORM_INFINITY) {
2208064f8208SBarry Smith     *nrm = 0.0;
2209d0f46423SBarry Smith     for (j=0; j<A->rmap->n; j++) {
2210bfeeae90SHong Zhang       v   = a->a + a->i[j];
221117ab2063SBarry Smith       sum = 0.0;
2212416022c9SBarry Smith       for (i=0; i<a->i[j+1]-a->i[j]; i++) {
2213cddf8d76SBarry Smith         sum += PetscAbsScalar(*v); v++;
221417ab2063SBarry Smith       }
2215064f8208SBarry Smith       if (sum > *nrm) *nrm = sum;
221617ab2063SBarry Smith     }
221751f70360SJed Brown     ierr = PetscLogFlops(PetscMax(a->nz-1,0));CHKERRQ(ierr);
2218f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"No support for two norm");
22193a40ed3dSBarry Smith   PetscFunctionReturn(0);
222017ab2063SBarry Smith }
222117ab2063SBarry Smith 
22224e938277SHong Zhang /* Merged from MatGetSymbolicTranspose_SeqAIJ() - replace MatGetSymbolicTranspose_SeqAIJ()? */
22234e938277SHong Zhang PetscErrorCode MatTransposeSymbolic_SeqAIJ(Mat A,Mat *B)
22244e938277SHong Zhang {
22254e938277SHong Zhang   PetscErrorCode ierr;
22264e938277SHong Zhang   PetscInt       i,j,anzj;
22274e938277SHong Zhang   Mat_SeqAIJ     *a=(Mat_SeqAIJ*)A->data,*b;
22284e938277SHong Zhang   PetscInt       an=A->cmap->N,am=A->rmap->N;
22294e938277SHong Zhang   PetscInt       *ati,*atj,*atfill,*ai=a->i,*aj=a->j;
22304e938277SHong Zhang 
22314e938277SHong Zhang   PetscFunctionBegin;
22324e938277SHong Zhang   /* Allocate space for symbolic transpose info and work array */
2233854ce69bSBarry Smith   ierr = PetscCalloc1(an+1,&ati);CHKERRQ(ierr);
2234785e854fSJed Brown   ierr = PetscMalloc1(ai[am],&atj);CHKERRQ(ierr);
2235785e854fSJed Brown   ierr = PetscMalloc1(an,&atfill);CHKERRQ(ierr);
22364e938277SHong Zhang 
22374e938277SHong Zhang   /* Walk through aj and count ## of non-zeros in each row of A^T. */
22384e938277SHong Zhang   /* Note: offset by 1 for fast conversion into csr format. */
223926fbe8dcSKarl Rupp   for (i=0;i<ai[am];i++) ati[aj[i]+1] += 1;
22404e938277SHong Zhang   /* Form ati for csr format of A^T. */
224126fbe8dcSKarl Rupp   for (i=0;i<an;i++) ati[i+1] += ati[i];
22424e938277SHong Zhang 
22434e938277SHong Zhang   /* Copy ati into atfill so we have locations of the next free space in atj */
2244580bdb30SBarry Smith   ierr = PetscArraycpy(atfill,ati,an);CHKERRQ(ierr);
22454e938277SHong Zhang 
22464e938277SHong Zhang   /* Walk through A row-wise and mark nonzero entries of A^T. */
22474e938277SHong Zhang   for (i=0;i<am;i++) {
22484e938277SHong Zhang     anzj = ai[i+1] - ai[i];
22494e938277SHong Zhang     for (j=0;j<anzj;j++) {
22504e938277SHong Zhang       atj[atfill[*aj]] = i;
22514e938277SHong Zhang       atfill[*aj++]   += 1;
22524e938277SHong Zhang     }
22534e938277SHong Zhang   }
22544e938277SHong Zhang 
22554e938277SHong Zhang   /* Clean up temporary space and complete requests. */
22564e938277SHong Zhang   ierr = PetscFree(atfill);CHKERRQ(ierr);
2257ce94432eSBarry Smith   ierr = MatCreateSeqAIJWithArrays(PetscObjectComm((PetscObject)A),an,am,ati,atj,NULL,B);CHKERRQ(ierr);
225833d57670SJed Brown   ierr = MatSetBlockSizes(*B,PetscAbs(A->cmap->bs),PetscAbs(A->rmap->bs));CHKERRQ(ierr);
2259b5bb3eecSMark Adams   ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr);
2260a2f3521dSMark F. Adams 
22614e938277SHong Zhang   b          = (Mat_SeqAIJ*)((*B)->data);
22624e938277SHong Zhang   b->free_a  = PETSC_FALSE;
22634e938277SHong Zhang   b->free_ij = PETSC_TRUE;
22644e938277SHong Zhang   b->nonew   = 0;
22654e938277SHong Zhang   PetscFunctionReturn(0);
22664e938277SHong Zhang }
22674e938277SHong Zhang 
22687087cfbeSBarry Smith PetscErrorCode  MatIsTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool  *f)
2269cd0d46ebSvictorle {
22703d3eaba7SBarry Smith   Mat_SeqAIJ     *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data;
227154f21887SBarry Smith   PetscInt       *adx,*bdx,*aii,*bii,*aptr,*bptr;
227254f21887SBarry Smith   MatScalar      *va,*vb;
22736849ba73SBarry Smith   PetscErrorCode ierr;
227497f1f81fSBarry Smith   PetscInt       ma,na,mb,nb, i;
2275cd0d46ebSvictorle 
2276cd0d46ebSvictorle   PetscFunctionBegin;
2277cd0d46ebSvictorle   ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr);
2278cd0d46ebSvictorle   ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr);
22795485867bSBarry Smith   if (ma!=nb || na!=mb) {
22805485867bSBarry Smith     *f = PETSC_FALSE;
22815485867bSBarry Smith     PetscFunctionReturn(0);
22825485867bSBarry Smith   }
2283cd0d46ebSvictorle   aii  = aij->i; bii = bij->i;
2284cd0d46ebSvictorle   adx  = aij->j; bdx = bij->j;
2285cd0d46ebSvictorle   va   = aij->a; vb = bij->a;
2286785e854fSJed Brown   ierr = PetscMalloc1(ma,&aptr);CHKERRQ(ierr);
2287785e854fSJed Brown   ierr = PetscMalloc1(mb,&bptr);CHKERRQ(ierr);
2288cd0d46ebSvictorle   for (i=0; i<ma; i++) aptr[i] = aii[i];
2289cd0d46ebSvictorle   for (i=0; i<mb; i++) bptr[i] = bii[i];
2290cd0d46ebSvictorle 
2291cd0d46ebSvictorle   *f = PETSC_TRUE;
2292cd0d46ebSvictorle   for (i=0; i<ma; i++) {
2293cd0d46ebSvictorle     while (aptr[i]<aii[i+1]) {
229497f1f81fSBarry Smith       PetscInt    idc,idr;
22955485867bSBarry Smith       PetscScalar vc,vr;
2296cd0d46ebSvictorle       /* column/row index/value */
22975485867bSBarry Smith       idc = adx[aptr[i]];
22985485867bSBarry Smith       idr = bdx[bptr[idc]];
22995485867bSBarry Smith       vc  = va[aptr[i]];
23005485867bSBarry Smith       vr  = vb[bptr[idc]];
23015485867bSBarry Smith       if (i!=idr || PetscAbsScalar(vc-vr) > tol) {
23025485867bSBarry Smith         *f = PETSC_FALSE;
23035485867bSBarry Smith         goto done;
2304cd0d46ebSvictorle       } else {
23055485867bSBarry Smith         aptr[i]++;
23065485867bSBarry Smith         if (B || i!=idc) bptr[idc]++;
2307cd0d46ebSvictorle       }
2308cd0d46ebSvictorle     }
2309cd0d46ebSvictorle   }
2310cd0d46ebSvictorle done:
2311cd0d46ebSvictorle   ierr = PetscFree(aptr);CHKERRQ(ierr);
23123aeef889SHong Zhang   ierr = PetscFree(bptr);CHKERRQ(ierr);
2313cd0d46ebSvictorle   PetscFunctionReturn(0);
2314cd0d46ebSvictorle }
2315cd0d46ebSvictorle 
23167087cfbeSBarry Smith PetscErrorCode  MatIsHermitianTranspose_SeqAIJ(Mat A,Mat B,PetscReal tol,PetscBool  *f)
23171cbb95d3SBarry Smith {
23183d3eaba7SBarry Smith   Mat_SeqAIJ     *aij = (Mat_SeqAIJ*) A->data,*bij = (Mat_SeqAIJ*) B->data;
231954f21887SBarry Smith   PetscInt       *adx,*bdx,*aii,*bii,*aptr,*bptr;
232054f21887SBarry Smith   MatScalar      *va,*vb;
23211cbb95d3SBarry Smith   PetscErrorCode ierr;
23221cbb95d3SBarry Smith   PetscInt       ma,na,mb,nb, i;
23231cbb95d3SBarry Smith 
23241cbb95d3SBarry Smith   PetscFunctionBegin;
23251cbb95d3SBarry Smith   ierr = MatGetSize(A,&ma,&na);CHKERRQ(ierr);
23261cbb95d3SBarry Smith   ierr = MatGetSize(B,&mb,&nb);CHKERRQ(ierr);
23271cbb95d3SBarry Smith   if (ma!=nb || na!=mb) {
23281cbb95d3SBarry Smith     *f = PETSC_FALSE;
23291cbb95d3SBarry Smith     PetscFunctionReturn(0);
23301cbb95d3SBarry Smith   }
23311cbb95d3SBarry Smith   aii  = aij->i; bii = bij->i;
23321cbb95d3SBarry Smith   adx  = aij->j; bdx = bij->j;
23331cbb95d3SBarry Smith   va   = aij->a; vb = bij->a;
2334785e854fSJed Brown   ierr = PetscMalloc1(ma,&aptr);CHKERRQ(ierr);
2335785e854fSJed Brown   ierr = PetscMalloc1(mb,&bptr);CHKERRQ(ierr);
23361cbb95d3SBarry Smith   for (i=0; i<ma; i++) aptr[i] = aii[i];
23371cbb95d3SBarry Smith   for (i=0; i<mb; i++) bptr[i] = bii[i];
23381cbb95d3SBarry Smith 
23391cbb95d3SBarry Smith   *f = PETSC_TRUE;
23401cbb95d3SBarry Smith   for (i=0; i<ma; i++) {
23411cbb95d3SBarry Smith     while (aptr[i]<aii[i+1]) {
23421cbb95d3SBarry Smith       PetscInt    idc,idr;
23431cbb95d3SBarry Smith       PetscScalar vc,vr;
23441cbb95d3SBarry Smith       /* column/row index/value */
23451cbb95d3SBarry Smith       idc = adx[aptr[i]];
23461cbb95d3SBarry Smith       idr = bdx[bptr[idc]];
23471cbb95d3SBarry Smith       vc  = va[aptr[i]];
23481cbb95d3SBarry Smith       vr  = vb[bptr[idc]];
23491cbb95d3SBarry Smith       if (i!=idr || PetscAbsScalar(vc-PetscConj(vr)) > tol) {
23501cbb95d3SBarry Smith         *f = PETSC_FALSE;
23511cbb95d3SBarry Smith         goto done;
23521cbb95d3SBarry Smith       } else {
23531cbb95d3SBarry Smith         aptr[i]++;
23541cbb95d3SBarry Smith         if (B || i!=idc) bptr[idc]++;
23551cbb95d3SBarry Smith       }
23561cbb95d3SBarry Smith     }
23571cbb95d3SBarry Smith   }
23581cbb95d3SBarry Smith done:
23591cbb95d3SBarry Smith   ierr = PetscFree(aptr);CHKERRQ(ierr);
23601cbb95d3SBarry Smith   ierr = PetscFree(bptr);CHKERRQ(ierr);
23611cbb95d3SBarry Smith   PetscFunctionReturn(0);
23621cbb95d3SBarry Smith }
23631cbb95d3SBarry Smith 
2364ace3abfcSBarry Smith PetscErrorCode MatIsSymmetric_SeqAIJ(Mat A,PetscReal tol,PetscBool  *f)
23659e29f15eSvictorle {
2366dfbe8321SBarry Smith   PetscErrorCode ierr;
23676e111a19SKarl Rupp 
23689e29f15eSvictorle   PetscFunctionBegin;
23695485867bSBarry Smith   ierr = MatIsTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr);
23709e29f15eSvictorle   PetscFunctionReturn(0);
23719e29f15eSvictorle }
23729e29f15eSvictorle 
2373ace3abfcSBarry Smith PetscErrorCode MatIsHermitian_SeqAIJ(Mat A,PetscReal tol,PetscBool  *f)
23741cbb95d3SBarry Smith {
23751cbb95d3SBarry Smith   PetscErrorCode ierr;
23766e111a19SKarl Rupp 
23771cbb95d3SBarry Smith   PetscFunctionBegin;
23781cbb95d3SBarry Smith   ierr = MatIsHermitianTranspose_SeqAIJ(A,A,tol,f);CHKERRQ(ierr);
23791cbb95d3SBarry Smith   PetscFunctionReturn(0);
23801cbb95d3SBarry Smith }
23811cbb95d3SBarry Smith 
2382dfbe8321SBarry Smith PetscErrorCode MatDiagonalScale_SeqAIJ(Mat A,Vec ll,Vec rr)
238317ab2063SBarry Smith {
2384416022c9SBarry Smith   Mat_SeqAIJ        *a = (Mat_SeqAIJ*)A->data;
2385fff8e43fSBarry Smith   const PetscScalar *l,*r;
2386fff8e43fSBarry Smith   PetscScalar       x;
238754f21887SBarry Smith   MatScalar         *v;
2388dfbe8321SBarry Smith   PetscErrorCode    ierr;
2389fff8e43fSBarry Smith   PetscInt          i,j,m = A->rmap->n,n = A->cmap->n,M,nz = a->nz;
2390fff8e43fSBarry Smith   const PetscInt    *jj;
239117ab2063SBarry Smith 
23923a40ed3dSBarry Smith   PetscFunctionBegin;
239317ab2063SBarry Smith   if (ll) {
23943ea7c6a1SSatish Balay     /* The local size is used so that VecMPI can be passed to this routine
23953ea7c6a1SSatish Balay        by MatDiagonalScale_MPIAIJ */
2396e1311b90SBarry Smith     ierr = VecGetLocalSize(ll,&m);CHKERRQ(ierr);
2397e32f2f54SBarry Smith     if (m != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Left scaling vector wrong length");
2398fff8e43fSBarry Smith     ierr = VecGetArrayRead(ll,&l);CHKERRQ(ierr);
2399416022c9SBarry Smith     v    = a->a;
240017ab2063SBarry Smith     for (i=0; i<m; i++) {
240117ab2063SBarry Smith       x = l[i];
2402416022c9SBarry Smith       M = a->i[i+1] - a->i[i];
24032205254eSKarl Rupp       for (j=0; j<M; j++) (*v++) *= x;
240417ab2063SBarry Smith     }
2405fff8e43fSBarry Smith     ierr = VecRestoreArrayRead(ll,&l);CHKERRQ(ierr);
2406efee365bSSatish Balay     ierr = PetscLogFlops(nz);CHKERRQ(ierr);
240717ab2063SBarry Smith   }
240817ab2063SBarry Smith   if (rr) {
2409e1311b90SBarry Smith     ierr = VecGetLocalSize(rr,&n);CHKERRQ(ierr);
2410e32f2f54SBarry Smith     if (n != A->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Right scaling vector wrong length");
2411fff8e43fSBarry Smith     ierr = VecGetArrayRead(rr,&r);CHKERRQ(ierr);
2412416022c9SBarry Smith     v    = a->a; jj = a->j;
24132205254eSKarl Rupp     for (i=0; i<nz; i++) (*v++) *= r[*jj++];
2414fff8e43fSBarry Smith     ierr = VecRestoreArrayRead(rr,&r);CHKERRQ(ierr);
2415efee365bSSatish Balay     ierr = PetscLogFlops(nz);CHKERRQ(ierr);
241617ab2063SBarry Smith   }
2417acf2f550SJed Brown   ierr = MatSeqAIJInvalidateDiagonal(A);CHKERRQ(ierr);
2418e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
2419c70f7ee4SJunchao Zhang   if (A->offloadmask != PETSC_OFFLOAD_UNALLOCATED) A->offloadmask = PETSC_OFFLOAD_CPU;
2420e2cf4d64SStefano Zampini #endif
24213a40ed3dSBarry Smith   PetscFunctionReturn(0);
242217ab2063SBarry Smith }
242317ab2063SBarry Smith 
24247dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrix_SeqAIJ(Mat A,IS isrow,IS iscol,PetscInt csize,MatReuse scall,Mat *B)
242517ab2063SBarry Smith {
2426db02288aSLois Curfman McInnes   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data,*c;
24276849ba73SBarry Smith   PetscErrorCode ierr;
2428d0f46423SBarry Smith   PetscInt       *smap,i,k,kstart,kend,oldcols = A->cmap->n,*lens;
242997f1f81fSBarry Smith   PetscInt       row,mat_i,*mat_j,tcol,first,step,*mat_ilen,sum,lensi;
24305d0c19d7SBarry Smith   const PetscInt *irow,*icol;
24315d0c19d7SBarry Smith   PetscInt       nrows,ncols;
243297f1f81fSBarry Smith   PetscInt       *starts,*j_new,*i_new,*aj = a->j,*ai = a->i,ii,*ailen = a->ilen;
243354f21887SBarry Smith   MatScalar      *a_new,*mat_a;
2434416022c9SBarry Smith   Mat            C;
2435cdc6f3adSToby Isaac   PetscBool      stride;
243617ab2063SBarry Smith 
24373a40ed3dSBarry Smith   PetscFunctionBegin;
243899141d43SSatish Balay 
243917ab2063SBarry Smith   ierr = ISGetIndices(isrow,&irow);CHKERRQ(ierr);
2440b9b97703SBarry Smith   ierr = ISGetLocalSize(isrow,&nrows);CHKERRQ(ierr);
2441b9b97703SBarry Smith   ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr);
244217ab2063SBarry Smith 
2443251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)iscol,ISSTRIDE,&stride);CHKERRQ(ierr);
2444ff718158SBarry Smith   if (stride) {
2445ff718158SBarry Smith     ierr = ISStrideGetInfo(iscol,&first,&step);CHKERRQ(ierr);
2446ff718158SBarry Smith   } else {
2447ff718158SBarry Smith     first = 0;
2448ff718158SBarry Smith     step  = 0;
2449ff718158SBarry Smith   }
2450fee21e36SBarry Smith   if (stride && step == 1) {
245102834360SBarry Smith     /* special case of contiguous rows */
2452dcca6d9dSJed Brown     ierr = PetscMalloc2(nrows,&lens,nrows,&starts);CHKERRQ(ierr);
245302834360SBarry Smith     /* loop over new rows determining lens and starting points */
245402834360SBarry Smith     for (i=0; i<nrows; i++) {
2455bfeeae90SHong Zhang       kstart = ai[irow[i]];
2456a2744918SBarry Smith       kend   = kstart + ailen[irow[i]];
2457a91a9bebSLisandro Dalcin       starts[i] = kstart;
245802834360SBarry Smith       for (k=kstart; k<kend; k++) {
2459bfeeae90SHong Zhang         if (aj[k] >= first) {
246002834360SBarry Smith           starts[i] = k;
246102834360SBarry Smith           break;
246202834360SBarry Smith         }
246302834360SBarry Smith       }
2464a2744918SBarry Smith       sum = 0;
246502834360SBarry Smith       while (k < kend) {
2466bfeeae90SHong Zhang         if (aj[k++] >= first+ncols) break;
2467a2744918SBarry Smith         sum++;
246802834360SBarry Smith       }
2469a2744918SBarry Smith       lens[i] = sum;
247002834360SBarry Smith     }
247102834360SBarry Smith     /* create submatrix */
2472cddf8d76SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
247397f1f81fSBarry Smith       PetscInt n_cols,n_rows;
247408480c60SBarry Smith       ierr = MatGetSize(*B,&n_rows,&n_cols);CHKERRQ(ierr);
2475e32f2f54SBarry Smith       if (n_rows != nrows || n_cols != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Reused submatrix wrong size");
2476d8ced48eSBarry Smith       ierr = MatZeroEntries(*B);CHKERRQ(ierr);
247708480c60SBarry Smith       C    = *B;
24783a40ed3dSBarry Smith     } else {
24793bef6203SJed Brown       PetscInt rbs,cbs;
2480ce94432eSBarry Smith       ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr);
2481f69a0ea3SMatthew Knepley       ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr);
24823bef6203SJed Brown       ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr);
24833bef6203SJed Brown       ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr);
24843bef6203SJed Brown       ierr = MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr);
24857adad957SLisandro Dalcin       ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr);
2486ab93d7beSBarry Smith       ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr);
248708480c60SBarry Smith     }
2488db02288aSLois Curfman McInnes     c = (Mat_SeqAIJ*)C->data;
2489db02288aSLois Curfman McInnes 
249002834360SBarry Smith     /* loop over rows inserting into submatrix */
2491db02288aSLois Curfman McInnes     a_new = c->a;
2492db02288aSLois Curfman McInnes     j_new = c->j;
2493db02288aSLois Curfman McInnes     i_new = c->i;
2494bfeeae90SHong Zhang 
249502834360SBarry Smith     for (i=0; i<nrows; i++) {
2496a2744918SBarry Smith       ii    = starts[i];
2497a2744918SBarry Smith       lensi = lens[i];
2498a2744918SBarry Smith       for (k=0; k<lensi; k++) {
2499a2744918SBarry Smith         *j_new++ = aj[ii+k] - first;
250002834360SBarry Smith       }
2501580bdb30SBarry Smith       ierr       = PetscArraycpy(a_new,a->a + starts[i],lensi);CHKERRQ(ierr);
2502a2744918SBarry Smith       a_new     += lensi;
2503a2744918SBarry Smith       i_new[i+1] = i_new[i] + lensi;
2504a2744918SBarry Smith       c->ilen[i] = lensi;
250502834360SBarry Smith     }
25060e83c824SBarry Smith     ierr = PetscFree2(lens,starts);CHKERRQ(ierr);
25073a40ed3dSBarry Smith   } else {
250802834360SBarry Smith     ierr = ISGetIndices(iscol,&icol);CHKERRQ(ierr);
25091795a4d1SJed Brown     ierr = PetscCalloc1(oldcols,&smap);CHKERRQ(ierr);
2510854ce69bSBarry Smith     ierr = PetscMalloc1(1+nrows,&lens);CHKERRQ(ierr);
25114dcab191SBarry Smith     for (i=0; i<ncols; i++) {
2512d9ef940eSSatish Balay       if (PetscUnlikelyDebug(icol[i] >= oldcols)) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Requesting column beyond largest column icol[%D] %D >= A->cmap->n %D",i,icol[i],oldcols);
25134dcab191SBarry Smith       smap[icol[i]] = i+1;
25144dcab191SBarry Smith     }
25154dcab191SBarry Smith 
251602834360SBarry Smith     /* determine lens of each row */
251702834360SBarry Smith     for (i=0; i<nrows; i++) {
2518bfeeae90SHong Zhang       kstart  = ai[irow[i]];
251902834360SBarry Smith       kend    = kstart + a->ilen[irow[i]];
252002834360SBarry Smith       lens[i] = 0;
252102834360SBarry Smith       for (k=kstart; k<kend; k++) {
2522bfeeae90SHong Zhang         if (smap[aj[k]]) {
252302834360SBarry Smith           lens[i]++;
252402834360SBarry Smith         }
252502834360SBarry Smith       }
252602834360SBarry Smith     }
252717ab2063SBarry Smith     /* Create and fill new matrix */
2528a2744918SBarry Smith     if (scall == MAT_REUSE_MATRIX) {
2529ace3abfcSBarry Smith       PetscBool equal;
25300f5bd95cSBarry Smith 
253199141d43SSatish Balay       c = (Mat_SeqAIJ*)((*B)->data);
2532e32f2f54SBarry Smith       if ((*B)->rmap->n  != nrows || (*B)->cmap->n != ncols) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong size");
2533580bdb30SBarry Smith       ierr = PetscArraycmp(c->ilen,lens,(*B)->rmap->n,&equal);CHKERRQ(ierr);
2534f23aa3ddSBarry Smith       if (!equal) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Cannot reuse matrix. wrong no of nonzeros");
2535580bdb30SBarry Smith       ierr = PetscArrayzero(c->ilen,(*B)->rmap->n);CHKERRQ(ierr);
253608480c60SBarry Smith       C    = *B;
25373a40ed3dSBarry Smith     } else {
25383bef6203SJed Brown       PetscInt rbs,cbs;
2539ce94432eSBarry Smith       ierr = MatCreate(PetscObjectComm((PetscObject)A),&C);CHKERRQ(ierr);
2540f69a0ea3SMatthew Knepley       ierr = MatSetSizes(C,nrows,ncols,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr);
25413bef6203SJed Brown       ierr = ISGetBlockSize(isrow,&rbs);CHKERRQ(ierr);
25423bef6203SJed Brown       ierr = ISGetBlockSize(iscol,&cbs);CHKERRQ(ierr);
25433bef6203SJed Brown       ierr = MatSetBlockSizes(C,rbs,cbs);CHKERRQ(ierr);
25447adad957SLisandro Dalcin       ierr = MatSetType(C,((PetscObject)A)->type_name);CHKERRQ(ierr);
2545ab93d7beSBarry Smith       ierr = MatSeqAIJSetPreallocation_SeqAIJ(C,0,lens);CHKERRQ(ierr);
254608480c60SBarry Smith     }
254799141d43SSatish Balay     c = (Mat_SeqAIJ*)(C->data);
254817ab2063SBarry Smith     for (i=0; i<nrows; i++) {
254999141d43SSatish Balay       row      = irow[i];
2550bfeeae90SHong Zhang       kstart   = ai[row];
255199141d43SSatish Balay       kend     = kstart + a->ilen[row];
2552bfeeae90SHong Zhang       mat_i    = c->i[i];
255399141d43SSatish Balay       mat_j    = c->j + mat_i;
255499141d43SSatish Balay       mat_a    = c->a + mat_i;
255599141d43SSatish Balay       mat_ilen = c->ilen + i;
255617ab2063SBarry Smith       for (k=kstart; k<kend; k++) {
2557bfeeae90SHong Zhang         if ((tcol=smap[a->j[k]])) {
2558ed480e8bSBarry Smith           *mat_j++ = tcol - 1;
255999141d43SSatish Balay           *mat_a++ = a->a[k];
256099141d43SSatish Balay           (*mat_ilen)++;
256199141d43SSatish Balay 
256217ab2063SBarry Smith         }
256317ab2063SBarry Smith       }
256417ab2063SBarry Smith     }
256502834360SBarry Smith     /* Free work space */
256602834360SBarry Smith     ierr = ISRestoreIndices(iscol,&icol);CHKERRQ(ierr);
2567606d414cSSatish Balay     ierr = PetscFree(smap);CHKERRQ(ierr);
2568606d414cSSatish Balay     ierr = PetscFree(lens);CHKERRQ(ierr);
2569cdc6f3adSToby Isaac     /* sort */
2570cdc6f3adSToby Isaac     for (i = 0; i < nrows; i++) {
2571cdc6f3adSToby Isaac       PetscInt ilen;
2572cdc6f3adSToby Isaac 
2573cdc6f3adSToby Isaac       mat_i = c->i[i];
2574cdc6f3adSToby Isaac       mat_j = c->j + mat_i;
2575cdc6f3adSToby Isaac       mat_a = c->a + mat_i;
2576cdc6f3adSToby Isaac       ilen  = c->ilen[i];
2577390e1bf2SBarry Smith       ierr  = PetscSortIntWithScalarArray(ilen,mat_j,mat_a);CHKERRQ(ierr);
2578cdc6f3adSToby Isaac     }
257902834360SBarry Smith   }
2580305c6ccfSStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
2581b470e4b4SRichard Tran Mills   ierr = MatBindToCPU(C,A->boundtocpu);CHKERRQ(ierr);
2582305c6ccfSStefano Zampini #endif
25836d4a8577SBarry Smith   ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
25846d4a8577SBarry Smith   ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
258517ab2063SBarry Smith 
258617ab2063SBarry Smith   ierr = ISRestoreIndices(isrow,&irow);CHKERRQ(ierr);
2587416022c9SBarry Smith   *B   = C;
25883a40ed3dSBarry Smith   PetscFunctionReturn(0);
258917ab2063SBarry Smith }
259017ab2063SBarry Smith 
2591fc08c53fSHong Zhang PetscErrorCode  MatGetMultiProcBlock_SeqAIJ(Mat mat,MPI_Comm subComm,MatReuse scall,Mat *subMat)
259282d44351SHong Zhang {
259382d44351SHong Zhang   PetscErrorCode ierr;
259482d44351SHong Zhang   Mat            B;
259582d44351SHong Zhang 
259682d44351SHong Zhang   PetscFunctionBegin;
2597c2d650bdSHong Zhang   if (scall == MAT_INITIAL_MATRIX) {
259882d44351SHong Zhang     ierr    = MatCreate(subComm,&B);CHKERRQ(ierr);
259982d44351SHong Zhang     ierr    = MatSetSizes(B,mat->rmap->n,mat->cmap->n,mat->rmap->n,mat->cmap->n);CHKERRQ(ierr);
260033d57670SJed Brown     ierr    = MatSetBlockSizesFromMats(B,mat,mat);CHKERRQ(ierr);
260182d44351SHong Zhang     ierr    = MatSetType(B,MATSEQAIJ);CHKERRQ(ierr);
260282d44351SHong Zhang     ierr    = MatDuplicateNoCreate_SeqAIJ(B,mat,MAT_COPY_VALUES,PETSC_TRUE);CHKERRQ(ierr);
260382d44351SHong Zhang     *subMat = B;
2604c2d650bdSHong Zhang   } else {
2605c2d650bdSHong Zhang     ierr = MatCopy_SeqAIJ(mat,*subMat,SAME_NONZERO_PATTERN);CHKERRQ(ierr);
2606c2d650bdSHong Zhang   }
260782d44351SHong Zhang   PetscFunctionReturn(0);
260882d44351SHong Zhang }
260982d44351SHong Zhang 
26109a625307SHong Zhang PetscErrorCode MatILUFactor_SeqAIJ(Mat inA,IS row,IS col,const MatFactorInfo *info)
2611a871dcd8SBarry Smith {
261263b91edcSBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)inA->data;
2613dfbe8321SBarry Smith   PetscErrorCode ierr;
261463b91edcSBarry Smith   Mat            outA;
2615ace3abfcSBarry Smith   PetscBool      row_identity,col_identity;
261663b91edcSBarry Smith 
26173a40ed3dSBarry Smith   PetscFunctionBegin;
2618e32f2f54SBarry Smith   if (info->levels != 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Only levels=0 supported for in-place ilu");
26191df811f5SHong Zhang 
2620b8a78c4aSBarry Smith   ierr = ISIdentity(row,&row_identity);CHKERRQ(ierr);
2621b8a78c4aSBarry Smith   ierr = ISIdentity(col,&col_identity);CHKERRQ(ierr);
2622a871dcd8SBarry Smith 
262363b91edcSBarry Smith   outA             = inA;
2624d5f3da31SBarry Smith   outA->factortype = MAT_FACTOR_LU;
2625f6224b95SHong Zhang   ierr = PetscFree(inA->solvertype);CHKERRQ(ierr);
2626f6224b95SHong Zhang   ierr = PetscStrallocpy(MATSOLVERPETSC,&inA->solvertype);CHKERRQ(ierr);
26272205254eSKarl Rupp 
2628c38d4ed2SBarry Smith   ierr = PetscObjectReference((PetscObject)row);CHKERRQ(ierr);
26296bf464f9SBarry Smith   ierr = ISDestroy(&a->row);CHKERRQ(ierr);
26302205254eSKarl Rupp 
2631c3122656SLisandro Dalcin   a->row = row;
26322205254eSKarl Rupp 
2633c38d4ed2SBarry Smith   ierr = PetscObjectReference((PetscObject)col);CHKERRQ(ierr);
26346bf464f9SBarry Smith   ierr = ISDestroy(&a->col);CHKERRQ(ierr);
26352205254eSKarl Rupp 
2636c3122656SLisandro Dalcin   a->col = col;
263763b91edcSBarry Smith 
263836db0b34SBarry Smith   /* Create the inverse permutation so that it can be used in MatLUFactorNumeric() */
26396bf464f9SBarry Smith   ierr = ISDestroy(&a->icol);CHKERRQ(ierr);
26404c49b128SBarry Smith   ierr = ISInvertPermutation(col,PETSC_DECIDE,&a->icol);CHKERRQ(ierr);
26413bb1ff40SBarry Smith   ierr = PetscLogObjectParent((PetscObject)inA,(PetscObject)a->icol);CHKERRQ(ierr);
2642f0ec6fceSSatish Balay 
264394a9d846SBarry Smith   if (!a->solve_work) { /* this matrix may have been factored before */
2644854ce69bSBarry Smith     ierr = PetscMalloc1(inA->rmap->n+1,&a->solve_work);CHKERRQ(ierr);
26453bb1ff40SBarry Smith     ierr = PetscLogObjectMemory((PetscObject)inA, (inA->rmap->n+1)*sizeof(PetscScalar));CHKERRQ(ierr);
264694a9d846SBarry Smith   }
264763b91edcSBarry Smith 
2648f1e2ffcdSBarry Smith   ierr = MatMarkDiagonal_SeqAIJ(inA);CHKERRQ(ierr);
2649137fb511SHong Zhang   if (row_identity && col_identity) {
2650ad04f41aSHong Zhang     ierr = MatLUFactorNumeric_SeqAIJ_inplace(outA,inA,info);CHKERRQ(ierr);
2651137fb511SHong Zhang   } else {
2652719d5645SBarry Smith     ierr = MatLUFactorNumeric_SeqAIJ_InplaceWithPerm(outA,inA,info);CHKERRQ(ierr);
2653137fb511SHong Zhang   }
26543a40ed3dSBarry Smith   PetscFunctionReturn(0);
2655a871dcd8SBarry Smith }
2656a871dcd8SBarry Smith 
2657f4df32b1SMatthew Knepley PetscErrorCode MatScale_SeqAIJ(Mat inA,PetscScalar alpha)
2658f0b747eeSBarry Smith {
2659f0b747eeSBarry Smith   Mat_SeqAIJ     *a     = (Mat_SeqAIJ*)inA->data;
2660f4df32b1SMatthew Knepley   PetscScalar    oalpha = alpha;
2661efee365bSSatish Balay   PetscErrorCode ierr;
2662c5df96a5SBarry Smith   PetscBLASInt   one = 1,bnz;
26633a40ed3dSBarry Smith 
26643a40ed3dSBarry Smith   PetscFunctionBegin;
2665c5df96a5SBarry Smith   ierr = PetscBLASIntCast(a->nz,&bnz);CHKERRQ(ierr);
26668b83055fSJed Brown   PetscStackCallBLAS("BLASscal",BLASscal_(&bnz,&oalpha,a->a,&one));
2667efee365bSSatish Balay   ierr = PetscLogFlops(a->nz);CHKERRQ(ierr);
2668acf2f550SJed Brown   ierr = MatSeqAIJInvalidateDiagonal(inA);CHKERRQ(ierr);
2669e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
2670c70f7ee4SJunchao Zhang   if (inA->offloadmask != PETSC_OFFLOAD_UNALLOCATED) inA->offloadmask = PETSC_OFFLOAD_CPU;
2671e2cf4d64SStefano Zampini #endif
26723a40ed3dSBarry Smith   PetscFunctionReturn(0);
2673f0b747eeSBarry Smith }
2674f0b747eeSBarry Smith 
2675f68bb481SHong Zhang PetscErrorCode MatDestroySubMatrix_Private(Mat_SubSppt *submatj)
267616b64355SHong Zhang {
267716b64355SHong Zhang   PetscErrorCode ierr;
267816b64355SHong Zhang   PetscInt       i;
267916b64355SHong Zhang 
268016b64355SHong Zhang   PetscFunctionBegin;
268116b64355SHong Zhang   if (!submatj->id) { /* delete data that are linked only to submats[id=0] */
268216b64355SHong Zhang     ierr = PetscFree4(submatj->sbuf1,submatj->ptr,submatj->tmp,submatj->ctr);CHKERRQ(ierr);
268316b64355SHong Zhang 
268416b64355SHong Zhang     for (i=0; i<submatj->nrqr; ++i) {
268516b64355SHong Zhang       ierr = PetscFree(submatj->sbuf2[i]);CHKERRQ(ierr);
268616b64355SHong Zhang     }
268716b64355SHong Zhang     ierr = PetscFree3(submatj->sbuf2,submatj->req_size,submatj->req_source1);CHKERRQ(ierr);
268816b64355SHong Zhang 
268916b64355SHong Zhang     if (submatj->rbuf1) {
269016b64355SHong Zhang       ierr = PetscFree(submatj->rbuf1[0]);CHKERRQ(ierr);
269116b64355SHong Zhang       ierr = PetscFree(submatj->rbuf1);CHKERRQ(ierr);
269216b64355SHong Zhang     }
269316b64355SHong Zhang 
269416b64355SHong Zhang     for (i=0; i<submatj->nrqs; ++i) {
269516b64355SHong Zhang       ierr = PetscFree(submatj->rbuf3[i]);CHKERRQ(ierr);
269616b64355SHong Zhang     }
269716b64355SHong Zhang     ierr = PetscFree3(submatj->req_source2,submatj->rbuf2,submatj->rbuf3);CHKERRQ(ierr);
269816b64355SHong Zhang     ierr = PetscFree(submatj->pa);CHKERRQ(ierr);
269916b64355SHong Zhang   }
270016b64355SHong Zhang 
270116b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
270216b64355SHong Zhang   ierr = PetscTableDestroy((PetscTable*)&submatj->rmap);CHKERRQ(ierr);
270316b64355SHong Zhang   if (submatj->cmap_loc) {ierr = PetscFree(submatj->cmap_loc);CHKERRQ(ierr);}
270416b64355SHong Zhang   ierr = PetscFree(submatj->rmap_loc);CHKERRQ(ierr);
270516b64355SHong Zhang #else
270616b64355SHong Zhang   ierr = PetscFree(submatj->rmap);CHKERRQ(ierr);
270716b64355SHong Zhang #endif
270816b64355SHong Zhang 
270916b64355SHong Zhang   if (!submatj->allcolumns) {
271016b64355SHong Zhang #if defined(PETSC_USE_CTABLE)
271116b64355SHong Zhang     ierr = PetscTableDestroy((PetscTable*)&submatj->cmap);CHKERRQ(ierr);
271216b64355SHong Zhang #else
271316b64355SHong Zhang     ierr = PetscFree(submatj->cmap);CHKERRQ(ierr);
271416b64355SHong Zhang #endif
271516b64355SHong Zhang   }
271616b64355SHong Zhang   ierr = PetscFree(submatj->row2proc);CHKERRQ(ierr);
271716b64355SHong Zhang 
271816b64355SHong Zhang   ierr = PetscFree(submatj);CHKERRQ(ierr);
271916b64355SHong Zhang   PetscFunctionReturn(0);
272016b64355SHong Zhang }
272116b64355SHong Zhang 
27220fb991dcSHong Zhang PetscErrorCode MatDestroySubMatrix_SeqAIJ(Mat C)
272316b64355SHong Zhang {
272416b64355SHong Zhang   PetscErrorCode ierr;
272516b64355SHong Zhang   Mat_SeqAIJ     *c = (Mat_SeqAIJ*)C->data;
27265c39f6d9SHong Zhang   Mat_SubSppt    *submatj = c->submatis1;
272716b64355SHong Zhang 
272816b64355SHong Zhang   PetscFunctionBegin;
272934136279SStefano Zampini   ierr = (*submatj->destroy)(C);CHKERRQ(ierr);
2730f68bb481SHong Zhang   ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr);
273116b64355SHong Zhang   PetscFunctionReturn(0);
273216b64355SHong Zhang }
273316b64355SHong Zhang 
27342d033e1fSHong Zhang PetscErrorCode MatDestroySubMatrices_SeqAIJ(PetscInt n,Mat *mat[])
27352d033e1fSHong Zhang {
27362d033e1fSHong Zhang   PetscErrorCode ierr;
27372d033e1fSHong Zhang   PetscInt       i;
27380fb991dcSHong Zhang   Mat            C;
27390fb991dcSHong Zhang   Mat_SeqAIJ     *c;
27400fb991dcSHong Zhang   Mat_SubSppt    *submatj;
27412d033e1fSHong Zhang 
27422d033e1fSHong Zhang   PetscFunctionBegin;
27432d033e1fSHong Zhang   for (i=0; i<n; i++) {
27440fb991dcSHong Zhang     C       = (*mat)[i];
27450fb991dcSHong Zhang     c       = (Mat_SeqAIJ*)C->data;
27460fb991dcSHong Zhang     submatj = c->submatis1;
27472d033e1fSHong Zhang     if (submatj) {
2748682e4c99SStefano Zampini       if (--((PetscObject)C)->refct <= 0) {
274934136279SStefano Zampini         ierr = (*submatj->destroy)(C);CHKERRQ(ierr);
2750f68bb481SHong Zhang         ierr = MatDestroySubMatrix_Private(submatj);CHKERRQ(ierr);
275134136279SStefano Zampini         ierr = PetscFree(C->defaultvectype);CHKERRQ(ierr);
27522d033e1fSHong Zhang         ierr = PetscLayoutDestroy(&C->rmap);CHKERRQ(ierr);
27532d033e1fSHong Zhang         ierr = PetscLayoutDestroy(&C->cmap);CHKERRQ(ierr);
27542d033e1fSHong Zhang         ierr = PetscHeaderDestroy(&C);CHKERRQ(ierr);
2755682e4c99SStefano Zampini       }
27562d033e1fSHong Zhang     } else {
27572d033e1fSHong Zhang       ierr = MatDestroy(&C);CHKERRQ(ierr);
27582d033e1fSHong Zhang     }
27592d033e1fSHong Zhang   }
276086e85357SHong Zhang 
276163a75b2aSHong Zhang   /* Destroy Dummy submatrices created for reuse */
276263a75b2aSHong Zhang   ierr = MatDestroySubMatrices_Dummy(n,mat);CHKERRQ(ierr);
276363a75b2aSHong Zhang 
27642d033e1fSHong Zhang   ierr = PetscFree(*mat);CHKERRQ(ierr);
27652d033e1fSHong Zhang   PetscFunctionReturn(0);
27662d033e1fSHong Zhang }
27672d033e1fSHong Zhang 
27687dae84e0SHong Zhang PetscErrorCode MatCreateSubMatrices_SeqAIJ(Mat A,PetscInt n,const IS irow[],const IS icol[],MatReuse scall,Mat *B[])
2769cddf8d76SBarry Smith {
2770dfbe8321SBarry Smith   PetscErrorCode ierr;
277197f1f81fSBarry Smith   PetscInt       i;
2772cddf8d76SBarry Smith 
27733a40ed3dSBarry Smith   PetscFunctionBegin;
2774cddf8d76SBarry Smith   if (scall == MAT_INITIAL_MATRIX) {
2775df750dc8SHong Zhang     ierr = PetscCalloc1(n+1,B);CHKERRQ(ierr);
2776cddf8d76SBarry Smith   }
2777cddf8d76SBarry Smith 
2778cddf8d76SBarry Smith   for (i=0; i<n; i++) {
27797dae84e0SHong Zhang     ierr = MatCreateSubMatrix_SeqAIJ(A,irow[i],icol[i],PETSC_DECIDE,scall,&(*B)[i]);CHKERRQ(ierr);
2780cddf8d76SBarry Smith   }
27813a40ed3dSBarry Smith   PetscFunctionReturn(0);
2782cddf8d76SBarry Smith }
2783cddf8d76SBarry Smith 
278497f1f81fSBarry Smith PetscErrorCode MatIncreaseOverlap_SeqAIJ(Mat A,PetscInt is_max,IS is[],PetscInt ov)
27854dcbc457SBarry Smith {
2786e4d965acSSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
27876849ba73SBarry Smith   PetscErrorCode ierr;
27885d0c19d7SBarry Smith   PetscInt       row,i,j,k,l,m,n,*nidx,isz,val;
27895d0c19d7SBarry Smith   const PetscInt *idx;
279097f1f81fSBarry Smith   PetscInt       start,end,*ai,*aj;
2791f1af5d2fSBarry Smith   PetscBT        table;
2792bbd702dbSSatish Balay 
27933a40ed3dSBarry Smith   PetscFunctionBegin;
2794d0f46423SBarry Smith   m  = A->rmap->n;
2795e4d965acSSatish Balay   ai = a->i;
2796bfeeae90SHong Zhang   aj = a->j;
27978a047759SSatish Balay 
2798e32f2f54SBarry Smith   if (ov < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"illegal negative overlap value used");
279906763907SSatish Balay 
2800854ce69bSBarry Smith   ierr = PetscMalloc1(m+1,&nidx);CHKERRQ(ierr);
280153b8de81SBarry Smith   ierr = PetscBTCreate(m,&table);CHKERRQ(ierr);
280206763907SSatish Balay 
2803e4d965acSSatish Balay   for (i=0; i<is_max; i++) {
2804b97fc60eSLois Curfman McInnes     /* Initialize the two local arrays */
2805e4d965acSSatish Balay     isz  = 0;
28066831982aSBarry Smith     ierr = PetscBTMemzero(m,table);CHKERRQ(ierr);
2807e4d965acSSatish Balay 
2808e4d965acSSatish Balay     /* Extract the indices, assume there can be duplicate entries */
28094dcbc457SBarry Smith     ierr = ISGetIndices(is[i],&idx);CHKERRQ(ierr);
2810b9b97703SBarry Smith     ierr = ISGetLocalSize(is[i],&n);CHKERRQ(ierr);
2811e4d965acSSatish Balay 
2812dd097bc3SLois Curfman McInnes     /* Enter these into the temp arrays. I.e., mark table[row], enter row into new index */
2813e4d965acSSatish Balay     for (j=0; j<n; ++j) {
28142205254eSKarl Rupp       if (!PetscBTLookupSet(table,idx[j])) nidx[isz++] = idx[j];
28154dcbc457SBarry Smith     }
281606763907SSatish Balay     ierr = ISRestoreIndices(is[i],&idx);CHKERRQ(ierr);
28176bf464f9SBarry Smith     ierr = ISDestroy(&is[i]);CHKERRQ(ierr);
2818e4d965acSSatish Balay 
281904a348a9SBarry Smith     k = 0;
282004a348a9SBarry Smith     for (j=0; j<ov; j++) { /* for each overlap */
282104a348a9SBarry Smith       n = isz;
282206763907SSatish Balay       for (; k<n; k++) { /* do only those rows in nidx[k], which are not done yet */
2823e4d965acSSatish Balay         row   = nidx[k];
2824e4d965acSSatish Balay         start = ai[row];
2825e4d965acSSatish Balay         end   = ai[row+1];
282604a348a9SBarry Smith         for (l = start; l<end; l++) {
2827efb16452SHong Zhang           val = aj[l];
28282205254eSKarl Rupp           if (!PetscBTLookupSet(table,val)) nidx[isz++] = val;
2829e4d965acSSatish Balay         }
2830e4d965acSSatish Balay       }
2831e4d965acSSatish Balay     }
283270b3c8c7SBarry Smith     ierr = ISCreateGeneral(PETSC_COMM_SELF,isz,nidx,PETSC_COPY_VALUES,(is+i));CHKERRQ(ierr);
2833e4d965acSSatish Balay   }
283494bacf5dSBarry Smith   ierr = PetscBTDestroy(&table);CHKERRQ(ierr);
2835606d414cSSatish Balay   ierr = PetscFree(nidx);CHKERRQ(ierr);
28363a40ed3dSBarry Smith   PetscFunctionReturn(0);
28374dcbc457SBarry Smith }
283817ab2063SBarry Smith 
28390513a670SBarry Smith /* -------------------------------------------------------------- */
2840dfbe8321SBarry Smith PetscErrorCode MatPermute_SeqAIJ(Mat A,IS rowp,IS colp,Mat *B)
28410513a670SBarry Smith {
28420513a670SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
28436849ba73SBarry Smith   PetscErrorCode ierr;
28443b98c0a2SBarry Smith   PetscInt       i,nz = 0,m = A->rmap->n,n = A->cmap->n;
28455d0c19d7SBarry Smith   const PetscInt *row,*col;
28465d0c19d7SBarry Smith   PetscInt       *cnew,j,*lens;
284756cd22aeSBarry Smith   IS             icolp,irowp;
28480298fd71SBarry Smith   PetscInt       *cwork = NULL;
28490298fd71SBarry Smith   PetscScalar    *vwork = NULL;
28500513a670SBarry Smith 
28513a40ed3dSBarry Smith   PetscFunctionBegin;
28524c49b128SBarry Smith   ierr = ISInvertPermutation(rowp,PETSC_DECIDE,&irowp);CHKERRQ(ierr);
285356cd22aeSBarry Smith   ierr = ISGetIndices(irowp,&row);CHKERRQ(ierr);
28544c49b128SBarry Smith   ierr = ISInvertPermutation(colp,PETSC_DECIDE,&icolp);CHKERRQ(ierr);
285556cd22aeSBarry Smith   ierr = ISGetIndices(icolp,&col);CHKERRQ(ierr);
28560513a670SBarry Smith 
28570513a670SBarry Smith   /* determine lengths of permuted rows */
2858854ce69bSBarry Smith   ierr = PetscMalloc1(m+1,&lens);CHKERRQ(ierr);
28592205254eSKarl Rupp   for (i=0; i<m; i++) lens[row[i]] = a->i[i+1] - a->i[i];
2860ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr);
2861f69a0ea3SMatthew Knepley   ierr = MatSetSizes(*B,m,n,m,n);CHKERRQ(ierr);
286233d57670SJed Brown   ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr);
28637adad957SLisandro Dalcin   ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr);
2864ab93d7beSBarry Smith   ierr = MatSeqAIJSetPreallocation_SeqAIJ(*B,0,lens);CHKERRQ(ierr);
2865606d414cSSatish Balay   ierr = PetscFree(lens);CHKERRQ(ierr);
28660513a670SBarry Smith 
2867785e854fSJed Brown   ierr = PetscMalloc1(n,&cnew);CHKERRQ(ierr);
28680513a670SBarry Smith   for (i=0; i<m; i++) {
286932ec9ce4SBarry Smith     ierr = MatGetRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr);
28702205254eSKarl Rupp     for (j=0; j<nz; j++) cnew[j] = col[cwork[j]];
2871cdc0ba36SBarry Smith     ierr = MatSetValues_SeqAIJ(*B,1,&row[i],nz,cnew,vwork,INSERT_VALUES);CHKERRQ(ierr);
287232ec9ce4SBarry Smith     ierr = MatRestoreRow_SeqAIJ(A,i,&nz,&cwork,&vwork);CHKERRQ(ierr);
28730513a670SBarry Smith   }
2874606d414cSSatish Balay   ierr = PetscFree(cnew);CHKERRQ(ierr);
28752205254eSKarl Rupp 
28763c7d62e4SBarry Smith   (*B)->assembled = PETSC_FALSE;
28772205254eSKarl Rupp 
28789fe5e383SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
2879b470e4b4SRichard Tran Mills   ierr = MatBindToCPU(*B,A->boundtocpu);CHKERRQ(ierr);
28809fe5e383SStefano Zampini #endif
28810513a670SBarry Smith   ierr = MatAssemblyBegin(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
28820513a670SBarry Smith   ierr = MatAssemblyEnd(*B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
288356cd22aeSBarry Smith   ierr = ISRestoreIndices(irowp,&row);CHKERRQ(ierr);
288456cd22aeSBarry Smith   ierr = ISRestoreIndices(icolp,&col);CHKERRQ(ierr);
28856bf464f9SBarry Smith   ierr = ISDestroy(&irowp);CHKERRQ(ierr);
28866bf464f9SBarry Smith   ierr = ISDestroy(&icolp);CHKERRQ(ierr);
28876768869dSprj-   if (rowp == colp) {
28886768869dSprj-     if (A->symmetric) {
28896768869dSprj-       ierr = MatSetOption(*B,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
28906768869dSprj-     }
28916768869dSprj-     if (A->hermitian) {
28926768869dSprj-       ierr = MatSetOption(*B,MAT_HERMITIAN,PETSC_TRUE);CHKERRQ(ierr);
28936768869dSprj-     }
28946768869dSprj-   }
28953a40ed3dSBarry Smith   PetscFunctionReturn(0);
28960513a670SBarry Smith }
28970513a670SBarry Smith 
2898dfbe8321SBarry Smith PetscErrorCode MatCopy_SeqAIJ(Mat A,Mat B,MatStructure str)
2899cb5b572fSBarry Smith {
2900dfbe8321SBarry Smith   PetscErrorCode ierr;
2901cb5b572fSBarry Smith 
2902cb5b572fSBarry Smith   PetscFunctionBegin;
290333f4a19fSKris Buschelman   /* If the two matrices have the same copy implementation, use fast copy. */
290433f4a19fSKris Buschelman   if (str == SAME_NONZERO_PATTERN && (A->ops->copy == B->ops->copy)) {
2905be6bf707SBarry Smith     Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data;
2906be6bf707SBarry Smith     Mat_SeqAIJ *b = (Mat_SeqAIJ*)B->data;
2907be6bf707SBarry Smith 
29084d805d7cSStefano Zampini     if (a->i[A->rmap->n] != b->i[B->rmap->n]) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Number of nonzeros in two matrices are different %D != %D",a->i[A->rmap->n],b->i[B->rmap->n]);
2909580bdb30SBarry Smith     ierr = PetscArraycpy(b->a,a->a,a->i[A->rmap->n]);CHKERRQ(ierr);
2910cdc753b6SBarry Smith     ierr = PetscObjectStateIncrease((PetscObject)B);CHKERRQ(ierr);
2911cb5b572fSBarry Smith   } else {
2912cb5b572fSBarry Smith     ierr = MatCopy_Basic(A,B,str);CHKERRQ(ierr);
2913cb5b572fSBarry Smith   }
2914cb5b572fSBarry Smith   PetscFunctionReturn(0);
2915cb5b572fSBarry Smith }
2916cb5b572fSBarry Smith 
29174994cf47SJed Brown PetscErrorCode MatSetUp_SeqAIJ(Mat A)
2918273d9f13SBarry Smith {
2919dfbe8321SBarry Smith   PetscErrorCode ierr;
2920273d9f13SBarry Smith 
2921273d9f13SBarry Smith   PetscFunctionBegin;
2922ab93d7beSBarry Smith   ierr = MatSeqAIJSetPreallocation_SeqAIJ(A,PETSC_DEFAULT,0);CHKERRQ(ierr);
2923273d9f13SBarry Smith   PetscFunctionReturn(0);
2924273d9f13SBarry Smith }
2925273d9f13SBarry Smith 
2926f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJGetArray_SeqAIJ(Mat A,PetscScalar *array[])
29276c0721eeSBarry Smith {
29286c0721eeSBarry Smith   Mat_SeqAIJ *a = (Mat_SeqAIJ*)A->data;
29296e111a19SKarl Rupp 
29306c0721eeSBarry Smith   PetscFunctionBegin;
29316c0721eeSBarry Smith   *array = a->a;
29326c0721eeSBarry Smith   PetscFunctionReturn(0);
29336c0721eeSBarry Smith }
29346c0721eeSBarry Smith 
2935f38c1e66SStefano Zampini PETSC_INTERN PetscErrorCode MatSeqAIJRestoreArray_SeqAIJ(Mat A,PetscScalar *array[])
29366c0721eeSBarry Smith {
29376c0721eeSBarry Smith   PetscFunctionBegin;
2938f38c1e66SStefano Zampini   *array = NULL;
29396c0721eeSBarry Smith   PetscFunctionReturn(0);
29406c0721eeSBarry Smith }
2941273d9f13SBarry Smith 
29428229c054SShri Abhyankar /*
29438229c054SShri Abhyankar    Computes the number of nonzeros per row needed for preallocation when X and Y
29448229c054SShri Abhyankar    have different nonzero structure.
29458229c054SShri Abhyankar */
2946b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqX_private(PetscInt m,const PetscInt *xi,const PetscInt *xj,const PetscInt *yi,const PetscInt *yj,PetscInt *nnz)
2947ec7775f6SShri Abhyankar {
2948b264fe52SHong Zhang   PetscInt       i,j,k,nzx,nzy;
2949ec7775f6SShri Abhyankar 
2950ec7775f6SShri Abhyankar   PetscFunctionBegin;
2951ec7775f6SShri Abhyankar   /* Set the number of nonzeros in the new matrix */
2952ec7775f6SShri Abhyankar   for (i=0; i<m; i++) {
2953b264fe52SHong Zhang     const PetscInt *xjj = xj+xi[i],*yjj = yj+yi[i];
2954b264fe52SHong Zhang     nzx = xi[i+1] - xi[i];
2955b264fe52SHong Zhang     nzy = yi[i+1] - yi[i];
29568af7cee1SJed Brown     nnz[i] = 0;
29578af7cee1SJed Brown     for (j=0,k=0; j<nzx; j++) {                   /* Point in X */
2958b264fe52SHong Zhang       for (; k<nzy && yjj[k]<xjj[j]; k++) nnz[i]++; /* Catch up to X */
2959b264fe52SHong Zhang       if (k<nzy && yjj[k]==xjj[j]) k++;             /* Skip duplicate */
29608af7cee1SJed Brown       nnz[i]++;
29618af7cee1SJed Brown     }
29628af7cee1SJed Brown     for (; k<nzy; k++) nnz[i]++;
2963ec7775f6SShri Abhyankar   }
2964ec7775f6SShri Abhyankar   PetscFunctionReturn(0);
2965ec7775f6SShri Abhyankar }
2966ec7775f6SShri Abhyankar 
2967b264fe52SHong Zhang PetscErrorCode MatAXPYGetPreallocation_SeqAIJ(Mat Y,Mat X,PetscInt *nnz)
2968b264fe52SHong Zhang {
2969b264fe52SHong Zhang   PetscInt       m = Y->rmap->N;
2970b264fe52SHong Zhang   Mat_SeqAIJ     *x = (Mat_SeqAIJ*)X->data;
2971b264fe52SHong Zhang   Mat_SeqAIJ     *y = (Mat_SeqAIJ*)Y->data;
2972b264fe52SHong Zhang   PetscErrorCode ierr;
2973b264fe52SHong Zhang 
2974b264fe52SHong Zhang   PetscFunctionBegin;
2975b264fe52SHong Zhang   /* Set the number of nonzeros in the new matrix */
2976b264fe52SHong Zhang   ierr = MatAXPYGetPreallocation_SeqX_private(m,x->i,x->j,y->i,y->j,nnz);CHKERRQ(ierr);
2977b264fe52SHong Zhang   PetscFunctionReturn(0);
2978b264fe52SHong Zhang }
2979b264fe52SHong Zhang 
2980f4df32b1SMatthew Knepley PetscErrorCode MatAXPY_SeqAIJ(Mat Y,PetscScalar a,Mat X,MatStructure str)
2981ac90fabeSBarry Smith {
2982dfbe8321SBarry Smith   PetscErrorCode ierr;
2983ac90fabeSBarry Smith   Mat_SeqAIJ     *x = (Mat_SeqAIJ*)X->data,*y = (Mat_SeqAIJ*)Y->data;
2984c5df96a5SBarry Smith   PetscBLASInt   one=1,bnz;
2985ac90fabeSBarry Smith 
2986ac90fabeSBarry Smith   PetscFunctionBegin;
2987c5df96a5SBarry Smith   ierr = PetscBLASIntCast(x->nz,&bnz);CHKERRQ(ierr);
2988ac90fabeSBarry Smith   if (str == SAME_NONZERO_PATTERN) {
2989f4df32b1SMatthew Knepley     PetscScalar alpha = a;
29908b83055fSJed Brown     PetscStackCallBLAS("BLASaxpy",BLASaxpy_(&bnz,&alpha,x->a,&one,y->a,&one));
2991acf2f550SJed Brown     ierr = MatSeqAIJInvalidateDiagonal(Y);CHKERRQ(ierr);
2992a3fa217bSJose E. Roman     ierr = PetscObjectStateIncrease((PetscObject)Y);CHKERRQ(ierr);
2993e2cf4d64SStefano Zampini     /* the MatAXPY_Basic* subroutines calls MatAssembly, so the matrix on the GPU
2994e2cf4d64SStefano Zampini        will be updated */
2995e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
2996c70f7ee4SJunchao Zhang     if (Y->offloadmask != PETSC_OFFLOAD_UNALLOCATED) {
2997c70f7ee4SJunchao Zhang       Y->offloadmask = PETSC_OFFLOAD_CPU;
2998e2cf4d64SStefano Zampini     }
2999e2cf4d64SStefano Zampini #endif
3000ab784542SHong Zhang   } else if (str == SUBSET_NONZERO_PATTERN) { /* nonzeros of X is a subset of Y's */
3001ab784542SHong Zhang     ierr = MatAXPY_Basic(Y,a,X,str);CHKERRQ(ierr);
3002ac90fabeSBarry Smith   } else {
30038229c054SShri Abhyankar     Mat      B;
30048229c054SShri Abhyankar     PetscInt *nnz;
3005785e854fSJed Brown     ierr = PetscMalloc1(Y->rmap->N,&nnz);CHKERRQ(ierr);
3006ce94432eSBarry Smith     ierr = MatCreate(PetscObjectComm((PetscObject)Y),&B);CHKERRQ(ierr);
3007bc5a2726SShri Abhyankar     ierr = PetscObjectSetName((PetscObject)B,((PetscObject)Y)->name);CHKERRQ(ierr);
30084aa94f47SShri Abhyankar     ierr = MatSetSizes(B,Y->rmap->n,Y->cmap->n,Y->rmap->N,Y->cmap->N);CHKERRQ(ierr);
300933d57670SJed Brown     ierr = MatSetBlockSizesFromMats(B,Y,Y);CHKERRQ(ierr);
3010176df525SBarry Smith     ierr = MatSetType(B,(MatType) ((PetscObject)Y)->type_name);CHKERRQ(ierr);
30118229c054SShri Abhyankar     ierr = MatAXPYGetPreallocation_SeqAIJ(Y,X,nnz);CHKERRQ(ierr);
3012ecd8bba6SJed Brown     ierr = MatSeqAIJSetPreallocation(B,0,nnz);CHKERRQ(ierr);
3013ec7775f6SShri Abhyankar     ierr = MatAXPY_BasicWithPreallocation(B,Y,a,X,str);CHKERRQ(ierr);
301428be2f97SBarry Smith     ierr = MatHeaderReplace(Y,&B);CHKERRQ(ierr);
30158229c054SShri Abhyankar     ierr = PetscFree(nnz);CHKERRQ(ierr);
3016ac90fabeSBarry Smith   }
3017ac90fabeSBarry Smith   PetscFunctionReturn(0);
3018ac90fabeSBarry Smith }
3019ac90fabeSBarry Smith 
30207087cfbeSBarry Smith PetscErrorCode  MatConjugate_SeqAIJ(Mat mat)
3021354c94deSBarry Smith {
3022354c94deSBarry Smith #if defined(PETSC_USE_COMPLEX)
3023354c94deSBarry Smith   Mat_SeqAIJ  *aij = (Mat_SeqAIJ*)mat->data;
3024354c94deSBarry Smith   PetscInt    i,nz;
3025354c94deSBarry Smith   PetscScalar *a;
3026354c94deSBarry Smith 
3027354c94deSBarry Smith   PetscFunctionBegin;
3028354c94deSBarry Smith   nz = aij->nz;
3029354c94deSBarry Smith   a  = aij->a;
30302205254eSKarl Rupp   for (i=0; i<nz; i++) a[i] = PetscConj(a[i]);
3031e2cf4d64SStefano Zampini #if defined(PETSC_HAVE_VIENNACL) || defined(PETSC_HAVE_CUDA)
3032c70f7ee4SJunchao Zhang   if (mat->offloadmask != PETSC_OFFLOAD_UNALLOCATED) mat->offloadmask = PETSC_OFFLOAD_CPU;
3033e2cf4d64SStefano Zampini #endif
3034354c94deSBarry Smith #else
3035354c94deSBarry Smith   PetscFunctionBegin;
3036354c94deSBarry Smith #endif
3037354c94deSBarry Smith   PetscFunctionReturn(0);
3038354c94deSBarry Smith }
3039354c94deSBarry Smith 
3040985db425SBarry Smith PetscErrorCode MatGetRowMaxAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[])
3041e34fafa9SBarry Smith {
3042e34fafa9SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
3043e34fafa9SBarry Smith   PetscErrorCode ierr;
3044d0f46423SBarry Smith   PetscInt       i,j,m = A->rmap->n,*ai,*aj,ncols,n;
3045e34fafa9SBarry Smith   PetscReal      atmp;
3046985db425SBarry Smith   PetscScalar    *x;
3047e34fafa9SBarry Smith   MatScalar      *aa;
3048e34fafa9SBarry Smith 
3049e34fafa9SBarry Smith   PetscFunctionBegin;
3050e32f2f54SBarry Smith   if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix");
3051e34fafa9SBarry Smith   aa = a->a;
3052e34fafa9SBarry Smith   ai = a->i;
3053e34fafa9SBarry Smith   aj = a->j;
3054e34fafa9SBarry Smith 
3055985db425SBarry Smith   ierr = VecSet(v,0.0);CHKERRQ(ierr);
3056e34fafa9SBarry Smith   ierr = VecGetArray(v,&x);CHKERRQ(ierr);
3057e34fafa9SBarry Smith   ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr);
3058e32f2f54SBarry Smith   if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector");
3059e34fafa9SBarry Smith   for (i=0; i<m; i++) {
3060e34fafa9SBarry Smith     ncols = ai[1] - ai[0]; ai++;
30619189402eSHong Zhang     x[i]  = 0.0;
3062e34fafa9SBarry Smith     for (j=0; j<ncols; j++) {
3063985db425SBarry Smith       atmp = PetscAbsScalar(*aa);
3064985db425SBarry Smith       if (PetscAbsScalar(x[i]) < atmp) {x[i] = atmp; if (idx) idx[i] = *aj;}
3065985db425SBarry Smith       aa++; aj++;
3066985db425SBarry Smith     }
3067985db425SBarry Smith   }
3068985db425SBarry Smith   ierr = VecRestoreArray(v,&x);CHKERRQ(ierr);
3069985db425SBarry Smith   PetscFunctionReturn(0);
3070985db425SBarry Smith }
3071985db425SBarry Smith 
3072985db425SBarry Smith PetscErrorCode MatGetRowMax_SeqAIJ(Mat A,Vec v,PetscInt idx[])
3073985db425SBarry Smith {
3074985db425SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
3075985db425SBarry Smith   PetscErrorCode ierr;
3076d0f46423SBarry Smith   PetscInt       i,j,m = A->rmap->n,*ai,*aj,ncols,n;
3077985db425SBarry Smith   PetscScalar    *x;
3078985db425SBarry Smith   MatScalar      *aa;
3079985db425SBarry Smith 
3080985db425SBarry Smith   PetscFunctionBegin;
3081e32f2f54SBarry Smith   if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix");
3082985db425SBarry Smith   aa = a->a;
3083985db425SBarry Smith   ai = a->i;
3084985db425SBarry Smith   aj = a->j;
3085985db425SBarry Smith 
3086985db425SBarry Smith   ierr = VecSet(v,0.0);CHKERRQ(ierr);
3087985db425SBarry Smith   ierr = VecGetArray(v,&x);CHKERRQ(ierr);
3088985db425SBarry Smith   ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr);
3089e32f2f54SBarry Smith   if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector");
3090985db425SBarry Smith   for (i=0; i<m; i++) {
3091985db425SBarry Smith     ncols = ai[1] - ai[0]; ai++;
3092d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
3093985db425SBarry Smith       x[i] = *aa; if (idx) idx[i] = 0;
3094985db425SBarry Smith     } else {  /* row is sparse so already KNOW maximum is 0.0 or higher */
3095985db425SBarry Smith       x[i] = 0.0;
3096985db425SBarry Smith       if (idx) {
3097985db425SBarry Smith         idx[i] = 0; /* in case ncols is zero */
3098985db425SBarry Smith         for (j=0;j<ncols;j++) { /* find first implicit 0.0 in the row */
3099985db425SBarry Smith           if (aj[j] > j) {
3100985db425SBarry Smith             idx[i] = j;
3101985db425SBarry Smith             break;
3102985db425SBarry Smith           }
3103985db425SBarry Smith         }
3104985db425SBarry Smith       }
3105985db425SBarry Smith     }
3106985db425SBarry Smith     for (j=0; j<ncols; j++) {
3107985db425SBarry Smith       if (PetscRealPart(x[i]) < PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;}
3108985db425SBarry Smith       aa++; aj++;
3109985db425SBarry Smith     }
3110985db425SBarry Smith   }
3111985db425SBarry Smith   ierr = VecRestoreArray(v,&x);CHKERRQ(ierr);
3112985db425SBarry Smith   PetscFunctionReturn(0);
3113985db425SBarry Smith }
3114985db425SBarry Smith 
3115c87e5d42SMatthew Knepley PetscErrorCode MatGetRowMinAbs_SeqAIJ(Mat A,Vec v,PetscInt idx[])
3116c87e5d42SMatthew Knepley {
3117c87e5d42SMatthew Knepley   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
3118c87e5d42SMatthew Knepley   PetscErrorCode ierr;
3119c87e5d42SMatthew Knepley   PetscInt       i,j,m = A->rmap->n,*ai,*aj,ncols,n;
3120c87e5d42SMatthew Knepley   PetscReal      atmp;
3121c87e5d42SMatthew Knepley   PetscScalar    *x;
3122c87e5d42SMatthew Knepley   MatScalar      *aa;
3123c87e5d42SMatthew Knepley 
3124c87e5d42SMatthew Knepley   PetscFunctionBegin;
3125e32f2f54SBarry Smith   if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix");
3126c87e5d42SMatthew Knepley   aa = a->a;
3127c87e5d42SMatthew Knepley   ai = a->i;
3128c87e5d42SMatthew Knepley   aj = a->j;
3129c87e5d42SMatthew Knepley 
3130c87e5d42SMatthew Knepley   ierr = VecSet(v,0.0);CHKERRQ(ierr);
3131c87e5d42SMatthew Knepley   ierr = VecGetArray(v,&x);CHKERRQ(ierr);
3132c87e5d42SMatthew Knepley   ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr);
313360e0710aSBarry Smith   if (n != A->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector, %D vs. %D rows", A->rmap->n, n);
3134c87e5d42SMatthew Knepley   for (i=0; i<m; i++) {
3135c87e5d42SMatthew Knepley     ncols = ai[1] - ai[0]; ai++;
3136289a08f5SMatthew Knepley     if (ncols) {
3137289a08f5SMatthew Knepley       /* Get first nonzero */
3138289a08f5SMatthew Knepley       for (j = 0; j < ncols; j++) {
3139289a08f5SMatthew Knepley         atmp = PetscAbsScalar(aa[j]);
31402205254eSKarl Rupp         if (atmp > 1.0e-12) {
31412205254eSKarl Rupp           x[i] = atmp;
31422205254eSKarl Rupp           if (idx) idx[i] = aj[j];
31432205254eSKarl Rupp           break;
31442205254eSKarl Rupp         }
3145289a08f5SMatthew Knepley       }
314612431cb0SMatthew G Knepley       if (j == ncols) {x[i] = PetscAbsScalar(*aa); if (idx) idx[i] = *aj;}
3147289a08f5SMatthew Knepley     } else {
3148289a08f5SMatthew Knepley       x[i] = 0.0; if (idx) idx[i] = 0;
3149289a08f5SMatthew Knepley     }
3150c87e5d42SMatthew Knepley     for (j = 0; j < ncols; j++) {
3151c87e5d42SMatthew Knepley       atmp = PetscAbsScalar(*aa);
3152289a08f5SMatthew Knepley       if (atmp > 1.0e-12 && PetscAbsScalar(x[i]) > atmp) {x[i] = atmp; if (idx) idx[i] = *aj;}
3153c87e5d42SMatthew Knepley       aa++; aj++;
3154c87e5d42SMatthew Knepley     }
3155c87e5d42SMatthew Knepley   }
3156c87e5d42SMatthew Knepley   ierr = VecRestoreArray(v,&x);CHKERRQ(ierr);
3157c87e5d42SMatthew Knepley   PetscFunctionReturn(0);
3158c87e5d42SMatthew Knepley }
3159c87e5d42SMatthew Knepley 
3160985db425SBarry Smith PetscErrorCode MatGetRowMin_SeqAIJ(Mat A,Vec v,PetscInt idx[])
3161985db425SBarry Smith {
3162985db425SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ*)A->data;
3163985db425SBarry Smith   PetscErrorCode  ierr;
3164d9ca1df4SBarry Smith   PetscInt        i,j,m = A->rmap->n,ncols,n;
3165d9ca1df4SBarry Smith   const PetscInt  *ai,*aj;
3166985db425SBarry Smith   PetscScalar     *x;
3167d9ca1df4SBarry Smith   const MatScalar *aa;
3168985db425SBarry Smith 
3169985db425SBarry Smith   PetscFunctionBegin;
3170e32f2f54SBarry Smith   if (A->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix");
3171985db425SBarry Smith   aa = a->a;
3172985db425SBarry Smith   ai = a->i;
3173985db425SBarry Smith   aj = a->j;
3174985db425SBarry Smith 
3175985db425SBarry Smith   ierr = VecSet(v,0.0);CHKERRQ(ierr);
3176985db425SBarry Smith   ierr = VecGetArray(v,&x);CHKERRQ(ierr);
3177985db425SBarry Smith   ierr = VecGetLocalSize(v,&n);CHKERRQ(ierr);
3178e32f2f54SBarry Smith   if (n != A->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Nonconforming matrix and vector");
3179985db425SBarry Smith   for (i=0; i<m; i++) {
3180985db425SBarry Smith     ncols = ai[1] - ai[0]; ai++;
3181d0f46423SBarry Smith     if (ncols == A->cmap->n) { /* row is dense */
3182985db425SBarry Smith       x[i] = *aa; if (idx) idx[i] = 0;
3183985db425SBarry Smith     } else {  /* row is sparse so already KNOW minimum is 0.0 or lower */
3184985db425SBarry Smith       x[i] = 0.0;
3185985db425SBarry Smith       if (idx) {   /* find first implicit 0.0 in the row */
3186985db425SBarry Smith         idx[i] = 0; /* in case ncols is zero */
3187985db425SBarry Smith         for (j=0; j<ncols; j++) {
3188985db425SBarry Smith           if (aj[j] > j) {
3189985db425SBarry Smith             idx[i] = j;
3190985db425SBarry Smith             break;
3191985db425SBarry Smith           }
3192985db425SBarry Smith         }
3193985db425SBarry Smith       }
3194985db425SBarry Smith     }
3195985db425SBarry Smith     for (j=0; j<ncols; j++) {
3196985db425SBarry Smith       if (PetscRealPart(x[i]) > PetscRealPart(*aa)) {x[i] = *aa; if (idx) idx[i] = *aj;}
3197985db425SBarry Smith       aa++; aj++;
3198e34fafa9SBarry Smith     }
3199e34fafa9SBarry Smith   }
3200e34fafa9SBarry Smith   ierr = VecRestoreArray(v,&x);CHKERRQ(ierr);
3201e34fafa9SBarry Smith   PetscFunctionReturn(0);
3202e34fafa9SBarry Smith }
3203bbead8a2SBarry Smith 
3204713ccfa9SJed Brown PetscErrorCode MatInvertBlockDiagonal_SeqAIJ(Mat A,const PetscScalar **values)
3205bbead8a2SBarry Smith {
3206bbead8a2SBarry Smith   Mat_SeqAIJ      *a = (Mat_SeqAIJ*) A->data;
3207bbead8a2SBarry Smith   PetscErrorCode  ierr;
320833d57670SJed Brown   PetscInt        i,bs = PetscAbs(A->rmap->bs),mbs = A->rmap->n/bs,ipvt[5],bs2 = bs*bs,*v_pivots,ij[7],*IJ,j;
3209bbead8a2SBarry Smith   MatScalar       *diag,work[25],*v_work;
32100da83c2eSBarry Smith   const PetscReal shift = 0.0;
32111a9391e3SHong Zhang   PetscBool       allowzeropivot,zeropivotdetected=PETSC_FALSE;
3212bbead8a2SBarry Smith 
3213bbead8a2SBarry Smith   PetscFunctionBegin;
3214a455e926SHong Zhang   allowzeropivot = PetscNot(A->erroriffailure);
32154a0d0026SBarry Smith   if (a->ibdiagvalid) {
32164a0d0026SBarry Smith     if (values) *values = a->ibdiag;
32174a0d0026SBarry Smith     PetscFunctionReturn(0);
32184a0d0026SBarry Smith   }
3219bbead8a2SBarry Smith   ierr = MatMarkDiagonal_SeqAIJ(A);CHKERRQ(ierr);
3220bbead8a2SBarry Smith   if (!a->ibdiag) {
3221785e854fSJed Brown     ierr = PetscMalloc1(bs2*mbs,&a->ibdiag);CHKERRQ(ierr);
32223bb1ff40SBarry Smith     ierr = PetscLogObjectMemory((PetscObject)A,bs2*mbs*sizeof(PetscScalar));CHKERRQ(ierr);
3223bbead8a2SBarry Smith   }
3224bbead8a2SBarry Smith   diag = a->ibdiag;
3225bbead8a2SBarry Smith   if (values) *values = a->ibdiag;
3226bbead8a2SBarry Smith   /* factor and invert each block */
3227bbead8a2SBarry Smith   switch (bs) {
3228bbead8a2SBarry Smith   case 1:
3229bbead8a2SBarry Smith     for (i=0; i<mbs; i++) {
3230bbead8a2SBarry Smith       ierr = MatGetValues(A,1,&i,1,&i,diag+i);CHKERRQ(ierr);
3231ec1892c8SHong Zhang       if (PetscAbsScalar(diag[i] + shift) < PETSC_MACHINE_EPSILON) {
3232ec1892c8SHong Zhang         if (allowzeropivot) {
32337b6c816cSBarry Smith           A->factorerrortype             = MAT_FACTOR_NUMERIC_ZEROPIVOT;
32347b6c816cSBarry Smith           A->factorerror_zeropivot_value = PetscAbsScalar(diag[i]);
32357b6c816cSBarry Smith           A->factorerror_zeropivot_row   = i;
32367b6c816cSBarry Smith           ierr = PetscInfo3(A,"Zero pivot, row %D pivot %g tolerance %g\n",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON);CHKERRQ(ierr);
32377b6c816cSBarry Smith         } else SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_MAT_LU_ZRPVT,"Zero pivot, row %D pivot %g tolerance %g",i,(double)PetscAbsScalar(diag[i]),(double)PETSC_MACHINE_EPSILON);
3238ec1892c8SHong Zhang       }
3239bbead8a2SBarry Smith       diag[i] = (PetscScalar)1.0 / (diag[i] + shift);
3240bbead8a2SBarry Smith     }
3241bbead8a2SBarry Smith     break;
3242bbead8a2SBarry Smith   case 2:
3243bbead8a2SBarry Smith     for (i=0; i<mbs; i++) {
3244bbead8a2SBarry Smith       ij[0] = 2*i; ij[1] = 2*i + 1;
3245bbead8a2SBarry Smith       ierr  = MatGetValues(A,2,ij,2,ij,diag);CHKERRQ(ierr);
3246a455e926SHong Zhang       ierr  = PetscKernel_A_gets_inverse_A_2(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
32477b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
324896b95a6bSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_2(diag);CHKERRQ(ierr);
3249bbead8a2SBarry Smith       diag += 4;
3250bbead8a2SBarry Smith     }
3251bbead8a2SBarry Smith     break;
3252bbead8a2SBarry Smith   case 3:
3253bbead8a2SBarry Smith     for (i=0; i<mbs; i++) {
3254bbead8a2SBarry Smith       ij[0] = 3*i; ij[1] = 3*i + 1; ij[2] = 3*i + 2;
3255bbead8a2SBarry Smith       ierr  = MatGetValues(A,3,ij,3,ij,diag);CHKERRQ(ierr);
3256a455e926SHong Zhang       ierr  = PetscKernel_A_gets_inverse_A_3(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
32577b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
325896b95a6bSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_3(diag);CHKERRQ(ierr);
3259bbead8a2SBarry Smith       diag += 9;
3260bbead8a2SBarry Smith     }
3261bbead8a2SBarry Smith     break;
3262bbead8a2SBarry Smith   case 4:
3263bbead8a2SBarry Smith     for (i=0; i<mbs; i++) {
3264bbead8a2SBarry Smith       ij[0] = 4*i; ij[1] = 4*i + 1; ij[2] = 4*i + 2; ij[3] = 4*i + 3;
3265bbead8a2SBarry Smith       ierr  = MatGetValues(A,4,ij,4,ij,diag);CHKERRQ(ierr);
3266a455e926SHong Zhang       ierr  = PetscKernel_A_gets_inverse_A_4(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
32677b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
326896b95a6bSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_4(diag);CHKERRQ(ierr);
3269bbead8a2SBarry Smith       diag += 16;
3270bbead8a2SBarry Smith     }
3271bbead8a2SBarry Smith     break;
3272bbead8a2SBarry Smith   case 5:
3273bbead8a2SBarry Smith     for (i=0; i<mbs; i++) {
3274bbead8a2SBarry Smith       ij[0] = 5*i; ij[1] = 5*i + 1; ij[2] = 5*i + 2; ij[3] = 5*i + 3; ij[4] = 5*i + 4;
3275bbead8a2SBarry Smith       ierr  = MatGetValues(A,5,ij,5,ij,diag);CHKERRQ(ierr);
3276a455e926SHong Zhang       ierr  = PetscKernel_A_gets_inverse_A_5(diag,ipvt,work,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
32777b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
327896b95a6bSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_5(diag);CHKERRQ(ierr);
3279bbead8a2SBarry Smith       diag += 25;
3280bbead8a2SBarry Smith     }
3281bbead8a2SBarry Smith     break;
3282bbead8a2SBarry Smith   case 6:
3283bbead8a2SBarry Smith     for (i=0; i<mbs; i++) {
3284bbead8a2SBarry Smith       ij[0] = 6*i; ij[1] = 6*i + 1; ij[2] = 6*i + 2; ij[3] = 6*i + 3; ij[4] = 6*i + 4; ij[5] = 6*i + 5;
3285bbead8a2SBarry Smith       ierr  = MatGetValues(A,6,ij,6,ij,diag);CHKERRQ(ierr);
3286a455e926SHong Zhang       ierr  = PetscKernel_A_gets_inverse_A_6(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
32877b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
328896b95a6bSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_6(diag);CHKERRQ(ierr);
3289bbead8a2SBarry Smith       diag += 36;
3290bbead8a2SBarry Smith     }
3291bbead8a2SBarry Smith     break;
3292bbead8a2SBarry Smith   case 7:
3293bbead8a2SBarry Smith     for (i=0; i<mbs; i++) {
3294bbead8a2SBarry Smith       ij[0] = 7*i; ij[1] = 7*i + 1; ij[2] = 7*i + 2; ij[3] = 7*i + 3; ij[4] = 7*i + 4; ij[5] = 7*i + 5; ij[5] = 7*i + 6;
3295bbead8a2SBarry Smith       ierr  = MatGetValues(A,7,ij,7,ij,diag);CHKERRQ(ierr);
3296a455e926SHong Zhang       ierr  = PetscKernel_A_gets_inverse_A_7(diag,shift,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
32977b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
329896b95a6bSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_7(diag);CHKERRQ(ierr);
3299bbead8a2SBarry Smith       diag += 49;
3300bbead8a2SBarry Smith     }
3301bbead8a2SBarry Smith     break;
3302bbead8a2SBarry Smith   default:
3303dcca6d9dSJed Brown     ierr = PetscMalloc3(bs,&v_work,bs,&v_pivots,bs,&IJ);CHKERRQ(ierr);
3304bbead8a2SBarry Smith     for (i=0; i<mbs; i++) {
3305bbead8a2SBarry Smith       for (j=0; j<bs; j++) {
3306bbead8a2SBarry Smith         IJ[j] = bs*i + j;
3307bbead8a2SBarry Smith       }
3308bbead8a2SBarry Smith       ierr  = MatGetValues(A,bs,IJ,bs,IJ,diag);CHKERRQ(ierr);
33095f8bbccaSHong Zhang       ierr  = PetscKernel_A_gets_inverse_A(bs,diag,v_pivots,v_work,allowzeropivot,&zeropivotdetected);CHKERRQ(ierr);
33107b6c816cSBarry Smith       if (zeropivotdetected) A->factorerrortype = MAT_FACTOR_NUMERIC_ZEROPIVOT;
331196b95a6bSBarry Smith       ierr  = PetscKernel_A_gets_transpose_A_N(diag,bs);CHKERRQ(ierr);
3312bbead8a2SBarry Smith       diag += bs2;
3313bbead8a2SBarry Smith     }
3314bbead8a2SBarry Smith     ierr = PetscFree3(v_work,v_pivots,IJ);CHKERRQ(ierr);
3315bbead8a2SBarry Smith   }
3316bbead8a2SBarry Smith   a->ibdiagvalid = PETSC_TRUE;
3317bbead8a2SBarry Smith   PetscFunctionReturn(0);
3318bbead8a2SBarry Smith }
3319bbead8a2SBarry Smith 
332073a71a0fSBarry Smith static PetscErrorCode  MatSetRandom_SeqAIJ(Mat x,PetscRandom rctx)
332173a71a0fSBarry Smith {
332273a71a0fSBarry Smith   PetscErrorCode ierr;
332373a71a0fSBarry Smith   Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)x->data;
332473a71a0fSBarry Smith   PetscScalar    a;
332573a71a0fSBarry Smith   PetscInt       m,n,i,j,col;
332673a71a0fSBarry Smith 
332773a71a0fSBarry Smith   PetscFunctionBegin;
332873a71a0fSBarry Smith   if (!x->assembled) {
332973a71a0fSBarry Smith     ierr = MatGetSize(x,&m,&n);CHKERRQ(ierr);
333073a71a0fSBarry Smith     for (i=0; i<m; i++) {
333173a71a0fSBarry Smith       for (j=0; j<aij->imax[i]; j++) {
333273a71a0fSBarry Smith         ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr);
333373a71a0fSBarry Smith         col  = (PetscInt)(n*PetscRealPart(a));
333473a71a0fSBarry Smith         ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr);
333573a71a0fSBarry Smith       }
333673a71a0fSBarry Smith     }
3337e2ce353bSJunchao Zhang   } else {
3338e2ce353bSJunchao Zhang     for (i=0; i<aij->nz; i++) {ierr = PetscRandomGetValue(rctx,aij->a+i);CHKERRQ(ierr);}
3339e2ce353bSJunchao Zhang   }
334073a71a0fSBarry Smith   ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
334173a71a0fSBarry Smith   ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
334273a71a0fSBarry Smith   PetscFunctionReturn(0);
334373a71a0fSBarry Smith }
334473a71a0fSBarry Smith 
3345679944adSJunchao Zhang /* Like MatSetRandom_SeqAIJ, but do not set values on columns in range of [low, high) */
3346679944adSJunchao Zhang PetscErrorCode  MatSetRandomSkipColumnRange_SeqAIJ_Private(Mat x,PetscInt low,PetscInt high,PetscRandom rctx)
3347679944adSJunchao Zhang {
3348679944adSJunchao Zhang   PetscErrorCode ierr;
3349679944adSJunchao Zhang   Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)x->data;
3350679944adSJunchao Zhang   PetscScalar    a;
3351679944adSJunchao Zhang   PetscInt       m,n,i,j,col,nskip;
3352679944adSJunchao Zhang 
3353679944adSJunchao Zhang   PetscFunctionBegin;
3354679944adSJunchao Zhang   nskip = high - low;
3355679944adSJunchao Zhang   ierr  = MatGetSize(x,&m,&n);CHKERRQ(ierr);
3356679944adSJunchao Zhang   n    -= nskip; /* shrink number of columns where nonzeros can be set */
3357679944adSJunchao Zhang   for (i=0; i<m; i++) {
3358679944adSJunchao Zhang     for (j=0; j<aij->imax[i]; j++) {
3359679944adSJunchao Zhang       ierr = PetscRandomGetValue(rctx,&a);CHKERRQ(ierr);
3360679944adSJunchao Zhang       col  = (PetscInt)(n*PetscRealPart(a));
3361679944adSJunchao Zhang       if (col >= low) col += nskip; /* shift col rightward to skip the hole */
3362679944adSJunchao Zhang       ierr = MatSetValues(x,1,&i,1,&col,&a,ADD_VALUES);CHKERRQ(ierr);
3363679944adSJunchao Zhang     }
3364e2ce353bSJunchao Zhang   }
3365679944adSJunchao Zhang   ierr = MatAssemblyBegin(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3366679944adSJunchao Zhang   ierr = MatAssemblyEnd(x,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3367679944adSJunchao Zhang   PetscFunctionReturn(0);
3368679944adSJunchao Zhang }
3369679944adSJunchao Zhang 
3370679944adSJunchao Zhang 
3371682d7d0cSBarry Smith /* -------------------------------------------------------------------*/
33720a6ffc59SBarry Smith static struct _MatOps MatOps_Values = { MatSetValues_SeqAIJ,
3373cb5b572fSBarry Smith                                         MatGetRow_SeqAIJ,
3374cb5b572fSBarry Smith                                         MatRestoreRow_SeqAIJ,
3375cb5b572fSBarry Smith                                         MatMult_SeqAIJ,
337697304618SKris Buschelman                                 /*  4*/ MatMultAdd_SeqAIJ,
33777c922b88SBarry Smith                                         MatMultTranspose_SeqAIJ,
33787c922b88SBarry Smith                                         MatMultTransposeAdd_SeqAIJ,
3379db4efbfdSBarry Smith                                         0,
3380db4efbfdSBarry Smith                                         0,
3381db4efbfdSBarry Smith                                         0,
3382db4efbfdSBarry Smith                                 /* 10*/ 0,
3383cb5b572fSBarry Smith                                         MatLUFactor_SeqAIJ,
3384cb5b572fSBarry Smith                                         0,
338541f059aeSBarry Smith                                         MatSOR_SeqAIJ,
338691e9d3e2SHong Zhang                                         MatTranspose_SeqAIJ,
338797304618SKris Buschelman                                 /*1 5*/ MatGetInfo_SeqAIJ,
3388cb5b572fSBarry Smith                                         MatEqual_SeqAIJ,
3389cb5b572fSBarry Smith                                         MatGetDiagonal_SeqAIJ,
3390cb5b572fSBarry Smith                                         MatDiagonalScale_SeqAIJ,
3391cb5b572fSBarry Smith                                         MatNorm_SeqAIJ,
339297304618SKris Buschelman                                 /* 20*/ 0,
3393cb5b572fSBarry Smith                                         MatAssemblyEnd_SeqAIJ,
3394cb5b572fSBarry Smith                                         MatSetOption_SeqAIJ,
3395cb5b572fSBarry Smith                                         MatZeroEntries_SeqAIJ,
3396d519adbfSMatthew Knepley                                 /* 24*/ MatZeroRows_SeqAIJ,
3397db4efbfdSBarry Smith                                         0,
3398db4efbfdSBarry Smith                                         0,
3399db4efbfdSBarry Smith                                         0,
3400db4efbfdSBarry Smith                                         0,
34014994cf47SJed Brown                                 /* 29*/ MatSetUp_SeqAIJ,
3402db4efbfdSBarry Smith                                         0,
3403db4efbfdSBarry Smith                                         0,
34048c778c55SBarry Smith                                         0,
34058c778c55SBarry Smith                                         0,
3406d519adbfSMatthew Knepley                                 /* 34*/ MatDuplicate_SeqAIJ,
3407cb5b572fSBarry Smith                                         0,
3408cb5b572fSBarry Smith                                         0,
3409cb5b572fSBarry Smith                                         MatILUFactor_SeqAIJ,
3410cb5b572fSBarry Smith                                         0,
3411d519adbfSMatthew Knepley                                 /* 39*/ MatAXPY_SeqAIJ,
34127dae84e0SHong Zhang                                         MatCreateSubMatrices_SeqAIJ,
3413cb5b572fSBarry Smith                                         MatIncreaseOverlap_SeqAIJ,
3414cb5b572fSBarry Smith                                         MatGetValues_SeqAIJ,
3415cb5b572fSBarry Smith                                         MatCopy_SeqAIJ,
3416d519adbfSMatthew Knepley                                 /* 44*/ MatGetRowMax_SeqAIJ,
3417cb5b572fSBarry Smith                                         MatScale_SeqAIJ,
34187d68702bSBarry Smith                                         MatShift_SeqAIJ,
341979299369SBarry Smith                                         MatDiagonalSet_SeqAIJ,
34206e169961SBarry Smith                                         MatZeroRowsColumns_SeqAIJ,
342173a71a0fSBarry Smith                                 /* 49*/ MatSetRandom_SeqAIJ,
34223b2fbd54SBarry Smith                                         MatGetRowIJ_SeqAIJ,
34233b2fbd54SBarry Smith                                         MatRestoreRowIJ_SeqAIJ,
34243b2fbd54SBarry Smith                                         MatGetColumnIJ_SeqAIJ,
3425a93ec695SBarry Smith                                         MatRestoreColumnIJ_SeqAIJ,
342693dfae19SHong Zhang                                 /* 54*/ MatFDColoringCreate_SeqXAIJ,
3427b9617806SBarry Smith                                         0,
34280513a670SBarry Smith                                         0,
3429cda55fadSBarry Smith                                         MatPermute_SeqAIJ,
3430cda55fadSBarry Smith                                         0,
3431d519adbfSMatthew Knepley                                 /* 59*/ 0,
3432b9b97703SBarry Smith                                         MatDestroy_SeqAIJ,
3433b9b97703SBarry Smith                                         MatView_SeqAIJ,
3434357abbc8SBarry Smith                                         0,
34354222ddf1SHong Zhang                                         0,
34364222ddf1SHong Zhang                                 /* 64*/ 0,
3437321b30b9SSatish Balay                                         MatMatMatMultNumeric_SeqAIJ_SeqAIJ_SeqAIJ,
3438ee4f033dSBarry Smith                                         0,
3439ee4f033dSBarry Smith                                         0,
3440ee4f033dSBarry Smith                                         0,
3441d519adbfSMatthew Knepley                                 /* 69*/ MatGetRowMaxAbs_SeqAIJ,
3442c87e5d42SMatthew Knepley                                         MatGetRowMinAbs_SeqAIJ,
3443ee4f033dSBarry Smith                                         0,
3444dcf5cc72SBarry Smith                                         0,
34452c93a97aSBarry Smith                                         0,
34462c93a97aSBarry Smith                                 /* 74*/ 0,
34473acb8795SBarry Smith                                         MatFDColoringApply_AIJ,
344897304618SKris Buschelman                                         0,
344997304618SKris Buschelman                                         0,
345097304618SKris Buschelman                                         0,
34516ce1633cSBarry Smith                                 /* 79*/ MatFindZeroDiagonals_SeqAIJ,
345297304618SKris Buschelman                                         0,
345397304618SKris Buschelman                                         0,
345497304618SKris Buschelman                                         0,
3455bc011b1eSHong Zhang                                         MatLoad_SeqAIJ,
3456d519adbfSMatthew Knepley                                 /* 84*/ MatIsSymmetric_SeqAIJ,
34571cbb95d3SBarry Smith                                         MatIsHermitian_SeqAIJ,
34586284ec50SHong Zhang                                         0,
34596284ec50SHong Zhang                                         0,
3460bc011b1eSHong Zhang                                         0,
34614222ddf1SHong Zhang                                 /* 89*/ 0,
34624222ddf1SHong Zhang                                         0,
346326be0446SHong Zhang                                         MatMatMultNumeric_SeqAIJ_SeqAIJ,
34644222ddf1SHong Zhang                                         0,
34654222ddf1SHong Zhang                                         0,
34668fa4b5a6SHong Zhang                                 /* 94*/ MatPtAPNumeric_SeqAIJ_SeqAIJ_SparseAxpy,
34674222ddf1SHong Zhang                                         0,
34684222ddf1SHong Zhang                                         0,
34696fc122caSHong Zhang                                         MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ,
34702121bac1SHong Zhang                                         0,
34714222ddf1SHong Zhang                                 /* 99*/ MatProductSetFromOptions_SeqAIJ,
3472609c6c4dSKris Buschelman                                         0,
3473609c6c4dSKris Buschelman                                         0,
347487d4246cSBarry Smith                                         MatConjugate_SeqAIJ,
347587d4246cSBarry Smith                                         0,
3476d519adbfSMatthew Knepley                                 /*104*/ MatSetValuesRow_SeqAIJ,
347799cafbc1SBarry Smith                                         MatRealPart_SeqAIJ,
3478f5edf698SHong Zhang                                         MatImaginaryPart_SeqAIJ,
3479f5edf698SHong Zhang                                         0,
34802bebee5dSHong Zhang                                         0,
3481cbd44569SHong Zhang                                 /*109*/ MatMatSolve_SeqAIJ,
3482985db425SBarry Smith                                         0,
34832af78befSBarry Smith                                         MatGetRowMin_SeqAIJ,
34842af78befSBarry Smith                                         0,
3485599ef60dSHong Zhang                                         MatMissingDiagonal_SeqAIJ,
3486d519adbfSMatthew Knepley                                 /*114*/ 0,
3487599ef60dSHong Zhang                                         0,
34883c2a7987SHong Zhang                                         0,
3489fe97e370SBarry Smith                                         0,
3490fbdbba38SShri Abhyankar                                         0,
3491fbdbba38SShri Abhyankar                                 /*119*/ 0,
3492fbdbba38SShri Abhyankar                                         0,
3493fbdbba38SShri Abhyankar                                         0,
349482d44351SHong Zhang                                         0,
3495b3a44c85SBarry Smith                                         MatGetMultiProcBlock_SeqAIJ,
34960716a85fSBarry Smith                                 /*124*/ MatFindNonzeroRows_SeqAIJ,
3497bbead8a2SBarry Smith                                         MatGetColumnNorms_SeqAIJ,
349837868618SMatthew G Knepley                                         MatInvertBlockDiagonal_SeqAIJ,
34990da83c2eSBarry Smith                                         MatInvertVariableBlockDiagonal_SeqAIJ,
350037868618SMatthew G Knepley                                         0,
35015df89d91SHong Zhang                                 /*129*/ 0,
35024222ddf1SHong Zhang                                         0,
35034222ddf1SHong Zhang                                         0,
350475648e8dSHong Zhang                                         MatTransposeMatMultNumeric_SeqAIJ_SeqAIJ,
3505b9af6bddSHong Zhang                                         MatTransposeColoringCreate_SeqAIJ,
3506b9af6bddSHong Zhang                                 /*134*/ MatTransColoringApplySpToDen_SeqAIJ,
35072b8ad9a3SHong Zhang                                         MatTransColoringApplyDenToSp_SeqAIJ,
35084222ddf1SHong Zhang                                         0,
35094222ddf1SHong Zhang                                         0,
35103964eb88SJed Brown                                         MatRARtNumeric_SeqAIJ_SeqAIJ,
35113964eb88SJed Brown                                  /*139*/0,
3512f9426fe0SMark Adams                                         0,
35131919a2e2SJed Brown                                         0,
35143a062f41SBarry Smith                                         MatFDColoringSetUp_SeqXAIJ,
35159c8f2541SHong Zhang                                         MatFindOffBlockDiagonalEntries_SeqAIJ,
35164222ddf1SHong Zhang                                         MatCreateMPIMatConcatenateSeqMat_SeqAIJ,
35174222ddf1SHong Zhang                                  /*145*/MatDestroySubMatrices_SeqAIJ,
35184222ddf1SHong Zhang                                         0,
35194222ddf1SHong Zhang                                         0
35209e29f15eSvictorle };
352117ab2063SBarry Smith 
35227087cfbeSBarry Smith PetscErrorCode  MatSeqAIJSetColumnIndices_SeqAIJ(Mat mat,PetscInt *indices)
3523bef8e0ddSBarry Smith {
3524bef8e0ddSBarry Smith   Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data;
352597f1f81fSBarry Smith   PetscInt   i,nz,n;
3526bef8e0ddSBarry Smith 
3527bef8e0ddSBarry Smith   PetscFunctionBegin;
3528bef8e0ddSBarry Smith   nz = aij->maxnz;
3529d0f46423SBarry Smith   n  = mat->rmap->n;
3530bef8e0ddSBarry Smith   for (i=0; i<nz; i++) {
3531bef8e0ddSBarry Smith     aij->j[i] = indices[i];
3532bef8e0ddSBarry Smith   }
3533bef8e0ddSBarry Smith   aij->nz = nz;
3534bef8e0ddSBarry Smith   for (i=0; i<n; i++) {
3535bef8e0ddSBarry Smith     aij->ilen[i] = aij->imax[i];
3536bef8e0ddSBarry Smith   }
3537bef8e0ddSBarry Smith   PetscFunctionReturn(0);
3538bef8e0ddSBarry Smith }
3539bef8e0ddSBarry Smith 
3540a3bb6f32SFande Kong /*
3541e8b528d9SFande Kong  * When a sparse matrix has many zero columns, we should compact them out to save the space
3542a3bb6f32SFande Kong  * This happens in MatPtAPSymbolic_MPIAIJ_MPIAIJ_scalable()
3543a3bb6f32SFande Kong  * */
3544a3bb6f32SFande Kong PetscErrorCode  MatSeqAIJCompactOutExtraColumns_SeqAIJ(Mat mat, ISLocalToGlobalMapping *mapping)
3545a3bb6f32SFande Kong {
3546a3bb6f32SFande Kong   Mat_SeqAIJ *aij = (Mat_SeqAIJ*)mat->data;
3547a3bb6f32SFande Kong   PetscTable         gid1_lid1;
3548a3bb6f32SFande Kong   PetscTablePosition tpos;
3549a3bb6f32SFande Kong   PetscInt           gid,lid,i,j,ncols,ec;
3550a3bb6f32SFande Kong   PetscInt           *garray;
3551a3bb6f32SFande Kong   PetscErrorCode  ierr;
3552a3bb6f32SFande Kong 
3553a3bb6f32SFande Kong   PetscFunctionBegin;
3554a3bb6f32SFande Kong   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
3555a3bb6f32SFande Kong   PetscValidPointer(mapping,2);
3556a3bb6f32SFande Kong   /* use a table */
3557a3bb6f32SFande Kong   ierr = PetscTableCreate(mat->rmap->n,mat->cmap->N+1,&gid1_lid1);CHKERRQ(ierr);
3558a3bb6f32SFande Kong   ec = 0;
3559a3bb6f32SFande Kong   for (i=0; i<mat->rmap->n; i++) {
3560a3bb6f32SFande Kong     ncols = aij->i[i+1] - aij->i[i];
3561a3bb6f32SFande Kong     for (j=0; j<ncols; j++) {
3562a3bb6f32SFande Kong       PetscInt data,gid1 = aij->j[aij->i[i] + j] + 1;
3563a3bb6f32SFande Kong       ierr = PetscTableFind(gid1_lid1,gid1,&data);CHKERRQ(ierr);
3564a3bb6f32SFande Kong       if (!data) {
3565a3bb6f32SFande Kong         /* one based table */
3566a3bb6f32SFande Kong         ierr = PetscTableAdd(gid1_lid1,gid1,++ec,INSERT_VALUES);CHKERRQ(ierr);
3567a3bb6f32SFande Kong       }
3568a3bb6f32SFande Kong     }
3569a3bb6f32SFande Kong   }
3570a3bb6f32SFande Kong   /* form array of columns we need */
3571a3bb6f32SFande Kong   ierr = PetscMalloc1(ec+1,&garray);CHKERRQ(ierr);
3572a3bb6f32SFande Kong   ierr = PetscTableGetHeadPosition(gid1_lid1,&tpos);CHKERRQ(ierr);
3573a3bb6f32SFande Kong   while (tpos) {
3574a3bb6f32SFande Kong     ierr = PetscTableGetNext(gid1_lid1,&tpos,&gid,&lid);CHKERRQ(ierr);
3575a3bb6f32SFande Kong     gid--;
3576a3bb6f32SFande Kong     lid--;
3577a3bb6f32SFande Kong     garray[lid] = gid;
3578a3bb6f32SFande Kong   }
3579a3bb6f32SFande Kong   ierr = PetscSortInt(ec,garray);CHKERRQ(ierr); /* sort, and rebuild */
3580a3bb6f32SFande Kong   ierr = PetscTableRemoveAll(gid1_lid1);CHKERRQ(ierr);
3581a3bb6f32SFande Kong   for (i=0; i<ec; i++) {
3582a3bb6f32SFande Kong     ierr = PetscTableAdd(gid1_lid1,garray[i]+1,i+1,INSERT_VALUES);CHKERRQ(ierr);
3583a3bb6f32SFande Kong   }
3584a3bb6f32SFande Kong   /* compact out the extra columns in B */
3585a3bb6f32SFande Kong   for (i=0; i<mat->rmap->n; i++) {
3586a3bb6f32SFande Kong 	ncols = aij->i[i+1] - aij->i[i];
3587a3bb6f32SFande Kong     for (j=0; j<ncols; j++) {
3588a3bb6f32SFande Kong       PetscInt gid1 = aij->j[aij->i[i] + j] + 1;
3589a3bb6f32SFande Kong       ierr = PetscTableFind(gid1_lid1,gid1,&lid);CHKERRQ(ierr);
3590a3bb6f32SFande Kong       lid--;
3591a3bb6f32SFande Kong       aij->j[aij->i[i] + j] = lid;
3592a3bb6f32SFande Kong     }
3593a3bb6f32SFande Kong   }
3594ca5434daSLawrence Mitchell   ierr = PetscLayoutDestroy(&mat->cmap);CHKERRQ(ierr);
3595ca5434daSLawrence Mitchell   ierr = PetscLayoutCreateFromSizes(PetscObjectComm((PetscObject)mat),ec,ec,1,&mat->cmap);CHKERRQ(ierr);
3596a3bb6f32SFande Kong   ierr = PetscTableDestroy(&gid1_lid1);CHKERRQ(ierr);
3597a3bb6f32SFande Kong   ierr = ISLocalToGlobalMappingCreate(PETSC_COMM_SELF,mat->cmap->bs,mat->cmap->n,garray,PETSC_OWN_POINTER,mapping);CHKERRQ(ierr);
3598a3bb6f32SFande Kong   ierr = ISLocalToGlobalMappingSetType(*mapping,ISLOCALTOGLOBALMAPPINGHASH);CHKERRQ(ierr);
3599a3bb6f32SFande Kong   PetscFunctionReturn(0);
3600a3bb6f32SFande Kong }
3601a3bb6f32SFande Kong 
3602bef8e0ddSBarry Smith /*@
3603bef8e0ddSBarry Smith     MatSeqAIJSetColumnIndices - Set the column indices for all the rows
3604bef8e0ddSBarry Smith        in the matrix.
3605bef8e0ddSBarry Smith 
3606bef8e0ddSBarry Smith   Input Parameters:
3607bef8e0ddSBarry Smith +  mat - the SeqAIJ matrix
3608bef8e0ddSBarry Smith -  indices - the column indices
3609bef8e0ddSBarry Smith 
361015091d37SBarry Smith   Level: advanced
361115091d37SBarry Smith 
3612bef8e0ddSBarry Smith   Notes:
3613bef8e0ddSBarry Smith     This can be called if you have precomputed the nonzero structure of the
3614bef8e0ddSBarry Smith   matrix and want to provide it to the matrix object to improve the performance
3615bef8e0ddSBarry Smith   of the MatSetValues() operation.
3616bef8e0ddSBarry Smith 
3617bef8e0ddSBarry Smith     You MUST have set the correct numbers of nonzeros per row in the call to
3618d1be2dadSMatthew Knepley   MatCreateSeqAIJ(), and the columns indices MUST be sorted.
3619bef8e0ddSBarry Smith 
3620bef8e0ddSBarry Smith     MUST be called before any calls to MatSetValues();
3621bef8e0ddSBarry Smith 
3622b9617806SBarry Smith     The indices should start with zero, not one.
3623b9617806SBarry Smith 
3624bef8e0ddSBarry Smith @*/
36257087cfbeSBarry Smith PetscErrorCode  MatSeqAIJSetColumnIndices(Mat mat,PetscInt *indices)
3626bef8e0ddSBarry Smith {
36274ac538c5SBarry Smith   PetscErrorCode ierr;
3628bef8e0ddSBarry Smith 
3629bef8e0ddSBarry Smith   PetscFunctionBegin;
36300700a824SBarry Smith   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
36314482741eSBarry Smith   PetscValidPointer(indices,2);
36324ac538c5SBarry Smith   ierr = PetscUseMethod(mat,"MatSeqAIJSetColumnIndices_C",(Mat,PetscInt*),(mat,indices));CHKERRQ(ierr);
3633bef8e0ddSBarry Smith   PetscFunctionReturn(0);
3634bef8e0ddSBarry Smith }
3635bef8e0ddSBarry Smith 
3636be6bf707SBarry Smith /* ----------------------------------------------------------------------------------------*/
3637be6bf707SBarry Smith 
36387087cfbeSBarry Smith PetscErrorCode  MatStoreValues_SeqAIJ(Mat mat)
3639be6bf707SBarry Smith {
3640be6bf707SBarry Smith   Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)mat->data;
36416849ba73SBarry Smith   PetscErrorCode ierr;
3642d0f46423SBarry Smith   size_t         nz = aij->i[mat->rmap->n];
3643be6bf707SBarry Smith 
3644be6bf707SBarry Smith   PetscFunctionBegin;
3645169f6850SBarry Smith   if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3646be6bf707SBarry Smith 
3647be6bf707SBarry Smith   /* allocate space for values if not already there */
3648be6bf707SBarry Smith   if (!aij->saved_values) {
3649854ce69bSBarry Smith     ierr = PetscMalloc1(nz+1,&aij->saved_values);CHKERRQ(ierr);
36503bb1ff40SBarry Smith     ierr = PetscLogObjectMemory((PetscObject)mat,(nz+1)*sizeof(PetscScalar));CHKERRQ(ierr);
3651be6bf707SBarry Smith   }
3652be6bf707SBarry Smith 
3653be6bf707SBarry Smith   /* copy values over */
3654580bdb30SBarry Smith   ierr = PetscArraycpy(aij->saved_values,aij->a,nz);CHKERRQ(ierr);
3655be6bf707SBarry Smith   PetscFunctionReturn(0);
3656be6bf707SBarry Smith }
3657be6bf707SBarry Smith 
3658be6bf707SBarry Smith /*@
3659be6bf707SBarry Smith     MatStoreValues - Stashes a copy of the matrix values; this allows, for
3660be6bf707SBarry Smith        example, reuse of the linear part of a Jacobian, while recomputing the
3661be6bf707SBarry Smith        nonlinear portion.
3662be6bf707SBarry Smith 
3663be6bf707SBarry Smith    Collect on Mat
3664be6bf707SBarry Smith 
3665be6bf707SBarry Smith   Input Parameters:
36660e609b76SBarry Smith .  mat - the matrix (currently only AIJ matrices support this option)
3667be6bf707SBarry Smith 
366815091d37SBarry Smith   Level: advanced
366915091d37SBarry Smith 
3670be6bf707SBarry Smith   Common Usage, with SNESSolve():
3671be6bf707SBarry Smith $    Create Jacobian matrix
3672be6bf707SBarry Smith $    Set linear terms into matrix
3673be6bf707SBarry Smith $    Apply boundary conditions to matrix, at this time matrix must have
3674be6bf707SBarry Smith $      final nonzero structure (i.e. setting the nonlinear terms and applying
3675be6bf707SBarry Smith $      boundary conditions again will not change the nonzero structure
3676512a5fc5SBarry Smith $    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
3677be6bf707SBarry Smith $    ierr = MatStoreValues(mat);
3678be6bf707SBarry Smith $    Call SNESSetJacobian() with matrix
3679be6bf707SBarry Smith $    In your Jacobian routine
3680be6bf707SBarry Smith $      ierr = MatRetrieveValues(mat);
3681be6bf707SBarry Smith $      Set nonlinear terms in matrix
3682be6bf707SBarry Smith 
3683be6bf707SBarry Smith   Common Usage without SNESSolve(), i.e. when you handle nonlinear solve yourself:
3684be6bf707SBarry Smith $    // build linear portion of Jacobian
3685512a5fc5SBarry Smith $    ierr = MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);
3686be6bf707SBarry Smith $    ierr = MatStoreValues(mat);
3687be6bf707SBarry Smith $    loop over nonlinear iterations
3688be6bf707SBarry Smith $       ierr = MatRetrieveValues(mat);
3689be6bf707SBarry Smith $       // call MatSetValues(mat,...) to set nonliner portion of Jacobian
3690be6bf707SBarry Smith $       // call MatAssemblyBegin/End() on matrix
3691be6bf707SBarry Smith $       Solve linear system with Jacobian
3692be6bf707SBarry Smith $    endloop
3693be6bf707SBarry Smith 
3694be6bf707SBarry Smith   Notes:
3695be6bf707SBarry Smith     Matrix must already be assemblied before calling this routine
3696512a5fc5SBarry Smith     Must set the matrix option MatSetOption(mat,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE); before
3697be6bf707SBarry Smith     calling this routine.
3698be6bf707SBarry Smith 
36990c468ba9SBarry Smith     When this is called multiple times it overwrites the previous set of stored values
37000c468ba9SBarry Smith     and does not allocate additional space.
37010c468ba9SBarry Smith 
3702be6bf707SBarry Smith .seealso: MatRetrieveValues()
3703be6bf707SBarry Smith 
3704be6bf707SBarry Smith @*/
37057087cfbeSBarry Smith PetscErrorCode  MatStoreValues(Mat mat)
3706be6bf707SBarry Smith {
37074ac538c5SBarry Smith   PetscErrorCode ierr;
3708be6bf707SBarry Smith 
3709be6bf707SBarry Smith   PetscFunctionBegin;
37100700a824SBarry Smith   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
3711e32f2f54SBarry Smith   if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix");
3712e32f2f54SBarry Smith   if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix");
37134ac538c5SBarry Smith   ierr = PetscUseMethod(mat,"MatStoreValues_C",(Mat),(mat));CHKERRQ(ierr);
3714be6bf707SBarry Smith   PetscFunctionReturn(0);
3715be6bf707SBarry Smith }
3716be6bf707SBarry Smith 
37177087cfbeSBarry Smith PetscErrorCode  MatRetrieveValues_SeqAIJ(Mat mat)
3718be6bf707SBarry Smith {
3719be6bf707SBarry Smith   Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)mat->data;
37206849ba73SBarry Smith   PetscErrorCode ierr;
3721d0f46423SBarry Smith   PetscInt       nz = aij->i[mat->rmap->n];
3722be6bf707SBarry Smith 
3723be6bf707SBarry Smith   PetscFunctionBegin;
3724169f6850SBarry Smith   if (!aij->nonew) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatSetOption(A,MAT_NEW_NONZERO_LOCATIONS,PETSC_FALSE);first");
3725f23aa3ddSBarry Smith   if (!aij->saved_values) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ORDER,"Must call MatStoreValues(A);first");
3726be6bf707SBarry Smith   /* copy values over */
3727580bdb30SBarry Smith   ierr = PetscArraycpy(aij->a,aij->saved_values,nz);CHKERRQ(ierr);
3728be6bf707SBarry Smith   PetscFunctionReturn(0);
3729be6bf707SBarry Smith }
3730be6bf707SBarry Smith 
3731be6bf707SBarry Smith /*@
3732be6bf707SBarry Smith     MatRetrieveValues - Retrieves the copy of the matrix values; this allows, for
3733be6bf707SBarry Smith        example, reuse of the linear part of a Jacobian, while recomputing the
3734be6bf707SBarry Smith        nonlinear portion.
3735be6bf707SBarry Smith 
3736be6bf707SBarry Smith    Collective on Mat
3737be6bf707SBarry Smith 
3738be6bf707SBarry Smith   Input Parameters:
3739386f7cf9SBarry Smith .  mat - the matrix (currently only AIJ matrices support this option)
3740be6bf707SBarry Smith 
374115091d37SBarry Smith   Level: advanced
374215091d37SBarry Smith 
3743be6bf707SBarry Smith .seealso: MatStoreValues()
3744be6bf707SBarry Smith 
3745be6bf707SBarry Smith @*/
37467087cfbeSBarry Smith PetscErrorCode  MatRetrieveValues(Mat mat)
3747be6bf707SBarry Smith {
37484ac538c5SBarry Smith   PetscErrorCode ierr;
3749be6bf707SBarry Smith 
3750be6bf707SBarry Smith   PetscFunctionBegin;
37510700a824SBarry Smith   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
3752e32f2f54SBarry Smith   if (!mat->assembled) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for unassembled matrix");
3753e32f2f54SBarry Smith   if (mat->factortype) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"Not for factored matrix");
37544ac538c5SBarry Smith   ierr = PetscUseMethod(mat,"MatRetrieveValues_C",(Mat),(mat));CHKERRQ(ierr);
3755be6bf707SBarry Smith   PetscFunctionReturn(0);
3756be6bf707SBarry Smith }
3757be6bf707SBarry Smith 
3758f83d6046SBarry Smith 
3759be6bf707SBarry Smith /* --------------------------------------------------------------------------------*/
376017ab2063SBarry Smith /*@C
3761682d7d0cSBarry Smith    MatCreateSeqAIJ - Creates a sparse matrix in AIJ (compressed row) format
37620d15e28bSLois Curfman McInnes    (the default parallel PETSc format).  For good matrix assembly performance
37636e62573dSLois Curfman McInnes    the user should preallocate the matrix storage by setting the parameter nz
376451c19458SBarry Smith    (or the array nnz).  By setting these parameters accurately, performance
37652bd5e0b2SLois Curfman McInnes    during matrix assembly can be increased by more than a factor of 50.
376617ab2063SBarry Smith 
3767d083f849SBarry Smith    Collective
3768db81eaa0SLois Curfman McInnes 
376917ab2063SBarry Smith    Input Parameters:
3770db81eaa0SLois Curfman McInnes +  comm - MPI communicator, set to PETSC_COMM_SELF
377117ab2063SBarry Smith .  m - number of rows
377217ab2063SBarry Smith .  n - number of columns
377317ab2063SBarry Smith .  nz - number of nonzeros per row (same for all rows)
377451c19458SBarry Smith -  nnz - array containing the number of nonzeros in the various rows
37750298fd71SBarry Smith          (possibly different for each row) or NULL
377617ab2063SBarry Smith 
377717ab2063SBarry Smith    Output Parameter:
3778416022c9SBarry Smith .  A - the matrix
377917ab2063SBarry Smith 
3780175b88e8SBarry Smith    It is recommended that one use the MatCreate(), MatSetType() and/or MatSetFromOptions(),
3781f6f02116SRichard Tran Mills    MatXXXXSetPreallocation() paradigm instead of this routine directly.
3782175b88e8SBarry Smith    [MatXXXXSetPreallocation() is, for example, MatSeqAIJSetPreallocation]
3783175b88e8SBarry Smith 
3784b259b22eSLois Curfman McInnes    Notes:
378549a6f317SBarry Smith    If nnz is given then nz is ignored
378649a6f317SBarry Smith 
378717ab2063SBarry Smith    The AIJ format (also called the Yale sparse matrix format or
378817ab2063SBarry Smith    compressed row storage), is fully compatible with standard Fortran 77
37890002213bSLois Curfman McInnes    storage.  That is, the stored row and column indices can begin at
379044cd7ae7SLois Curfman McInnes    either one (as in Fortran) or zero.  See the users' manual for details.
379117ab2063SBarry Smith 
379217ab2063SBarry Smith    Specify the preallocated storage with either nz or nnz (not both).
37930298fd71SBarry Smith    Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory
37943d323bbdSBarry Smith    allocation.  For large problems you MUST preallocate memory or you
37956da5968aSLois Curfman McInnes    will get TERRIBLE performance, see the users' manual chapter on matrices.
379617ab2063SBarry Smith 
3797682d7d0cSBarry Smith    By default, this format uses inodes (identical nodes) when possible, to
37984fca80b9SLois Curfman McInnes    improve numerical efficiency of matrix-vector products and solves. We
3799682d7d0cSBarry Smith    search for consecutive rows with the same nonzero structure, thereby
38006c7ebb05SLois Curfman McInnes    reusing matrix information to achieve increased efficiency.
38016c7ebb05SLois Curfman McInnes 
38026c7ebb05SLois Curfman McInnes    Options Database Keys:
3803698d4c6aSKris Buschelman +  -mat_no_inode  - Do not use inodes
38049db58ca8SBarry Smith -  -mat_inode_limit <limit> - Sets inode limit (max limit=5)
380517ab2063SBarry Smith 
3806027ccd11SLois Curfman McInnes    Level: intermediate
3807027ccd11SLois Curfman McInnes 
380869b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays()
380936db0b34SBarry Smith 
381017ab2063SBarry Smith @*/
38117087cfbeSBarry Smith PetscErrorCode  MatCreateSeqAIJ(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt nz,const PetscInt nnz[],Mat *A)
381217ab2063SBarry Smith {
3813dfbe8321SBarry Smith   PetscErrorCode ierr;
38146945ee14SBarry Smith 
38153a40ed3dSBarry Smith   PetscFunctionBegin;
3816f69a0ea3SMatthew Knepley   ierr = MatCreate(comm,A);CHKERRQ(ierr);
3817117016b1SBarry Smith   ierr = MatSetSizes(*A,m,n,m,n);CHKERRQ(ierr);
3818c4752a88SBarry Smith   ierr = MatSetType(*A,MATSEQAIJ);CHKERRQ(ierr);
3819d28bb7d2SJed Brown   ierr = MatSeqAIJSetPreallocation_SeqAIJ(*A,nz,nnz);CHKERRQ(ierr);
3820273d9f13SBarry Smith   PetscFunctionReturn(0);
3821273d9f13SBarry Smith }
3822273d9f13SBarry Smith 
3823273d9f13SBarry Smith /*@C
3824273d9f13SBarry Smith    MatSeqAIJSetPreallocation - For good matrix assembly performance
3825273d9f13SBarry Smith    the user should preallocate the matrix storage by setting the parameter nz
3826273d9f13SBarry Smith    (or the array nnz).  By setting these parameters accurately, performance
3827273d9f13SBarry Smith    during matrix assembly can be increased by more than a factor of 50.
3828273d9f13SBarry Smith 
3829d083f849SBarry Smith    Collective
3830273d9f13SBarry Smith 
3831273d9f13SBarry Smith    Input Parameters:
38321c4f3114SJed Brown +  B - The matrix
3833273d9f13SBarry Smith .  nz - number of nonzeros per row (same for all rows)
3834273d9f13SBarry Smith -  nnz - array containing the number of nonzeros in the various rows
38350298fd71SBarry Smith          (possibly different for each row) or NULL
3836273d9f13SBarry Smith 
3837273d9f13SBarry Smith    Notes:
383849a6f317SBarry Smith      If nnz is given then nz is ignored
383949a6f317SBarry Smith 
3840273d9f13SBarry Smith     The AIJ format (also called the Yale sparse matrix format or
3841273d9f13SBarry Smith    compressed row storage), is fully compatible with standard Fortran 77
3842273d9f13SBarry Smith    storage.  That is, the stored row and column indices can begin at
3843273d9f13SBarry Smith    either one (as in Fortran) or zero.  See the users' manual for details.
3844273d9f13SBarry Smith 
3845273d9f13SBarry Smith    Specify the preallocated storage with either nz or nnz (not both).
38460298fd71SBarry Smith    Set nz=PETSC_DEFAULT and nnz=NULL for PETSc to control dynamic memory
3847273d9f13SBarry Smith    allocation.  For large problems you MUST preallocate memory or you
3848273d9f13SBarry Smith    will get TERRIBLE performance, see the users' manual chapter on matrices.
3849273d9f13SBarry Smith 
3850aa95bbe8SBarry Smith    You can call MatGetInfo() to get information on how effective the preallocation was;
3851aa95bbe8SBarry Smith    for example the fields mallocs,nz_allocated,nz_used,nz_unneeded;
3852aa95bbe8SBarry Smith    You can also run with the option -info and look for messages with the string
3853aa95bbe8SBarry Smith    malloc in them to see if additional memory allocation was needed.
3854aa95bbe8SBarry Smith 
3855a96a251dSBarry Smith    Developers: Use nz of MAT_SKIP_ALLOCATION to not allocate any space for the matrix
3856a96a251dSBarry Smith    entries or columns indices
3857a96a251dSBarry Smith 
3858273d9f13SBarry Smith    By default, this format uses inodes (identical nodes) when possible, to
3859273d9f13SBarry Smith    improve numerical efficiency of matrix-vector products and solves. We
3860273d9f13SBarry Smith    search for consecutive rows with the same nonzero structure, thereby
3861273d9f13SBarry Smith    reusing matrix information to achieve increased efficiency.
3862273d9f13SBarry Smith 
3863273d9f13SBarry Smith    Options Database Keys:
3864698d4c6aSKris Buschelman +  -mat_no_inode  - Do not use inodes
386547b2e64bSBarry Smith -  -mat_inode_limit <limit> - Sets inode limit (max limit=5)
3866273d9f13SBarry Smith 
3867273d9f13SBarry Smith    Level: intermediate
3868273d9f13SBarry Smith 
386969b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatSetValues(), MatSeqAIJSetColumnIndices(), MatCreateSeqAIJWithArrays(), MatGetInfo()
3870273d9f13SBarry Smith 
3871273d9f13SBarry Smith @*/
38727087cfbeSBarry Smith PetscErrorCode  MatSeqAIJSetPreallocation(Mat B,PetscInt nz,const PetscInt nnz[])
3873273d9f13SBarry Smith {
38744ac538c5SBarry Smith   PetscErrorCode ierr;
3875a23d5eceSKris Buschelman 
3876a23d5eceSKris Buschelman   PetscFunctionBegin;
38776ba663aaSJed Brown   PetscValidHeaderSpecific(B,MAT_CLASSID,1);
38786ba663aaSJed Brown   PetscValidType(B,1);
38794ac538c5SBarry Smith   ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocation_C",(Mat,PetscInt,const PetscInt[]),(B,nz,nnz));CHKERRQ(ierr);
3880a23d5eceSKris Buschelman   PetscFunctionReturn(0);
3881a23d5eceSKris Buschelman }
3882a23d5eceSKris Buschelman 
38837087cfbeSBarry Smith PetscErrorCode  MatSeqAIJSetPreallocation_SeqAIJ(Mat B,PetscInt nz,const PetscInt *nnz)
3884a23d5eceSKris Buschelman {
3885273d9f13SBarry Smith   Mat_SeqAIJ     *b;
38862576faa2SJed Brown   PetscBool      skipallocation = PETSC_FALSE,realalloc = PETSC_FALSE;
38876849ba73SBarry Smith   PetscErrorCode ierr;
388897f1f81fSBarry Smith   PetscInt       i;
3889273d9f13SBarry Smith 
3890273d9f13SBarry Smith   PetscFunctionBegin;
38912576faa2SJed Brown   if (nz >= 0 || nnz) realalloc = PETSC_TRUE;
3892a96a251dSBarry Smith   if (nz == MAT_SKIP_ALLOCATION) {
3893c461c341SBarry Smith     skipallocation = PETSC_TRUE;
3894c461c341SBarry Smith     nz             = 0;
3895c461c341SBarry Smith   }
389626283091SBarry Smith   ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr);
389726283091SBarry Smith   ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr);
3898899cda47SBarry Smith 
3899435da068SBarry Smith   if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 5;
390060e0710aSBarry Smith   if (nz < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nz cannot be less than 0: value %D",nz);
3901cf9c20a2SJed Brown   if (PetscUnlikelyDebug(nnz)) {
3902d0f46423SBarry Smith     for (i=0; i<B->rmap->n; i++) {
390360e0710aSBarry Smith       if (nnz[i] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be less than 0: local row %D value %D",i,nnz[i]);
390460e0710aSBarry Smith       if (nnz[i] > B->cmap->n) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"nnz cannot be greater than row length: local row %D value %d rowlength %D",i,nnz[i],B->cmap->n);
3905b73539f3SBarry Smith     }
3906b73539f3SBarry Smith   }
3907b73539f3SBarry Smith 
3908273d9f13SBarry Smith   B->preallocated = PETSC_TRUE;
39092205254eSKarl Rupp 
3910273d9f13SBarry Smith   b = (Mat_SeqAIJ*)B->data;
3911273d9f13SBarry Smith 
3912ab93d7beSBarry Smith   if (!skipallocation) {
39132ee49352SLisandro Dalcin     if (!b->imax) {
3914071fcb05SBarry Smith       ierr = PetscMalloc1(B->rmap->n,&b->imax);CHKERRQ(ierr);
3915071fcb05SBarry Smith       ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr);
3916071fcb05SBarry Smith     }
3917071fcb05SBarry Smith     if (!b->ilen) {
3918071fcb05SBarry Smith       /* b->ilen will count nonzeros in each row so far. */
3919071fcb05SBarry Smith       ierr = PetscCalloc1(B->rmap->n,&b->ilen);CHKERRQ(ierr);
3920071fcb05SBarry Smith       ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr);
3921071fcb05SBarry Smith     } else {
3922071fcb05SBarry Smith       ierr = PetscMemzero(b->ilen,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr);
39232ee49352SLisandro Dalcin     }
3924846b4da1SFande Kong     if (!b->ipre) {
3925846b4da1SFande Kong       ierr = PetscMalloc1(B->rmap->n,&b->ipre);CHKERRQ(ierr);
3926846b4da1SFande Kong       ierr = PetscLogObjectMemory((PetscObject)B,B->rmap->n*sizeof(PetscInt));CHKERRQ(ierr);
3927846b4da1SFande Kong     }
3928273d9f13SBarry Smith     if (!nnz) {
3929435da068SBarry Smith       if (nz == PETSC_DEFAULT || nz == PETSC_DECIDE) nz = 10;
3930c62bd62aSJed Brown       else if (nz < 0) nz = 1;
39315d2a9ed1SStefano Zampini       nz = PetscMin(nz,B->cmap->n);
3932d0f46423SBarry Smith       for (i=0; i<B->rmap->n; i++) b->imax[i] = nz;
3933d0f46423SBarry Smith       nz = nz*B->rmap->n;
3934273d9f13SBarry Smith     } else {
3935c73702f5SBarry Smith       PetscInt64 nz64 = 0;
3936c73702f5SBarry Smith       for (i=0; i<B->rmap->n; i++) {b->imax[i] = nnz[i]; nz64 += nnz[i];}
3937c73702f5SBarry Smith       ierr = PetscIntCast(nz64,&nz);CHKERRQ(ierr);
3938273d9f13SBarry Smith     }
3939ab93d7beSBarry Smith 
3940273d9f13SBarry Smith     /* allocate the matrix space */
394153dd7562SDmitry Karpeev     /* FIXME: should B's old memory be unlogged? */
39422ee49352SLisandro Dalcin     ierr = MatSeqXAIJFreeAIJ(B,&b->a,&b->j,&b->i);CHKERRQ(ierr);
3943396832f4SHong Zhang     if (B->structure_only) {
39445848002fSHong Zhang       ierr = PetscMalloc1(nz,&b->j);CHKERRQ(ierr);
39455848002fSHong Zhang       ierr = PetscMalloc1(B->rmap->n+1,&b->i);CHKERRQ(ierr);
3946396832f4SHong Zhang       ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*sizeof(PetscInt));CHKERRQ(ierr);
3947396832f4SHong Zhang     } else {
3948dcca6d9dSJed Brown       ierr = PetscMalloc3(nz,&b->a,nz,&b->j,B->rmap->n+1,&b->i);CHKERRQ(ierr);
39493bb1ff40SBarry Smith       ierr = PetscLogObjectMemory((PetscObject)B,(B->rmap->n+1)*sizeof(PetscInt)+nz*(sizeof(PetscScalar)+sizeof(PetscInt)));CHKERRQ(ierr);
3950396832f4SHong Zhang     }
3951bfeeae90SHong Zhang     b->i[0] = 0;
3952d0f46423SBarry Smith     for (i=1; i<B->rmap->n+1; i++) {
39535da197adSKris Buschelman       b->i[i] = b->i[i-1] + b->imax[i-1];
39545da197adSKris Buschelman     }
3955396832f4SHong Zhang     if (B->structure_only) {
3956396832f4SHong Zhang       b->singlemalloc = PETSC_FALSE;
3957396832f4SHong Zhang       b->free_a       = PETSC_FALSE;
3958396832f4SHong Zhang     } else {
3959273d9f13SBarry Smith       b->singlemalloc = PETSC_TRUE;
3960e6b907acSBarry Smith       b->free_a       = PETSC_TRUE;
3961396832f4SHong Zhang     }
3962e6b907acSBarry Smith     b->free_ij      = PETSC_TRUE;
3963c461c341SBarry Smith   } else {
3964e6b907acSBarry Smith     b->free_a  = PETSC_FALSE;
3965e6b907acSBarry Smith     b->free_ij = PETSC_FALSE;
3966c461c341SBarry Smith   }
3967273d9f13SBarry Smith 
3968846b4da1SFande Kong   if (b->ipre && nnz != b->ipre  && b->imax) {
3969846b4da1SFande Kong     /* reserve user-requested sparsity */
3970580bdb30SBarry Smith     ierr = PetscArraycpy(b->ipre,b->imax,B->rmap->n);CHKERRQ(ierr);
3971846b4da1SFande Kong   }
3972846b4da1SFande Kong 
3973846b4da1SFande Kong 
3974273d9f13SBarry Smith   b->nz               = 0;
3975273d9f13SBarry Smith   b->maxnz            = nz;
3976273d9f13SBarry Smith   B->info.nz_unneeded = (double)b->maxnz;
39772205254eSKarl Rupp   if (realalloc) {
39782205254eSKarl Rupp     ierr = MatSetOption(B,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
39792205254eSKarl Rupp   }
3980cb7b82ddSBarry Smith   B->was_assembled = PETSC_FALSE;
3981cb7b82ddSBarry Smith   B->assembled     = PETSC_FALSE;
3982273d9f13SBarry Smith   PetscFunctionReturn(0);
3983273d9f13SBarry Smith }
3984273d9f13SBarry Smith 
3985846b4da1SFande Kong 
3986846b4da1SFande Kong PetscErrorCode MatResetPreallocation_SeqAIJ(Mat A)
3987846b4da1SFande Kong {
3988846b4da1SFande Kong   Mat_SeqAIJ     *a;
3989a5bbaf83SFande Kong   PetscInt       i;
3990846b4da1SFande Kong   PetscErrorCode ierr;
3991846b4da1SFande Kong 
3992846b4da1SFande Kong   PetscFunctionBegin;
3993846b4da1SFande Kong   PetscValidHeaderSpecific(A,MAT_CLASSID,1);
399414d0e64fSAlex Lindsay 
399514d0e64fSAlex Lindsay   /* Check local size. If zero, then return */
399614d0e64fSAlex Lindsay   if (!A->rmap->n) PetscFunctionReturn(0);
399714d0e64fSAlex Lindsay 
3998846b4da1SFande Kong   a = (Mat_SeqAIJ*)A->data;
39992c814fdeSFande Kong   /* if no saved info, we error out */
4000fb4dc15dSAlex Lindsay   if (!a->ipre) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"No saved preallocation info \n");
40012c814fdeSFande Kong 
4002fb4dc15dSAlex Lindsay   if (!a->i || !a->j || !a->a || !a->imax || !a->ilen) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_NULL,"Memory info is incomplete, and can not reset preallocation \n");
40032c814fdeSFande Kong 
4004580bdb30SBarry Smith   ierr = PetscArraycpy(a->imax,a->ipre,A->rmap->n);CHKERRQ(ierr);
4005580bdb30SBarry Smith   ierr = PetscArrayzero(a->ilen,A->rmap->n);CHKERRQ(ierr);
4006846b4da1SFande Kong   a->i[0] = 0;
4007846b4da1SFande Kong   for (i=1; i<A->rmap->n+1; i++) {
4008846b4da1SFande Kong     a->i[i] = a->i[i-1] + a->imax[i-1];
4009846b4da1SFande Kong   }
4010846b4da1SFande Kong   A->preallocated     = PETSC_TRUE;
4011846b4da1SFande Kong   a->nz               = 0;
4012846b4da1SFande Kong   a->maxnz            = a->i[A->rmap->n];
4013846b4da1SFande Kong   A->info.nz_unneeded = (double)a->maxnz;
4014846b4da1SFande Kong   A->was_assembled    = PETSC_FALSE;
4015846b4da1SFande Kong   A->assembled        = PETSC_FALSE;
4016846b4da1SFande Kong   PetscFunctionReturn(0);
4017846b4da1SFande Kong }
4018846b4da1SFande Kong 
401958d36128SBarry Smith /*@
4020a1661176SMatthew Knepley    MatSeqAIJSetPreallocationCSR - Allocates memory for a sparse sequential matrix in AIJ format.
4021a1661176SMatthew Knepley 
4022a1661176SMatthew Knepley    Input Parameters:
4023a1661176SMatthew Knepley +  B - the matrix
4024a1661176SMatthew Knepley .  i - the indices into j for the start of each row (starts with zero)
4025a1661176SMatthew Knepley .  j - the column indices for each row (starts with zero) these must be sorted for each row
4026a1661176SMatthew Knepley -  v - optional values in the matrix
4027a1661176SMatthew Knepley 
4028a1661176SMatthew Knepley    Level: developer
4029a1661176SMatthew Knepley 
403058d36128SBarry Smith    The i,j,v values are COPIED with this routine; to avoid the copy use MatCreateSeqAIJWithArrays()
403158d36128SBarry Smith 
4032c1c1d628SHong Zhang .seealso: MatCreate(), MatCreateSeqAIJ(), MatSetValues(), MatSeqAIJSetPreallocation(), MatCreateSeqAIJ(), MATSEQAIJ
4033a1661176SMatthew Knepley @*/
4034a1661176SMatthew Knepley PetscErrorCode MatSeqAIJSetPreallocationCSR(Mat B,const PetscInt i[],const PetscInt j[],const PetscScalar v[])
4035a1661176SMatthew Knepley {
4036a1661176SMatthew Knepley   PetscErrorCode ierr;
4037a1661176SMatthew Knepley 
4038a1661176SMatthew Knepley   PetscFunctionBegin;
40390700a824SBarry Smith   PetscValidHeaderSpecific(B,MAT_CLASSID,1);
40406ba663aaSJed Brown   PetscValidType(B,1);
40414ac538c5SBarry Smith   ierr = PetscTryMethod(B,"MatSeqAIJSetPreallocationCSR_C",(Mat,const PetscInt[],const PetscInt[],const PetscScalar[]),(B,i,j,v));CHKERRQ(ierr);
4042a1661176SMatthew Knepley   PetscFunctionReturn(0);
4043a1661176SMatthew Knepley }
4044a1661176SMatthew Knepley 
40457087cfbeSBarry Smith PetscErrorCode  MatSeqAIJSetPreallocationCSR_SeqAIJ(Mat B,const PetscInt Ii[],const PetscInt J[],const PetscScalar v[])
4046a1661176SMatthew Knepley {
4047a1661176SMatthew Knepley   PetscInt       i;
4048a1661176SMatthew Knepley   PetscInt       m,n;
4049a1661176SMatthew Knepley   PetscInt       nz;
4050a1661176SMatthew Knepley   PetscInt       *nnz, nz_max = 0;
4051a1661176SMatthew Knepley   PetscErrorCode ierr;
4052a1661176SMatthew Knepley 
4053a1661176SMatthew Knepley   PetscFunctionBegin;
405465e19b50SBarry Smith   if (Ii[0]) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Ii[0] must be 0 it is %D", Ii[0]);
4055779a8d59SSatish Balay 
4056779a8d59SSatish Balay   ierr = PetscLayoutSetUp(B->rmap);CHKERRQ(ierr);
4057779a8d59SSatish Balay   ierr = PetscLayoutSetUp(B->cmap);CHKERRQ(ierr);
4058779a8d59SSatish Balay 
4059779a8d59SSatish Balay   ierr = MatGetSize(B, &m, &n);CHKERRQ(ierr);
4060854ce69bSBarry Smith   ierr = PetscMalloc1(m+1, &nnz);CHKERRQ(ierr);
4061a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4062b7940d39SSatish Balay     nz     = Ii[i+1]- Ii[i];
4063a1661176SMatthew Knepley     nz_max = PetscMax(nz_max, nz);
406465e19b50SBarry Smith     if (nz < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE, "Local row %D has a negative number of columns %D", i, nnz);
4065a1661176SMatthew Knepley     nnz[i] = nz;
4066a1661176SMatthew Knepley   }
4067a1661176SMatthew Knepley   ierr = MatSeqAIJSetPreallocation(B, 0, nnz);CHKERRQ(ierr);
4068a1661176SMatthew Knepley   ierr = PetscFree(nnz);CHKERRQ(ierr);
4069a1661176SMatthew Knepley 
4070a1661176SMatthew Knepley   for (i = 0; i < m; i++) {
4071071fcb05SBarry Smith     ierr = MatSetValues_SeqAIJ(B, 1, &i, Ii[i+1] - Ii[i], J+Ii[i], v ? v + Ii[i] : NULL, INSERT_VALUES);CHKERRQ(ierr);
4072a1661176SMatthew Knepley   }
4073a1661176SMatthew Knepley 
4074a1661176SMatthew Knepley   ierr = MatAssemblyBegin(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4075a1661176SMatthew Knepley   ierr = MatAssemblyEnd(B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4076a1661176SMatthew Knepley 
40777827cd58SJed Brown   ierr = MatSetOption(B,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
4078a1661176SMatthew Knepley   PetscFunctionReturn(0);
4079a1661176SMatthew Knepley }
4080a1661176SMatthew Knepley 
4081c6db04a5SJed Brown #include <../src/mat/impls/dense/seq/dense.h>
4082af0996ceSBarry Smith #include <petsc/private/kernels/petscaxpy.h>
4083170fe5c8SBarry Smith 
4084170fe5c8SBarry Smith /*
4085170fe5c8SBarry Smith     Computes (B'*A')' since computing B*A directly is untenable
4086170fe5c8SBarry Smith 
4087170fe5c8SBarry Smith                n                       p                          p
4088170fe5c8SBarry Smith         (              )       (              )         (                  )
4089170fe5c8SBarry Smith       m (      A       )  *  n (       B      )   =   m (         C        )
4090170fe5c8SBarry Smith         (              )       (              )         (                  )
4091170fe5c8SBarry Smith 
4092170fe5c8SBarry Smith */
4093170fe5c8SBarry Smith PetscErrorCode MatMatMultNumeric_SeqDense_SeqAIJ(Mat A,Mat B,Mat C)
4094170fe5c8SBarry Smith {
4095170fe5c8SBarry Smith   PetscErrorCode    ierr;
4096170fe5c8SBarry Smith   Mat_SeqDense      *sub_a = (Mat_SeqDense*)A->data;
4097170fe5c8SBarry Smith   Mat_SeqAIJ        *sub_b = (Mat_SeqAIJ*)B->data;
4098170fe5c8SBarry Smith   Mat_SeqDense      *sub_c = (Mat_SeqDense*)C->data;
409986214ceeSStefano Zampini   PetscInt          i,j,n,m,q,p;
4100170fe5c8SBarry Smith   const PetscInt    *ii,*idx;
4101170fe5c8SBarry Smith   const PetscScalar *b,*a,*a_q;
4102170fe5c8SBarry Smith   PetscScalar       *c,*c_q;
410386214ceeSStefano Zampini   PetscInt          clda = sub_c->lda;
410486214ceeSStefano Zampini   PetscInt          alda = sub_a->lda;
4105170fe5c8SBarry Smith 
4106170fe5c8SBarry Smith   PetscFunctionBegin;
4107d0f46423SBarry Smith   m    = A->rmap->n;
4108d0f46423SBarry Smith   n    = A->cmap->n;
4109d0f46423SBarry Smith   p    = B->cmap->n;
4110170fe5c8SBarry Smith   a    = sub_a->v;
4111170fe5c8SBarry Smith   b    = sub_b->a;
4112170fe5c8SBarry Smith   c    = sub_c->v;
411386214ceeSStefano Zampini   if (clda == m) {
4114580bdb30SBarry Smith     ierr = PetscArrayzero(c,m*p);CHKERRQ(ierr);
411586214ceeSStefano Zampini   } else {
411686214ceeSStefano Zampini     for (j=0;j<p;j++)
411786214ceeSStefano Zampini       for (i=0;i<m;i++)
411886214ceeSStefano Zampini         c[j*clda + i] = 0.0;
411986214ceeSStefano Zampini   }
4120170fe5c8SBarry Smith   ii  = sub_b->i;
4121170fe5c8SBarry Smith   idx = sub_b->j;
4122170fe5c8SBarry Smith   for (i=0; i<n; i++) {
4123170fe5c8SBarry Smith     q = ii[i+1] - ii[i];
4124170fe5c8SBarry Smith     while (q-->0) {
412586214ceeSStefano Zampini       c_q = c + clda*(*idx);
412686214ceeSStefano Zampini       a_q = a + alda*i;
4127854c7f52SBarry Smith       PetscKernelAXPY(c_q,*b,a_q,m);
4128170fe5c8SBarry Smith       idx++;
4129170fe5c8SBarry Smith       b++;
4130170fe5c8SBarry Smith     }
4131170fe5c8SBarry Smith   }
4132170fe5c8SBarry Smith   PetscFunctionReturn(0);
4133170fe5c8SBarry Smith }
4134170fe5c8SBarry Smith 
41354222ddf1SHong Zhang PetscErrorCode MatMatMultSymbolic_SeqDense_SeqAIJ(Mat A,Mat B,PetscReal fill,Mat C)
4136170fe5c8SBarry Smith {
4137170fe5c8SBarry Smith   PetscErrorCode ierr;
4138d0f46423SBarry Smith   PetscInt       m=A->rmap->n,n=B->cmap->n;
413986214ceeSStefano Zampini   PetscBool      cisdense;
4140170fe5c8SBarry Smith 
4141170fe5c8SBarry Smith   PetscFunctionBegin;
414260e0710aSBarry Smith   if (A->cmap->n != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"A->cmap->n %D != B->rmap->n %D\n",A->cmap->n,B->rmap->n);
41434222ddf1SHong Zhang   ierr = MatSetSizes(C,m,n,m,n);CHKERRQ(ierr);
41444222ddf1SHong Zhang   ierr = MatSetBlockSizesFromMats(C,A,B);CHKERRQ(ierr);
414586214ceeSStefano Zampini   ierr = PetscObjectTypeCompareAny((PetscObject)C,&cisdense,MATSEQDENSE,MATSEQDENSECUDA,"");CHKERRQ(ierr);
414686214ceeSStefano Zampini   if (!cisdense) {
414786214ceeSStefano Zampini     ierr = MatSetType(C,MATDENSE);CHKERRQ(ierr);
414886214ceeSStefano Zampini   }
414986214ceeSStefano Zampini   ierr = MatSetUp(C);CHKERRQ(ierr);
4150d73949e8SHong Zhang 
41514222ddf1SHong Zhang   C->ops->matmultnumeric = MatMatMultNumeric_SeqDense_SeqAIJ;
4152170fe5c8SBarry Smith   PetscFunctionReturn(0);
4153170fe5c8SBarry Smith }
4154170fe5c8SBarry Smith 
4155170fe5c8SBarry Smith /* ----------------------------------------------------------------*/
41560bad9183SKris Buschelman /*MC
4157fafad747SKris Buschelman    MATSEQAIJ - MATSEQAIJ = "seqaij" - A matrix type to be used for sequential sparse matrices,
41580bad9183SKris Buschelman    based on compressed sparse row format.
41590bad9183SKris Buschelman 
41600bad9183SKris Buschelman    Options Database Keys:
41610bad9183SKris Buschelman . -mat_type seqaij - sets the matrix type to "seqaij" during a call to MatSetFromOptions()
41620bad9183SKris Buschelman 
41630bad9183SKris Buschelman    Level: beginner
41640bad9183SKris Buschelman 
41650cd7f59aSBarry Smith    Notes:
41660cd7f59aSBarry Smith     MatSetValues() may be called for this matrix type with a NULL argument for the numerical values,
41670cd7f59aSBarry Smith     in this case the values associated with the rows and columns one passes in are set to zero
41680cd7f59aSBarry Smith     in the matrix
41690cd7f59aSBarry Smith 
41700cd7f59aSBarry Smith     MatSetOption(mat,MAT_STRUCTURE_ONLY,PETSC_TRUE) may be called for this matrix type. In this case no
41710cd7f59aSBarry Smith     space is allocated for the nonzero entries and any entries passed with MatSetValues() are ignored
41720cd7f59aSBarry Smith 
41730cd7f59aSBarry Smith   Developer Notes:
41740cd7f59aSBarry Smith     It would be nice if all matrix formats supported passing NULL in for the numerical values
41750cd7f59aSBarry Smith 
4176f587520bSBarry Smith .seealso: MatCreateSeqAIJ(), MatSetFromOptions(), MatSetType(), MatCreate(), MatType
41770bad9183SKris Buschelman M*/
41780bad9183SKris Buschelman 
4179ccd284c7SBarry Smith /*MC
4180ccd284c7SBarry Smith    MATAIJ - MATAIJ = "aij" - A matrix type to be used for sparse matrices.
4181ccd284c7SBarry Smith 
4182ccd284c7SBarry Smith    This matrix type is identical to MATSEQAIJ when constructed with a single process communicator,
4183ccd284c7SBarry Smith    and MATMPIAIJ otherwise.  As a result, for single process communicators,
41840cd7f59aSBarry Smith   MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported
4185ccd284c7SBarry Smith   for communicators controlling multiple processes.  It is recommended that you call both of
4186ccd284c7SBarry Smith   the above preallocation routines for simplicity.
4187ccd284c7SBarry Smith 
4188ccd284c7SBarry Smith    Options Database Keys:
4189ccd284c7SBarry Smith . -mat_type aij - sets the matrix type to "aij" during a call to MatSetFromOptions()
4190ccd284c7SBarry Smith 
419195452b02SPatrick Sanan   Developer Notes:
4192ca9cdca7SRichard Tran Mills     Subclasses include MATAIJCUSPARSE, MATAIJPERM, MATAIJSELL, MATAIJMKL, MATAIJCRL, and also automatically switches over to use inodes when
4193ccd284c7SBarry Smith    enough exist.
4194ccd284c7SBarry Smith 
4195ccd284c7SBarry Smith   Level: beginner
4196ccd284c7SBarry Smith 
4197ccd284c7SBarry Smith .seealso: MatCreateAIJ(), MatCreateSeqAIJ(), MATSEQAIJ,MATMPIAIJ
4198ccd284c7SBarry Smith M*/
4199ccd284c7SBarry Smith 
/*MC
   MATAIJCRL - MATAIJCRL = "aijcrl" - A matrix type to be used for sparse matrices.

   This matrix type is identical to MATSEQAIJCRL when constructed with a single process communicator,
   and MATMPIAIJCRL otherwise.  As a result, for single process communicators,
   MatSeqAIJSetPreallocation() is supported, and similarly MatMPIAIJSetPreallocation() is supported
   for communicators controlling multiple processes.  It is recommended that you call both of
   the above preallocation routines for simplicity.

   Options Database Keys:
. -mat_type aijcrl - sets the matrix type to "aijcrl" during a call to MatSetFromOptions()

   Level: beginner

.seealso: MatCreateMPIAIJCRL(), MATSEQAIJCRL, MATMPIAIJCRL
M*/
4215ccd284c7SBarry Smith M*/
4216ccd284c7SBarry Smith 
42177906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCRL(Mat,MatType,MatReuse,Mat*);
42187906f579SHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
42197906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_Elemental(Mat,MatType,MatReuse,Mat*);
42207906f579SHong Zhang #endif
42217906f579SHong Zhang #if defined(PETSC_HAVE_HYPRE)
42227906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_AIJ_HYPRE(Mat A,MatType,MatReuse,Mat*);
42237906f579SHong Zhang #endif
42247906f579SHong Zhang PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqDense(Mat,MatType,MatReuse,Mat*);
42257906f579SHong Zhang 
4226d4002b98SHong Zhang PETSC_EXTERN PetscErrorCode MatConvert_SeqAIJ_SeqSELL(Mat,MatType,MatReuse,Mat*);
4227c9225affSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_XAIJ_IS(Mat,MatType,MatReuse,Mat*);
42284222ddf1SHong Zhang PETSC_INTERN PetscErrorCode MatProductSetFromOptions_IS_XAIJ(Mat);
42297906f579SHong Zhang 
42308c778c55SBarry Smith /*@C
42318f1ea47aSStefano Zampini    MatSeqAIJGetArray - gives read/write access to the array where the data for a MATSEQAIJ matrix is stored
42328c778c55SBarry Smith 
42338c778c55SBarry Smith    Not Collective
42348c778c55SBarry Smith 
42358c778c55SBarry Smith    Input Parameter:
4236579dbff0SBarry Smith .  mat - a MATSEQAIJ matrix
42378c778c55SBarry Smith 
42388c778c55SBarry Smith    Output Parameter:
42398c778c55SBarry Smith .   array - pointer to the data
42408c778c55SBarry Smith 
42418c778c55SBarry Smith    Level: intermediate
42428c778c55SBarry Smith 
4243774cf152SJed Brown .seealso: MatSeqAIJRestoreArray(), MatSeqAIJGetArrayF90()
42448c778c55SBarry Smith @*/
42458c778c55SBarry Smith PetscErrorCode  MatSeqAIJGetArray(Mat A,PetscScalar **array)
42468c778c55SBarry Smith {
42478c778c55SBarry Smith   PetscErrorCode ierr;
42488c778c55SBarry Smith 
42498c778c55SBarry Smith   PetscFunctionBegin;
42508c778c55SBarry Smith   ierr = PetscUseMethod(A,"MatSeqAIJGetArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr);
42518c778c55SBarry Smith   PetscFunctionReturn(0);
42528c778c55SBarry Smith }
42538c778c55SBarry Smith 
425421e72a00SBarry Smith /*@C
42558f1ea47aSStefano Zampini    MatSeqAIJGetArrayRead - gives read-only access to the array where the data for a MATSEQAIJ matrix is stored
42568f1ea47aSStefano Zampini 
42578f1ea47aSStefano Zampini    Not Collective
42588f1ea47aSStefano Zampini 
42598f1ea47aSStefano Zampini    Input Parameter:
42608f1ea47aSStefano Zampini .  mat - a MATSEQAIJ matrix
42618f1ea47aSStefano Zampini 
42628f1ea47aSStefano Zampini    Output Parameter:
42638f1ea47aSStefano Zampini .   array - pointer to the data
42648f1ea47aSStefano Zampini 
42658f1ea47aSStefano Zampini    Level: intermediate
42668f1ea47aSStefano Zampini 
42678f1ea47aSStefano Zampini .seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayRead()
42688f1ea47aSStefano Zampini @*/
42698f1ea47aSStefano Zampini PetscErrorCode  MatSeqAIJGetArrayRead(Mat A,const PetscScalar **array)
42708f1ea47aSStefano Zampini {
42718f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL)
4272c70f7ee4SJunchao Zhang   PetscOffloadMask oval;
42738f1ea47aSStefano Zampini #endif
42748f1ea47aSStefano Zampini   PetscErrorCode ierr;
42758f1ea47aSStefano Zampini 
42768f1ea47aSStefano Zampini   PetscFunctionBegin;
42778f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL)
4278c70f7ee4SJunchao Zhang   oval = A->offloadmask;
42798f1ea47aSStefano Zampini #endif
42808f1ea47aSStefano Zampini   ierr = MatSeqAIJGetArray(A,(PetscScalar**)array);CHKERRQ(ierr);
42818f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL)
4282c70f7ee4SJunchao Zhang   if (oval == PETSC_OFFLOAD_GPU || oval == PETSC_OFFLOAD_BOTH) A->offloadmask = PETSC_OFFLOAD_BOTH;
42838f1ea47aSStefano Zampini #endif
42848f1ea47aSStefano Zampini   PetscFunctionReturn(0);
42858f1ea47aSStefano Zampini }
42868f1ea47aSStefano Zampini 
42878f1ea47aSStefano Zampini /*@C
42888f1ea47aSStefano Zampini    MatSeqAIJRestoreArrayRead - restore the read-only access array obtained from MatSeqAIJGetArrayRead
42898f1ea47aSStefano Zampini 
42908f1ea47aSStefano Zampini    Not Collective
42918f1ea47aSStefano Zampini 
42928f1ea47aSStefano Zampini    Input Parameter:
42938f1ea47aSStefano Zampini .  mat - a MATSEQAIJ matrix
42948f1ea47aSStefano Zampini 
42958f1ea47aSStefano Zampini    Output Parameter:
42968f1ea47aSStefano Zampini .   array - pointer to the data
42978f1ea47aSStefano Zampini 
42988f1ea47aSStefano Zampini    Level: intermediate
42998f1ea47aSStefano Zampini 
43008f1ea47aSStefano Zampini .seealso: MatSeqAIJGetArray(), MatSeqAIJGetArrayRead()
43018f1ea47aSStefano Zampini @*/
43028f1ea47aSStefano Zampini PetscErrorCode  MatSeqAIJRestoreArrayRead(Mat A,const PetscScalar **array)
43038f1ea47aSStefano Zampini {
43048f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL)
4305c70f7ee4SJunchao Zhang   PetscOffloadMask oval;
43068f1ea47aSStefano Zampini #endif
43078f1ea47aSStefano Zampini   PetscErrorCode ierr;
43088f1ea47aSStefano Zampini 
43098f1ea47aSStefano Zampini   PetscFunctionBegin;
43108f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL)
4311c70f7ee4SJunchao Zhang   oval = A->offloadmask;
43128f1ea47aSStefano Zampini #endif
43138f1ea47aSStefano Zampini   ierr = MatSeqAIJRestoreArray(A,(PetscScalar**)array);CHKERRQ(ierr);
43148f1ea47aSStefano Zampini #if defined(PETSC_HAVE_CUDA) || defined(PETSC_HAVE_VIENNACL)
4315c70f7ee4SJunchao Zhang   A->offloadmask = oval;
43168f1ea47aSStefano Zampini #endif
43178f1ea47aSStefano Zampini   PetscFunctionReturn(0);
43188f1ea47aSStefano Zampini }
43198f1ea47aSStefano Zampini 
43208f1ea47aSStefano Zampini /*@C
432121e72a00SBarry Smith    MatSeqAIJGetMaxRowNonzeros - returns the maximum number of nonzeros in any row
432221e72a00SBarry Smith 
432321e72a00SBarry Smith    Not Collective
432421e72a00SBarry Smith 
432521e72a00SBarry Smith    Input Parameter:
4326579dbff0SBarry Smith .  mat - a MATSEQAIJ matrix
432721e72a00SBarry Smith 
432821e72a00SBarry Smith    Output Parameter:
432921e72a00SBarry Smith .   nz - the maximum number of nonzeros in any row
433021e72a00SBarry Smith 
433121e72a00SBarry Smith    Level: intermediate
433221e72a00SBarry Smith 
433321e72a00SBarry Smith .seealso: MatSeqAIJRestoreArray(), MatSeqAIJGetArrayF90()
433421e72a00SBarry Smith @*/
433521e72a00SBarry Smith PetscErrorCode  MatSeqAIJGetMaxRowNonzeros(Mat A,PetscInt *nz)
433621e72a00SBarry Smith {
433721e72a00SBarry Smith   Mat_SeqAIJ     *aij = (Mat_SeqAIJ*)A->data;
433821e72a00SBarry Smith 
433921e72a00SBarry Smith   PetscFunctionBegin;
434021e72a00SBarry Smith   *nz = aij->rmax;
434121e72a00SBarry Smith   PetscFunctionReturn(0);
434221e72a00SBarry Smith }
434321e72a00SBarry Smith 
43448c778c55SBarry Smith /*@C
4345579dbff0SBarry Smith    MatSeqAIJRestoreArray - returns access to the array where the data for a MATSEQAIJ matrix is stored obtained by MatSeqAIJGetArray()
43468c778c55SBarry Smith 
43478c778c55SBarry Smith    Not Collective
43488c778c55SBarry Smith 
43498c778c55SBarry Smith    Input Parameters:
4350a2b725a8SWilliam Gropp +  mat - a MATSEQAIJ matrix
4351a2b725a8SWilliam Gropp -  array - pointer to the data
43528c778c55SBarry Smith 
43538c778c55SBarry Smith    Level: intermediate
43548c778c55SBarry Smith 
4355774cf152SJed Brown .seealso: MatSeqAIJGetArray(), MatSeqAIJRestoreArrayF90()
43568c778c55SBarry Smith @*/
43578c778c55SBarry Smith PetscErrorCode  MatSeqAIJRestoreArray(Mat A,PetscScalar **array)
43588c778c55SBarry Smith {
43598c778c55SBarry Smith   PetscErrorCode ierr;
43608c778c55SBarry Smith 
43618c778c55SBarry Smith   PetscFunctionBegin;
43628c778c55SBarry Smith   ierr = PetscUseMethod(A,"MatSeqAIJRestoreArray_C",(Mat,PetscScalar**),(A,array));CHKERRQ(ierr);
43638c778c55SBarry Smith   PetscFunctionReturn(0);
43648c778c55SBarry Smith }
43658c778c55SBarry Smith 
436634b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
43670ce8acdeSStefano Zampini PETSC_INTERN PetscErrorCode MatConvert_SeqAIJ_SeqAIJCUSPARSE(Mat);
436802fe1965SBarry Smith #endif
436902fe1965SBarry Smith 
43708cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatCreate_SeqAIJ(Mat B)
4371273d9f13SBarry Smith {
4372273d9f13SBarry Smith   Mat_SeqAIJ     *b;
4373dfbe8321SBarry Smith   PetscErrorCode ierr;
437438baddfdSBarry Smith   PetscMPIInt    size;
4375273d9f13SBarry Smith 
4376273d9f13SBarry Smith   PetscFunctionBegin;
4377ce94432eSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)B),&size);CHKERRQ(ierr);
4378e32f2f54SBarry Smith   if (size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Comm must be of size 1");
4379273d9f13SBarry Smith 
4380b00a9115SJed Brown   ierr = PetscNewLog(B,&b);CHKERRQ(ierr);
43812205254eSKarl Rupp 
4382b0a32e0cSBarry Smith   B->data = (void*)b;
43832205254eSKarl Rupp 
4384549d3d68SSatish Balay   ierr = PetscMemcpy(B->ops,&MatOps_Values,sizeof(struct _MatOps));CHKERRQ(ierr);
4385071fcb05SBarry Smith   if (B->sortedfull) B->ops->setvalues = MatSetValues_SeqAIJ_SortedFull;
43862205254eSKarl Rupp 
4387416022c9SBarry Smith   b->row                = 0;
4388416022c9SBarry Smith   b->col                = 0;
438982bf6240SBarry Smith   b->icol               = 0;
4390b810aeb4SBarry Smith   b->reallocs           = 0;
439136db0b34SBarry Smith   b->ignorezeroentries  = PETSC_FALSE;
4392f1e2ffcdSBarry Smith   b->roworiented        = PETSC_TRUE;
4393416022c9SBarry Smith   b->nonew              = 0;
4394416022c9SBarry Smith   b->diag               = 0;
4395416022c9SBarry Smith   b->solve_work         = 0;
43962a1b7f2aSHong Zhang   B->spptr              = 0;
4397be6bf707SBarry Smith   b->saved_values       = 0;
4398d7f994e1SBarry Smith   b->idiag              = 0;
439971f1c65dSBarry Smith   b->mdiag              = 0;
440071f1c65dSBarry Smith   b->ssor_work          = 0;
440171f1c65dSBarry Smith   b->omega              = 1.0;
440271f1c65dSBarry Smith   b->fshift             = 0.0;
440371f1c65dSBarry Smith   b->idiagvalid         = PETSC_FALSE;
4404bbead8a2SBarry Smith   b->ibdiagvalid        = PETSC_FALSE;
4405a9817697SBarry Smith   b->keepnonzeropattern = PETSC_FALSE;
440617ab2063SBarry Smith 
440735d8aa7fSBarry Smith   ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr);
4408bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJGetArray_C",MatSeqAIJGetArray_SeqAIJ);CHKERRQ(ierr);
4409bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJRestoreArray_C",MatSeqAIJRestoreArray_SeqAIJ);CHKERRQ(ierr);
44108c778c55SBarry Smith 
4411b3866ffcSBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE)
4412bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEnginePut_C",MatlabEnginePut_SeqAIJ);CHKERRQ(ierr);
4413bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"PetscMatlabEngineGet_C",MatlabEngineGet_SeqAIJ);CHKERRQ(ierr);
4414b3866ffcSBarry Smith #endif
441517f1a0eaSHong Zhang 
4416bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetColumnIndices_C",MatSeqAIJSetColumnIndices_SeqAIJ);CHKERRQ(ierr);
4417bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatStoreValues_C",MatStoreValues_SeqAIJ);CHKERRQ(ierr);
4418bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatRetrieveValues_C",MatRetrieveValues_SeqAIJ);CHKERRQ(ierr);
4419bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsbaij_C",MatConvert_SeqAIJ_SeqSBAIJ);CHKERRQ(ierr);
4420bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqbaij_C",MatConvert_SeqAIJ_SeqBAIJ);CHKERRQ(ierr);
4421bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijperm_C",MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr);
44224dfdc2d9SRichard Tran Mills   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijsell_C",MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr);
44239779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
44244a2a386eSRichard Tran Mills   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijmkl_C",MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr);
4425191b95cbSRichard Tran Mills #endif
442634b5b067SBarry Smith #if defined(PETSC_HAVE_CUDA)
442702fe1965SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcusparse_C",MatConvert_SeqAIJ_SeqAIJCUSPARSE);CHKERRQ(ierr);
44284222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaijcusparse_seqaij_C",MatProductSetFromOptions_SeqAIJ);CHKERRQ(ierr);
442902fe1965SBarry Smith #endif
4430bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqaijcrl_C",MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr);
4431af8000cdSHong Zhang #if defined(PETSC_HAVE_ELEMENTAL)
4432af8000cdSHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_elemental_C",MatConvert_SeqAIJ_Elemental);CHKERRQ(ierr);
4433af8000cdSHong Zhang #endif
443463c07aadSStefano Zampini #if defined(PETSC_HAVE_HYPRE)
443563c07aadSStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_hypre_C",MatConvert_AIJ_HYPRE);CHKERRQ(ierr);
44364222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_transpose_seqaij_seqaij_C",MatProductSetFromOptions_Transpose_AIJ_AIJ);CHKERRQ(ierr);
443763c07aadSStefano Zampini #endif
4438b49cda9fSStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqdense_C",MatConvert_SeqAIJ_SeqDense);CHKERRQ(ierr);
4439d4002b98SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_seqsell_C",MatConvert_SeqAIJ_SeqSELL);CHKERRQ(ierr);
4440c9225affSStefano Zampini   ierr = PetscObjectComposeFunction((PetscObject)B,"MatConvert_seqaij_is_C",MatConvert_XAIJ_IS);CHKERRQ(ierr);
4441bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatIsTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr);
4442bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatIsHermitianTranspose_C",MatIsTranspose_SeqAIJ);CHKERRQ(ierr);
4443bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocation_C",MatSeqAIJSetPreallocation_SeqAIJ);CHKERRQ(ierr);
4444846b4da1SFande Kong   ierr = PetscObjectComposeFunction((PetscObject)B,"MatResetPreallocation_C",MatResetPreallocation_SeqAIJ);CHKERRQ(ierr);
4445bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatSeqAIJSetPreallocationCSR_C",MatSeqAIJSetPreallocationCSR_SeqAIJ);CHKERRQ(ierr);
4446bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatReorderForNonzeroDiagonal_C",MatReorderForNonzeroDiagonal_SeqAIJ);CHKERRQ(ierr);
44474222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_is_seqaij_C",MatProductSetFromOptions_IS_XAIJ);CHKERRQ(ierr);
44484222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqdense_seqaij_C",MatProductSetFromOptions_SeqDense_SeqAIJ);CHKERRQ(ierr);
44494222ddf1SHong Zhang   ierr = PetscObjectComposeFunction((PetscObject)B,"MatProductSetFromOptions_seqaij_seqaij_C",MatProductSetFromOptions_SeqAIJ);CHKERRQ(ierr);
44504108e4d5SBarry Smith   ierr = MatCreate_SeqAIJ_Inode(B);CHKERRQ(ierr);
445117667f90SBarry Smith   ierr = PetscObjectChangeTypeName((PetscObject)B,MATSEQAIJ);CHKERRQ(ierr);
44524099cc6bSBarry Smith   ierr = MatSeqAIJSetTypeFromOptions(B);CHKERRQ(ierr);  /* this allows changing the matrix subtype to say MATSEQAIJPERM */
44533a40ed3dSBarry Smith   PetscFunctionReturn(0);
445417ab2063SBarry Smith }
445517ab2063SBarry Smith 
4456b24902e0SBarry Smith /*
4457b24902e0SBarry Smith     Given a matrix generated with MatGetFactor() duplicates all the information in A into B
4458b24902e0SBarry Smith */
4459ace3abfcSBarry Smith PetscErrorCode MatDuplicateNoCreate_SeqAIJ(Mat C,Mat A,MatDuplicateOption cpvalues,PetscBool mallocmatspace)
446017ab2063SBarry Smith {
4461416022c9SBarry Smith   Mat_SeqAIJ     *c,*a = (Mat_SeqAIJ*)A->data;
44626849ba73SBarry Smith   PetscErrorCode ierr;
4463071fcb05SBarry Smith   PetscInt       m = A->rmap->n,i;
446417ab2063SBarry Smith 
44653a40ed3dSBarry Smith   PetscFunctionBegin;
4466273d9f13SBarry Smith   c = (Mat_SeqAIJ*)C->data;
4467273d9f13SBarry Smith 
4468d5f3da31SBarry Smith   C->factortype = A->factortype;
4469416022c9SBarry Smith   c->row        = 0;
4470416022c9SBarry Smith   c->col        = 0;
447182bf6240SBarry Smith   c->icol       = 0;
44726ad4291fSHong Zhang   c->reallocs   = 0;
447317ab2063SBarry Smith 
44746ad4291fSHong Zhang   C->assembled = PETSC_TRUE;
447517ab2063SBarry Smith 
4476aa5ea44dSBarry Smith   ierr = PetscLayoutReference(A->rmap,&C->rmap);CHKERRQ(ierr);
4477aa5ea44dSBarry Smith   ierr = PetscLayoutReference(A->cmap,&C->cmap);CHKERRQ(ierr);
4478eec197d1SBarry Smith 
4479071fcb05SBarry Smith   ierr = PetscMalloc1(m,&c->imax);CHKERRQ(ierr);
4480071fcb05SBarry Smith   ierr = PetscMemcpy(c->imax,a->imax,m*sizeof(PetscInt));CHKERRQ(ierr);
4481071fcb05SBarry Smith   ierr = PetscMalloc1(m,&c->ilen);CHKERRQ(ierr);
4482071fcb05SBarry Smith   ierr = PetscMemcpy(c->ilen,a->ilen,m*sizeof(PetscInt));CHKERRQ(ierr);
44833bb1ff40SBarry Smith   ierr = PetscLogObjectMemory((PetscObject)C, 2*m*sizeof(PetscInt));CHKERRQ(ierr);
448417ab2063SBarry Smith 
448517ab2063SBarry Smith   /* allocate the matrix space */
4486f77e22a1SHong Zhang   if (mallocmatspace) {
4487dcca6d9dSJed Brown     ierr = PetscMalloc3(a->i[m],&c->a,a->i[m],&c->j,m+1,&c->i);CHKERRQ(ierr);
44883bb1ff40SBarry Smith     ierr = PetscLogObjectMemory((PetscObject)C, a->i[m]*(sizeof(PetscScalar)+sizeof(PetscInt))+(m+1)*sizeof(PetscInt));CHKERRQ(ierr);
44892205254eSKarl Rupp 
4490f1e2ffcdSBarry Smith     c->singlemalloc = PETSC_TRUE;
44912205254eSKarl Rupp 
4492580bdb30SBarry Smith     ierr = PetscArraycpy(c->i,a->i,m+1);CHKERRQ(ierr);
449317ab2063SBarry Smith     if (m > 0) {
4494580bdb30SBarry Smith       ierr = PetscArraycpy(c->j,a->j,a->i[m]);CHKERRQ(ierr);
4495be6bf707SBarry Smith       if (cpvalues == MAT_COPY_VALUES) {
4496580bdb30SBarry Smith         ierr = PetscArraycpy(c->a,a->a,a->i[m]);CHKERRQ(ierr);
4497be6bf707SBarry Smith       } else {
4498580bdb30SBarry Smith         ierr = PetscArrayzero(c->a,a->i[m]);CHKERRQ(ierr);
449917ab2063SBarry Smith       }
450008480c60SBarry Smith     }
4501f77e22a1SHong Zhang   }
450217ab2063SBarry Smith 
45036ad4291fSHong Zhang   c->ignorezeroentries = a->ignorezeroentries;
4504416022c9SBarry Smith   c->roworiented       = a->roworiented;
4505416022c9SBarry Smith   c->nonew             = a->nonew;
4506416022c9SBarry Smith   if (a->diag) {
4507854ce69bSBarry Smith     ierr = PetscMalloc1(m+1,&c->diag);CHKERRQ(ierr);
4508071fcb05SBarry Smith     ierr = PetscMemcpy(c->diag,a->diag,m*sizeof(PetscInt));CHKERRQ(ierr);
45093bb1ff40SBarry Smith     ierr = PetscLogObjectMemory((PetscObject)C,(m+1)*sizeof(PetscInt));CHKERRQ(ierr);
4510071fcb05SBarry Smith   } else c->diag = NULL;
45112205254eSKarl Rupp 
45126ad4291fSHong Zhang   c->solve_work         = 0;
45136ad4291fSHong Zhang   c->saved_values       = 0;
45146ad4291fSHong Zhang   c->idiag              = 0;
451571f1c65dSBarry Smith   c->ssor_work          = 0;
4516a9817697SBarry Smith   c->keepnonzeropattern = a->keepnonzeropattern;
4517e6b907acSBarry Smith   c->free_a             = PETSC_TRUE;
4518e6b907acSBarry Smith   c->free_ij            = PETSC_TRUE;
45196ad4291fSHong Zhang 
4520893ad86cSHong Zhang   c->rmax         = a->rmax;
4521416022c9SBarry Smith   c->nz           = a->nz;
45228ed568f8SMatthew G Knepley   c->maxnz        = a->nz;       /* Since we allocate exactly the right amount */
4523273d9f13SBarry Smith   C->preallocated = PETSC_TRUE;
4524754ec7b1SSatish Balay 
45256ad4291fSHong Zhang   c->compressedrow.use   = a->compressedrow.use;
45266ad4291fSHong Zhang   c->compressedrow.nrows = a->compressedrow.nrows;
4527cd6b891eSBarry Smith   if (a->compressedrow.use) {
45286ad4291fSHong Zhang     i    = a->compressedrow.nrows;
4529dcca6d9dSJed Brown     ierr = PetscMalloc2(i+1,&c->compressedrow.i,i,&c->compressedrow.rindex);CHKERRQ(ierr);
4530580bdb30SBarry Smith     ierr = PetscArraycpy(c->compressedrow.i,a->compressedrow.i,i+1);CHKERRQ(ierr);
4531580bdb30SBarry Smith     ierr = PetscArraycpy(c->compressedrow.rindex,a->compressedrow.rindex,i);CHKERRQ(ierr);
453227ea64f8SHong Zhang   } else {
453327ea64f8SHong Zhang     c->compressedrow.use    = PETSC_FALSE;
45340298fd71SBarry Smith     c->compressedrow.i      = NULL;
45350298fd71SBarry Smith     c->compressedrow.rindex = NULL;
45366ad4291fSHong Zhang   }
4537ea632784SBarry Smith   c->nonzerorowcnt = a->nonzerorowcnt;
4538e56f5c9eSBarry Smith   C->nonzerostate  = A->nonzerostate;
45394846f1f5SKris Buschelman 
45402205254eSKarl Rupp   ierr = MatDuplicate_SeqAIJ_Inode(A,cpvalues,&C);CHKERRQ(ierr);
4541140e18c1SBarry Smith   ierr = PetscFunctionListDuplicate(((PetscObject)A)->qlist,&((PetscObject)C)->qlist);CHKERRQ(ierr);
45423a40ed3dSBarry Smith   PetscFunctionReturn(0);
454317ab2063SBarry Smith }
454417ab2063SBarry Smith 
4545b24902e0SBarry Smith PetscErrorCode MatDuplicate_SeqAIJ(Mat A,MatDuplicateOption cpvalues,Mat *B)
4546b24902e0SBarry Smith {
4547b24902e0SBarry Smith   PetscErrorCode ierr;
4548b24902e0SBarry Smith 
4549b24902e0SBarry Smith   PetscFunctionBegin;
4550ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),B);CHKERRQ(ierr);
45514b6263acSBarry Smith   ierr = MatSetSizes(*B,A->rmap->n,A->cmap->n,A->rmap->n,A->cmap->n);CHKERRQ(ierr);
4552cfd3f464SBarry Smith   if (!(A->rmap->n % A->rmap->bs) && !(A->cmap->n % A->cmap->bs)) {
455333d57670SJed Brown     ierr = MatSetBlockSizesFromMats(*B,A,A);CHKERRQ(ierr);
4554cfd3f464SBarry Smith   }
4555a54f2f98SBarry Smith   ierr = MatSetType(*B,((PetscObject)A)->type_name);CHKERRQ(ierr);
4556f77e22a1SHong Zhang   ierr = MatDuplicateNoCreate_SeqAIJ(*B,A,cpvalues,PETSC_TRUE);CHKERRQ(ierr);
4557b24902e0SBarry Smith   PetscFunctionReturn(0);
4558b24902e0SBarry Smith }
4559b24902e0SBarry Smith 
4560112444f4SShri Abhyankar PetscErrorCode MatLoad_SeqAIJ(Mat newMat, PetscViewer viewer)
4561fbdbba38SShri Abhyankar {
456252f91c60SVaclav Hapla   PetscBool      isbinary, ishdf5;
456352f91c60SVaclav Hapla   PetscErrorCode ierr;
456452f91c60SVaclav Hapla 
456552f91c60SVaclav Hapla   PetscFunctionBegin;
456652f91c60SVaclav Hapla   PetscValidHeaderSpecific(newMat,MAT_CLASSID,1);
456752f91c60SVaclav Hapla   PetscValidHeaderSpecific(viewer,PETSC_VIEWER_CLASSID,2);
4568c27b3999SVaclav Hapla   /* force binary viewer to load .info file if it has not yet done so */
4569c27b3999SVaclav Hapla   ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr);
457052f91c60SVaclav Hapla   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr);
457152f91c60SVaclav Hapla   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERHDF5,  &ishdf5);CHKERRQ(ierr);
457252f91c60SVaclav Hapla   if (isbinary) {
457352f91c60SVaclav Hapla     ierr = MatLoad_SeqAIJ_Binary(newMat,viewer);CHKERRQ(ierr);
457452f91c60SVaclav Hapla   } else if (ishdf5) {
457552f91c60SVaclav Hapla #if defined(PETSC_HAVE_HDF5)
457652f91c60SVaclav Hapla     ierr = MatLoad_AIJ_HDF5(newMat,viewer);CHKERRQ(ierr);
457752f91c60SVaclav Hapla #else
457852f91c60SVaclav Hapla     SETERRQ(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"HDF5 not supported in this build.\nPlease reconfigure using --download-hdf5");
457952f91c60SVaclav Hapla #endif
458052f91c60SVaclav Hapla   } else {
458152f91c60SVaclav Hapla     SETERRQ2(PetscObjectComm((PetscObject)newMat),PETSC_ERR_SUP,"Viewer type %s not yet supported for reading %s matrices",((PetscObject)viewer)->type_name,((PetscObject)newMat)->type_name);
458252f91c60SVaclav Hapla   }
458352f91c60SVaclav Hapla   PetscFunctionReturn(0);
458452f91c60SVaclav Hapla }
458552f91c60SVaclav Hapla 
45863ea6fe3dSLisandro Dalcin PetscErrorCode MatLoad_SeqAIJ_Binary(Mat mat, PetscViewer viewer)
458752f91c60SVaclav Hapla {
45883ea6fe3dSLisandro Dalcin   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)mat->data;
4589fbdbba38SShri Abhyankar   PetscErrorCode ierr;
45903ea6fe3dSLisandro Dalcin   PetscInt       header[4],*rowlens,M,N,nz,sum,rows,cols,i;
4591fbdbba38SShri Abhyankar 
4592fbdbba38SShri Abhyankar   PetscFunctionBegin;
45933ea6fe3dSLisandro Dalcin   ierr = PetscViewerSetUp(viewer);CHKERRQ(ierr);
4594bbead8a2SBarry Smith 
45953ea6fe3dSLisandro Dalcin   /* read in matrix header */
45963ea6fe3dSLisandro Dalcin   ierr = PetscViewerBinaryRead(viewer,header,4,NULL,PETSC_INT);CHKERRQ(ierr);
45973ea6fe3dSLisandro Dalcin   if (header[0] != MAT_FILE_CLASSID) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Not a matrix object in file");
4598fbdbba38SShri Abhyankar   M = header[1]; N = header[2]; nz = header[3];
45993ea6fe3dSLisandro Dalcin   if (M < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix row size (%D) in file is negative",M);
46003ea6fe3dSLisandro Dalcin   if (N < 0) SETERRQ1(PetscObjectComm((PetscObject)viewer),PETSC_ERR_FILE_UNEXPECTED,"Matrix column size (%D) in file is negative",N);
4601bbead8a2SBarry Smith   if (nz < 0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Matrix stored in special format on disk, cannot load as SeqAIJ");
4602fbdbba38SShri Abhyankar 
46033ea6fe3dSLisandro Dalcin   /* set block sizes from the viewer's .info file */
46043ea6fe3dSLisandro Dalcin   ierr = MatLoad_Binary_BlockSizes(mat,viewer);CHKERRQ(ierr);
46053ea6fe3dSLisandro Dalcin   /* set local and global sizes if not set already */
46063ea6fe3dSLisandro Dalcin   if (mat->rmap->n < 0) mat->rmap->n = M;
46073ea6fe3dSLisandro Dalcin   if (mat->cmap->n < 0) mat->cmap->n = N;
46083ea6fe3dSLisandro Dalcin   if (mat->rmap->N < 0) mat->rmap->N = M;
46093ea6fe3dSLisandro Dalcin   if (mat->cmap->N < 0) mat->cmap->N = N;
46103ea6fe3dSLisandro Dalcin   ierr = PetscLayoutSetUp(mat->rmap);CHKERRQ(ierr);
46113ea6fe3dSLisandro Dalcin   ierr = PetscLayoutSetUp(mat->cmap);CHKERRQ(ierr);
46123ea6fe3dSLisandro Dalcin 
46133ea6fe3dSLisandro Dalcin   /* check if the matrix sizes are correct */
46143ea6fe3dSLisandro Dalcin   ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr);
46153ea6fe3dSLisandro Dalcin   if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different sizes (%D, %D) than the input matrix (%D, %D)",M,N,rows,cols);
46163ea6fe3dSLisandro Dalcin 
4617fbdbba38SShri Abhyankar   /* read in row lengths */
46183ea6fe3dSLisandro Dalcin   ierr = PetscMalloc1(M,&rowlens);CHKERRQ(ierr);
46193ea6fe3dSLisandro Dalcin   ierr = PetscViewerBinaryRead(viewer,rowlens,M,NULL,PETSC_INT);CHKERRQ(ierr);
46203ea6fe3dSLisandro Dalcin   /* check if sum(rowlens) is same as nz */
46213ea6fe3dSLisandro Dalcin   sum = 0; for (i=0; i<M; i++) sum += rowlens[i];
46223ea6fe3dSLisandro Dalcin   if (sum != nz) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED,"Inconsistent matrix data in file: nonzeros = %D, sum-row-lengths = %D\n",nz,sum);
46233ea6fe3dSLisandro Dalcin   /* preallocate and check sizes */
46243ea6fe3dSLisandro Dalcin   ierr = MatSeqAIJSetPreallocation_SeqAIJ(mat,0,rowlens);CHKERRQ(ierr);
46253ea6fe3dSLisandro Dalcin   ierr = MatGetSize(mat,&rows,&cols);CHKERRQ(ierr);
462660e0710aSBarry Smith   if (M != rows || N != cols) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_FILE_UNEXPECTED, "Matrix in file of different length (%D, %D) than the input matrix (%D, %D)",M,N,rows,cols);
46273ea6fe3dSLisandro Dalcin   /* store row lengths */
46283ea6fe3dSLisandro Dalcin   ierr = PetscArraycpy(a->ilen,rowlens,M);CHKERRQ(ierr);
46293ea6fe3dSLisandro Dalcin   ierr = PetscFree(rowlens);CHKERRQ(ierr);
4630fbdbba38SShri Abhyankar 
46313ea6fe3dSLisandro Dalcin   /* fill in "i" row pointers */
46323ea6fe3dSLisandro Dalcin   a->i[0] = 0; for (i=0; i<M; i++) a->i[i+1] = a->i[i] + a->ilen[i];
46333ea6fe3dSLisandro Dalcin   /* read in "j" column indices */
46343ea6fe3dSLisandro Dalcin   ierr = PetscViewerBinaryRead(viewer,a->j,nz,NULL,PETSC_INT);CHKERRQ(ierr);
46353ea6fe3dSLisandro Dalcin   /* read in "a" nonzero values */
46363ea6fe3dSLisandro Dalcin   ierr = PetscViewerBinaryRead(viewer,a->a,nz,NULL,PETSC_SCALAR);CHKERRQ(ierr);
4637fbdbba38SShri Abhyankar 
46383ea6fe3dSLisandro Dalcin   ierr = MatAssemblyBegin(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
46393ea6fe3dSLisandro Dalcin   ierr = MatAssemblyEnd(mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4640fbdbba38SShri Abhyankar   PetscFunctionReturn(0);
4641fbdbba38SShri Abhyankar }
4642fbdbba38SShri Abhyankar 
4643ace3abfcSBarry Smith PetscErrorCode MatEqual_SeqAIJ(Mat A,Mat B,PetscBool * flg)
46447264ac53SSatish Balay {
46457264ac53SSatish Balay   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data,*b = (Mat_SeqAIJ*)B->data;
4646dfbe8321SBarry Smith   PetscErrorCode ierr;
4647eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
4648eeffb40dSHong Zhang   PetscInt k;
4649eeffb40dSHong Zhang #endif
46507264ac53SSatish Balay 
46513a40ed3dSBarry Smith   PetscFunctionBegin;
4652bfeeae90SHong Zhang   /* If the  matrix dimensions are not equal,or no of nonzeros */
4653d0f46423SBarry Smith   if ((A->rmap->n != B->rmap->n) || (A->cmap->n != B->cmap->n) ||(a->nz != b->nz)) {
4654ca44d042SBarry Smith     *flg = PETSC_FALSE;
4655ca44d042SBarry Smith     PetscFunctionReturn(0);
4656bcd2baecSBarry Smith   }
46577264ac53SSatish Balay 
46587264ac53SSatish Balay   /* if the a->i are the same */
4659580bdb30SBarry Smith   ierr = PetscArraycmp(a->i,b->i,A->rmap->n+1,flg);CHKERRQ(ierr);
4660abc0a331SBarry Smith   if (!*flg) PetscFunctionReturn(0);
46617264ac53SSatish Balay 
46627264ac53SSatish Balay   /* if a->j are the same */
4663580bdb30SBarry Smith   ierr = PetscArraycmp(a->j,b->j,a->nz,flg);CHKERRQ(ierr);
4664abc0a331SBarry Smith   if (!*flg) PetscFunctionReturn(0);
4665bcd2baecSBarry Smith 
4666bcd2baecSBarry Smith   /* if a->a are the same */
4667eeffb40dSHong Zhang #if defined(PETSC_USE_COMPLEX)
4668eeffb40dSHong Zhang   for (k=0; k<a->nz; k++) {
4669eeffb40dSHong Zhang     if (PetscRealPart(a->a[k]) != PetscRealPart(b->a[k]) || PetscImaginaryPart(a->a[k]) != PetscImaginaryPart(b->a[k])) {
4670eeffb40dSHong Zhang       *flg = PETSC_FALSE;
46713a40ed3dSBarry Smith       PetscFunctionReturn(0);
4672eeffb40dSHong Zhang     }
4673eeffb40dSHong Zhang   }
4674eeffb40dSHong Zhang #else
4675580bdb30SBarry Smith   ierr = PetscArraycmp(a->a,b->a,a->nz,flg);CHKERRQ(ierr);
4676eeffb40dSHong Zhang #endif
4677eeffb40dSHong Zhang   PetscFunctionReturn(0);
46787264ac53SSatish Balay }
467936db0b34SBarry Smith 
/*@
     MatCreateSeqAIJWithArrays - Creates a sequential AIJ matrix using matrix elements (in CSR format)
              provided by the user.

      Collective

   Input Parameters:
+   comm - must be an MPI communicator of size 1
.   m - number of rows
.   n - number of columns
.   i - row indices; that is i[0] = 0, i[row] = i[row-1] + number of elements in that row of the matrix
.   j - column indices
-   a - matrix values

   Output Parameter:
.   mat - the matrix

   Level: intermediate

   Notes:
       The i, j, and a arrays are not copied by this routine; the user must free these arrays
    once the matrix is destroyed and not before.

       You cannot set new nonzero locations into this matrix; that will generate an error.

       The i and j indices are 0 based.

       The format which is used for the sparse matrix input is equivalent to a
    row-major ordering, i.e., for the following matrix, the input data expected is
    as shown

$        1 0 0
$        2 0 3
$        4 5 6
$
$        i =  {0,1,3,6}  [size = nrow+1  = 3+1]
$        j =  {0,0,2,0,1,2}  [size = 6]; values must be sorted for each row
$        a =  {1,2,3,4,5,6}  [size = 6]


.seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateMPIAIJWithArrays(), MatMPIAIJSetPreallocationCSR()

@*/
4723c3c607ccSBarry Smith PetscErrorCode  MatCreateSeqAIJWithArrays(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat)
472436db0b34SBarry Smith {
4725dfbe8321SBarry Smith   PetscErrorCode ierr;
4726cbcfb4deSHong Zhang   PetscInt       ii;
472736db0b34SBarry Smith   Mat_SeqAIJ     *aij;
4728cbcfb4deSHong Zhang   PetscInt jj;
472936db0b34SBarry Smith 
473036db0b34SBarry Smith   PetscFunctionBegin;
473141096f02SStefano Zampini   if (m > 0 && i[0]) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"i (row indices) must start with 0");
4732f69a0ea3SMatthew Knepley   ierr = MatCreate(comm,mat);CHKERRQ(ierr);
4733f69a0ea3SMatthew Knepley   ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr);
4734a2f3521dSMark F. Adams   /* ierr = MatSetBlockSizes(*mat,,);CHKERRQ(ierr); */
4735ab93d7beSBarry Smith   ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr);
4736ab93d7beSBarry Smith   ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,MAT_SKIP_ALLOCATION,0);CHKERRQ(ierr);
4737ab93d7beSBarry Smith   aij  = (Mat_SeqAIJ*)(*mat)->data;
4738071fcb05SBarry Smith   ierr = PetscMalloc1(m,&aij->imax);CHKERRQ(ierr);
4739071fcb05SBarry Smith   ierr = PetscMalloc1(m,&aij->ilen);CHKERRQ(ierr);
4740ab93d7beSBarry Smith 
474136db0b34SBarry Smith   aij->i            = i;
474236db0b34SBarry Smith   aij->j            = j;
474336db0b34SBarry Smith   aij->a            = a;
474436db0b34SBarry Smith   aij->singlemalloc = PETSC_FALSE;
474536db0b34SBarry Smith   aij->nonew        = -1;             /*this indicates that inserting a new value in the matrix that generates a new nonzero is an error*/
4746e6b907acSBarry Smith   aij->free_a       = PETSC_FALSE;
4747e6b907acSBarry Smith   aij->free_ij      = PETSC_FALSE;
474836db0b34SBarry Smith 
474936db0b34SBarry Smith   for (ii=0; ii<m; ii++) {
475036db0b34SBarry Smith     aij->ilen[ii] = aij->imax[ii] = i[ii+1] - i[ii];
475176bd3646SJed Brown     if (PetscDefined(USE_DEBUG)) {
475260e0710aSBarry Smith       if (i[ii+1] - i[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative row length in i (row indices) row = %D length = %D",ii,i[ii+1] - i[ii]);
47539985e31cSBarry Smith       for (jj=i[ii]+1; jj<i[ii+1]; jj++) {
4754a061629eSStefano Zampini         if (j[jj] < j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is not sorted",jj-i[ii],j[jj],ii);
4755a061629eSStefano Zampini         if (j[jj] == j[jj-1]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column entry number %D (actual column %D) in row %D is identical to previous entry",jj-i[ii],j[jj],ii);
47569985e31cSBarry Smith       }
475736db0b34SBarry Smith     }
475876bd3646SJed Brown   }
475976bd3646SJed Brown   if (PetscDefined(USE_DEBUG)) {
476036db0b34SBarry Smith     for (ii=0; ii<aij->i[m]; ii++) {
476160e0710aSBarry Smith       if (j[ii] < 0) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Negative column index at location = %D index = %D",ii,j[ii]);
476260e0710aSBarry Smith       if (j[ii] > n - 1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Column index to large at location = %D index = %D",ii,j[ii]);
476336db0b34SBarry Smith     }
476476bd3646SJed Brown   }
476536db0b34SBarry Smith 
4766b65db4caSBarry Smith   ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4767b65db4caSBarry Smith   ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
476836db0b34SBarry Smith   PetscFunctionReturn(0);
476936db0b34SBarry Smith }
477080ef6e79SMatthew G Knepley /*@C
4771d021a1c5SVictor Minden      MatCreateSeqAIJFromTriple - Creates an sequential AIJ matrix using matrix elements (in COO format)
47728a0b0e6bSVictor Minden               provided by the user.
47738a0b0e6bSVictor Minden 
4774d083f849SBarry Smith       Collective
47758a0b0e6bSVictor Minden 
47768a0b0e6bSVictor Minden    Input Parameters:
47778a0b0e6bSVictor Minden +   comm - must be an MPI communicator of size 1
47788a0b0e6bSVictor Minden .   m   - number of rows
47798a0b0e6bSVictor Minden .   n   - number of columns
47808a0b0e6bSVictor Minden .   i   - row indices
47818a0b0e6bSVictor Minden .   j   - column indices
47821230e6d1SVictor Minden .   a   - matrix values
47831230e6d1SVictor Minden .   nz  - number of nonzeros
47841230e6d1SVictor Minden -   idx - 0 or 1 based
47858a0b0e6bSVictor Minden 
47868a0b0e6bSVictor Minden    Output Parameter:
47878a0b0e6bSVictor Minden .   mat - the matrix
47888a0b0e6bSVictor Minden 
47898a0b0e6bSVictor Minden    Level: intermediate
47908a0b0e6bSVictor Minden 
47918a0b0e6bSVictor Minden    Notes:
47928a0b0e6bSVictor Minden        The i and j indices are 0 based
47938a0b0e6bSVictor Minden 
47948a0b0e6bSVictor Minden        The format which is used for the sparse matrix input, is equivalent to a
47958a0b0e6bSVictor Minden     row-major ordering.. i.e for the following matrix, the input data expected is
47968a0b0e6bSVictor Minden     as shown:
47978a0b0e6bSVictor Minden 
47988a0b0e6bSVictor Minden         1 0 0
47998a0b0e6bSVictor Minden         2 0 3
48008a0b0e6bSVictor Minden         4 5 6
48018a0b0e6bSVictor Minden 
48028a0b0e6bSVictor Minden         i =  {0,1,1,2,2,2}
48038a0b0e6bSVictor Minden         j =  {0,0,2,0,1,2}
48048a0b0e6bSVictor Minden         v =  {1,2,3,4,5,6}
48058a0b0e6bSVictor Minden 
48068a0b0e6bSVictor Minden 
480769b1f4b7SBarry Smith .seealso: MatCreate(), MatCreateAIJ(), MatCreateSeqAIJ(), MatCreateSeqAIJWithArrays(), MatMPIAIJSetPreallocationCSR()
48088a0b0e6bSVictor Minden 
48098a0b0e6bSVictor Minden @*/
4810c3c607ccSBarry Smith PetscErrorCode  MatCreateSeqAIJFromTriple(MPI_Comm comm,PetscInt m,PetscInt n,PetscInt i[],PetscInt j[],PetscScalar a[],Mat *mat,PetscInt nz,PetscBool idx)
48118a0b0e6bSVictor Minden {
48128a0b0e6bSVictor Minden   PetscErrorCode ierr;
4813d021a1c5SVictor Minden   PetscInt       ii, *nnz, one = 1,row,col;
48148a0b0e6bSVictor Minden 
48158a0b0e6bSVictor Minden 
48168a0b0e6bSVictor Minden   PetscFunctionBegin;
48171795a4d1SJed Brown   ierr = PetscCalloc1(m,&nnz);CHKERRQ(ierr);
48181230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
4819c8d679ebSHong Zhang     nnz[i[ii] - !!idx] += 1;
48201230e6d1SVictor Minden   }
48218a0b0e6bSVictor Minden   ierr = MatCreate(comm,mat);CHKERRQ(ierr);
48228a0b0e6bSVictor Minden   ierr = MatSetSizes(*mat,m,n,m,n);CHKERRQ(ierr);
48238a0b0e6bSVictor Minden   ierr = MatSetType(*mat,MATSEQAIJ);CHKERRQ(ierr);
48241230e6d1SVictor Minden   ierr = MatSeqAIJSetPreallocation_SeqAIJ(*mat,0,nnz);CHKERRQ(ierr);
48251230e6d1SVictor Minden   for (ii = 0; ii < nz; ii++) {
48261230e6d1SVictor Minden     if (idx) {
48271230e6d1SVictor Minden       row = i[ii] - 1;
48281230e6d1SVictor Minden       col = j[ii] - 1;
48291230e6d1SVictor Minden     } else {
48301230e6d1SVictor Minden       row = i[ii];
48311230e6d1SVictor Minden       col = j[ii];
48328a0b0e6bSVictor Minden     }
48331230e6d1SVictor Minden     ierr = MatSetValues(*mat,one,&row,one,&col,&a[ii],ADD_VALUES);CHKERRQ(ierr);
48348a0b0e6bSVictor Minden   }
48358a0b0e6bSVictor Minden   ierr = MatAssemblyBegin(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
48368a0b0e6bSVictor Minden   ierr = MatAssemblyEnd(*mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4837d021a1c5SVictor Minden   ierr = PetscFree(nnz);CHKERRQ(ierr);
48388a0b0e6bSVictor Minden   PetscFunctionReturn(0);
48398a0b0e6bSVictor Minden }
484036db0b34SBarry Smith 
4841acf2f550SJed Brown PetscErrorCode MatSeqAIJInvalidateDiagonal(Mat A)
4842acf2f550SJed Brown {
4843acf2f550SJed Brown   Mat_SeqAIJ     *a=(Mat_SeqAIJ*)A->data;
4844acf2f550SJed Brown   PetscErrorCode ierr;
4845acf2f550SJed Brown 
4846acf2f550SJed Brown   PetscFunctionBegin;
4847acf2f550SJed Brown   a->idiagvalid  = PETSC_FALSE;
4848acf2f550SJed Brown   a->ibdiagvalid = PETSC_FALSE;
48492205254eSKarl Rupp 
4850acf2f550SJed Brown   ierr = MatSeqAIJInvalidateDiagonal_Inode(A);CHKERRQ(ierr);
4851acf2f550SJed Brown   PetscFunctionReturn(0);
4852acf2f550SJed Brown }
4853acf2f550SJed Brown 
48549c8f2541SHong Zhang PetscErrorCode MatCreateMPIMatConcatenateSeqMat_SeqAIJ(MPI_Comm comm,Mat inmat,PetscInt n,MatReuse scall,Mat *outmat)
48559c8f2541SHong Zhang {
48569c8f2541SHong Zhang   PetscErrorCode ierr;
48578761c3d6SHong Zhang   PetscMPIInt    size;
48589c8f2541SHong Zhang 
48599c8f2541SHong Zhang   PetscFunctionBegin;
48608761c3d6SHong Zhang   ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr);
48617bbdc51dSHong Zhang   if (size == 1) {
48627bbdc51dSHong Zhang     if (scall == MAT_INITIAL_MATRIX) {
48637bbdc51dSHong Zhang       ierr = MatDuplicate(inmat,MAT_COPY_VALUES,outmat);CHKERRQ(ierr);
48647bbdc51dSHong Zhang     } else {
48658761c3d6SHong Zhang       ierr = MatCopy(inmat,*outmat,SAME_NONZERO_PATTERN);CHKERRQ(ierr);
48667bbdc51dSHong Zhang     }
48678761c3d6SHong Zhang   } else {
48689c8f2541SHong Zhang     ierr = MatCreateMPIMatConcatenateSeqMat_MPIAIJ(comm,inmat,n,scall,outmat);CHKERRQ(ierr);
48698761c3d6SHong Zhang   }
48709c8f2541SHong Zhang   PetscFunctionReturn(0);
48719c8f2541SHong Zhang }
48729c8f2541SHong Zhang 
487381824310SBarry Smith /*
487453dd7562SDmitry Karpeev  Permute A into C's *local* index space using rowemb,colemb.
487553dd7562SDmitry Karpeev  The embedding are supposed to be injections and the above implies that the range of rowemb is a subset
487653dd7562SDmitry Karpeev  of [0,m), colemb is in [0,n).
487753dd7562SDmitry Karpeev  If pattern == DIFFERENT_NONZERO_PATTERN, C is preallocated according to A.
487853dd7562SDmitry Karpeev  */
487953dd7562SDmitry Karpeev PetscErrorCode MatSetSeqMat_SeqAIJ(Mat C,IS rowemb,IS colemb,MatStructure pattern,Mat B)
488053dd7562SDmitry Karpeev {
488153dd7562SDmitry Karpeev   /* If making this function public, change the error returned in this function away from _PLIB. */
488253dd7562SDmitry Karpeev   PetscErrorCode ierr;
488353dd7562SDmitry Karpeev   Mat_SeqAIJ     *Baij;
488453dd7562SDmitry Karpeev   PetscBool      seqaij;
488553dd7562SDmitry Karpeev   PetscInt       m,n,*nz,i,j,count;
488653dd7562SDmitry Karpeev   PetscScalar    v;
488753dd7562SDmitry Karpeev   const PetscInt *rowindices,*colindices;
488853dd7562SDmitry Karpeev 
488953dd7562SDmitry Karpeev   PetscFunctionBegin;
489053dd7562SDmitry Karpeev   if (!B) PetscFunctionReturn(0);
489153dd7562SDmitry Karpeev   /* Check to make sure the target matrix (and embeddings) are compatible with C and each other. */
48924099cc6bSBarry Smith   ierr = PetscObjectBaseTypeCompare((PetscObject)B,MATSEQAIJ,&seqaij);CHKERRQ(ierr);
489353dd7562SDmitry Karpeev   if (!seqaij) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is of wrong type");
489453dd7562SDmitry Karpeev   if (rowemb) {
489553dd7562SDmitry Karpeev     ierr = ISGetLocalSize(rowemb,&m);CHKERRQ(ierr);
489653dd7562SDmitry Karpeev     if (m != B->rmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Row IS of size %D is incompatible with matrix row size %D",m,B->rmap->n);
489753dd7562SDmitry Karpeev   } else {
48986c4ed002SBarry Smith     if (C->rmap->n != B->rmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is row-incompatible with the target matrix");
489953dd7562SDmitry Karpeev   }
490053dd7562SDmitry Karpeev   if (colemb) {
490153dd7562SDmitry Karpeev     ierr = ISGetLocalSize(colemb,&n);CHKERRQ(ierr);
490253dd7562SDmitry Karpeev     if (n != B->cmap->n) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Diag col IS of size %D is incompatible with input matrix col size %D",n,B->cmap->n);
490353dd7562SDmitry Karpeev   } else {
490453dd7562SDmitry Karpeev     if (C->cmap->n != B->cmap->n) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Input matrix is col-incompatible with the target matrix");
490553dd7562SDmitry Karpeev   }
490653dd7562SDmitry Karpeev 
490753dd7562SDmitry Karpeev   Baij = (Mat_SeqAIJ*)(B->data);
490853dd7562SDmitry Karpeev   if (pattern == DIFFERENT_NONZERO_PATTERN) {
490953dd7562SDmitry Karpeev     ierr = PetscMalloc1(B->rmap->n,&nz);CHKERRQ(ierr);
491053dd7562SDmitry Karpeev     for (i=0; i<B->rmap->n; i++) {
491153dd7562SDmitry Karpeev       nz[i] = Baij->i[i+1] - Baij->i[i];
491253dd7562SDmitry Karpeev     }
491353dd7562SDmitry Karpeev     ierr = MatSeqAIJSetPreallocation(C,0,nz);CHKERRQ(ierr);
491453dd7562SDmitry Karpeev     ierr = PetscFree(nz);CHKERRQ(ierr);
491553dd7562SDmitry Karpeev   }
491653dd7562SDmitry Karpeev   if (pattern == SUBSET_NONZERO_PATTERN) {
491753dd7562SDmitry Karpeev     ierr = MatZeroEntries(C);CHKERRQ(ierr);
491853dd7562SDmitry Karpeev   }
491953dd7562SDmitry Karpeev   count = 0;
492053dd7562SDmitry Karpeev   rowindices = NULL;
492153dd7562SDmitry Karpeev   colindices = NULL;
492253dd7562SDmitry Karpeev   if (rowemb) {
492353dd7562SDmitry Karpeev     ierr = ISGetIndices(rowemb,&rowindices);CHKERRQ(ierr);
492453dd7562SDmitry Karpeev   }
492553dd7562SDmitry Karpeev   if (colemb) {
492653dd7562SDmitry Karpeev     ierr = ISGetIndices(colemb,&colindices);CHKERRQ(ierr);
492753dd7562SDmitry Karpeev   }
492853dd7562SDmitry Karpeev   for (i=0; i<B->rmap->n; i++) {
492953dd7562SDmitry Karpeev     PetscInt row;
493053dd7562SDmitry Karpeev     row = i;
493153dd7562SDmitry Karpeev     if (rowindices) row = rowindices[i];
493253dd7562SDmitry Karpeev     for (j=Baij->i[i]; j<Baij->i[i+1]; j++) {
493353dd7562SDmitry Karpeev       PetscInt col;
493453dd7562SDmitry Karpeev       col  = Baij->j[count];
493553dd7562SDmitry Karpeev       if (colindices) col = colindices[col];
493653dd7562SDmitry Karpeev       v    = Baij->a[count];
493753dd7562SDmitry Karpeev       ierr = MatSetValues(C,1,&row,1,&col,&v,INSERT_VALUES);CHKERRQ(ierr);
493853dd7562SDmitry Karpeev       ++count;
493953dd7562SDmitry Karpeev     }
494053dd7562SDmitry Karpeev   }
494153dd7562SDmitry Karpeev   /* FIXME: set C's nonzerostate correctly. */
494253dd7562SDmitry Karpeev   /* Assembly for C is necessary. */
494353dd7562SDmitry Karpeev   C->preallocated = PETSC_TRUE;
494453dd7562SDmitry Karpeev   C->assembled     = PETSC_TRUE;
494553dd7562SDmitry Karpeev   C->was_assembled = PETSC_FALSE;
494653dd7562SDmitry Karpeev   PetscFunctionReturn(0);
494753dd7562SDmitry Karpeev }
494853dd7562SDmitry Karpeev 
49494099cc6bSBarry Smith PetscFunctionList MatSeqAIJList = NULL;
49504099cc6bSBarry Smith 
49514099cc6bSBarry Smith /*@C
49524099cc6bSBarry Smith    MatSeqAIJSetType - Converts a MATSEQAIJ matrix to a subtype
49534099cc6bSBarry Smith 
49544099cc6bSBarry Smith    Collective on Mat
49554099cc6bSBarry Smith 
49564099cc6bSBarry Smith    Input Parameters:
49574099cc6bSBarry Smith +  mat      - the matrix object
49584099cc6bSBarry Smith -  matype   - matrix type
49594099cc6bSBarry Smith 
49604099cc6bSBarry Smith    Options Database Key:
49614099cc6bSBarry Smith .  -mat_seqai_type  <method> - for example seqaijcrl
49624099cc6bSBarry Smith 
49634099cc6bSBarry Smith 
49644099cc6bSBarry Smith   Level: intermediate
49654099cc6bSBarry Smith 
49664099cc6bSBarry Smith .seealso: PCSetType(), VecSetType(), MatCreate(), MatType, Mat
49674099cc6bSBarry Smith @*/
49684099cc6bSBarry Smith PetscErrorCode  MatSeqAIJSetType(Mat mat, MatType matype)
49694099cc6bSBarry Smith {
4970fd9d3c67SJed Brown   PetscErrorCode ierr,(*r)(Mat,MatType,MatReuse,Mat*);
49714099cc6bSBarry Smith   PetscBool      sametype;
49724099cc6bSBarry Smith 
49734099cc6bSBarry Smith   PetscFunctionBegin;
49744099cc6bSBarry Smith   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
49754099cc6bSBarry Smith   ierr = PetscObjectTypeCompare((PetscObject)mat,matype,&sametype);CHKERRQ(ierr);
49764099cc6bSBarry Smith   if (sametype) PetscFunctionReturn(0);
49774099cc6bSBarry Smith 
49784099cc6bSBarry Smith   ierr =  PetscFunctionListFind(MatSeqAIJList,matype,&r);CHKERRQ(ierr);
49794099cc6bSBarry Smith   if (!r) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_UNKNOWN_TYPE,"Unknown Mat type given: %s",matype);
49804099cc6bSBarry Smith   ierr = (*r)(mat,matype,MAT_INPLACE_MATRIX,&mat);CHKERRQ(ierr);
49814099cc6bSBarry Smith   PetscFunctionReturn(0);
49824099cc6bSBarry Smith }
49834099cc6bSBarry Smith 
49844099cc6bSBarry Smith 
49854099cc6bSBarry Smith /*@C
49864099cc6bSBarry Smith   MatSeqAIJRegister -  - Adds a new sub-matrix type for sequential AIJ matrices
49874099cc6bSBarry Smith 
49884099cc6bSBarry Smith    Not Collective
49894099cc6bSBarry Smith 
49904099cc6bSBarry Smith    Input Parameters:
49914099cc6bSBarry Smith +  name - name of a new user-defined matrix type, for example MATSEQAIJCRL
49924099cc6bSBarry Smith -  function - routine to convert to subtype
49934099cc6bSBarry Smith 
49944099cc6bSBarry Smith    Notes:
49954099cc6bSBarry Smith    MatSeqAIJRegister() may be called multiple times to add several user-defined solvers.
49964099cc6bSBarry Smith 
49974099cc6bSBarry Smith 
49984099cc6bSBarry Smith    Then, your matrix can be chosen with the procedural interface at runtime via the option
49994099cc6bSBarry Smith $     -mat_seqaij_type my_mat
50004099cc6bSBarry Smith 
50014099cc6bSBarry Smith    Level: advanced
50024099cc6bSBarry Smith 
50034099cc6bSBarry Smith .seealso: MatSeqAIJRegisterAll()
50044099cc6bSBarry Smith 
50054099cc6bSBarry Smith 
50064099cc6bSBarry Smith   Level: advanced
50074099cc6bSBarry Smith @*/
5008388d47a6SSatish Balay PetscErrorCode  MatSeqAIJRegister(const char sname[],PetscErrorCode (*function)(Mat,MatType,MatReuse,Mat *))
50094099cc6bSBarry Smith {
50104099cc6bSBarry Smith   PetscErrorCode ierr;
50114099cc6bSBarry Smith 
50124099cc6bSBarry Smith   PetscFunctionBegin;
50139cc31a68SJed Brown   ierr = MatInitializePackage();CHKERRQ(ierr);
50144099cc6bSBarry Smith   ierr = PetscFunctionListAdd(&MatSeqAIJList,sname,function);CHKERRQ(ierr);
50154099cc6bSBarry Smith   PetscFunctionReturn(0);
50164099cc6bSBarry Smith }
50174099cc6bSBarry Smith 
50184099cc6bSBarry Smith PetscBool MatSeqAIJRegisterAllCalled = PETSC_FALSE;
50194099cc6bSBarry Smith 
50204099cc6bSBarry Smith /*@C
50214099cc6bSBarry Smith   MatSeqAIJRegisterAll - Registers all of the matrix subtypes of SeqAIJ
50224099cc6bSBarry Smith 
50234099cc6bSBarry Smith   Not Collective
50244099cc6bSBarry Smith 
50254099cc6bSBarry Smith   Level: advanced
50264099cc6bSBarry Smith 
50274099cc6bSBarry Smith   Developers Note: CUSP and CUSPARSE do not yet support the  MatConvert_SeqAIJ..() paradigm and thus cannot be registered here
50284099cc6bSBarry Smith 
50294099cc6bSBarry Smith .seealso:  MatRegisterAll(), MatSeqAIJRegister()
50304099cc6bSBarry Smith @*/
50314099cc6bSBarry Smith PetscErrorCode  MatSeqAIJRegisterAll(void)
50324099cc6bSBarry Smith {
50334099cc6bSBarry Smith   PetscErrorCode ierr;
50344099cc6bSBarry Smith 
50354099cc6bSBarry Smith   PetscFunctionBegin;
50364099cc6bSBarry Smith   if (MatSeqAIJRegisterAllCalled) PetscFunctionReturn(0);
50374099cc6bSBarry Smith   MatSeqAIJRegisterAllCalled = PETSC_TRUE;
50384099cc6bSBarry Smith 
50394099cc6bSBarry Smith   ierr = MatSeqAIJRegister(MATSEQAIJCRL,      MatConvert_SeqAIJ_SeqAIJCRL);CHKERRQ(ierr);
50404099cc6bSBarry Smith   ierr = MatSeqAIJRegister(MATSEQAIJPERM,     MatConvert_SeqAIJ_SeqAIJPERM);CHKERRQ(ierr);
50414dfdc2d9SRichard Tran Mills   ierr = MatSeqAIJRegister(MATSEQAIJSELL,     MatConvert_SeqAIJ_SeqAIJSELL);CHKERRQ(ierr);
50429779e05dSSatish Balay #if defined(PETSC_HAVE_MKL_SPARSE)
50436b62b571SRichard Tran Mills   ierr = MatSeqAIJRegister(MATSEQAIJMKL,      MatConvert_SeqAIJ_SeqAIJMKL);CHKERRQ(ierr);
5044485f9817SRichard Tran Mills #endif
50454099cc6bSBarry Smith #if defined(PETSC_HAVE_VIENNACL) && defined(PETSC_HAVE_VIENNACL_NO_CUDA)
50464099cc6bSBarry Smith   ierr = MatSeqAIJRegister(MATMPIAIJVIENNACL, MatConvert_SeqAIJ_SeqAIJViennaCL);CHKERRQ(ierr);
50474099cc6bSBarry Smith #endif
50484099cc6bSBarry Smith   PetscFunctionReturn(0);
50494099cc6bSBarry Smith }
505053dd7562SDmitry Karpeev 
505153dd7562SDmitry Karpeev /*
505281824310SBarry Smith     Special version for direct calls from Fortran
505381824310SBarry Smith */
5054af0996ceSBarry Smith #include <petsc/private/fortranimpl.h>
505581824310SBarry Smith #if defined(PETSC_HAVE_FORTRAN_CAPS)
505681824310SBarry Smith #define matsetvaluesseqaij_ MATSETVALUESSEQAIJ
505781824310SBarry Smith #elif !defined(PETSC_HAVE_FORTRAN_UNDERSCORE)
505881824310SBarry Smith #define matsetvaluesseqaij_ matsetvaluesseqaij
505981824310SBarry Smith #endif
506081824310SBarry Smith 
506181824310SBarry Smith /* Change these macros so can be used in void function */
/*
   The routine below returns void, so the error macros are redefined to abort instead of returning
   an error code:
     - CHKERRQ() aborts on the communicator of a matrix named A, so a variable with that exact name
       must be in scope wherever CHKERRQ() is expanded from here on.
     - SETERRQ2()/SETERRQ3() keep only the communicator and the error code; the message and its
       arguments (b,c,d[,e]) are discarded.
   NOTE(review): these redefinitions remain in effect for the rest of the translation unit and
   presumably also change the behavior of any macro used below that expands to them -- confirm.
*/
506281824310SBarry Smith #undef CHKERRQ
5063ce94432eSBarry Smith #define CHKERRQ(ierr) CHKERRABORT(PetscObjectComm((PetscObject)A),ierr)
506481824310SBarry Smith #undef SETERRQ2
5065e32f2f54SBarry Smith #define SETERRQ2(comm,ierr,b,c,d) CHKERRABORT(comm,ierr)
50664994cf47SJed Brown #undef SETERRQ3
50674994cf47SJed Brown #define SETERRQ3(comm,ierr,b,c,d,e) CHKERRABORT(comm,ierr)
506881824310SBarry Smith 
/*
   matsetvaluesseqaij_ - Inserts or adds an m by n block of values into a SeqAIJ matrix; every
   scalar argument is received by address and dereferenced on entry.

   Input Parameters:
     AA   - address of the matrix
     mm   - address of the number of rows in the block
     im   - row indices; rows with a negative index are skipped
     nn   - address of the number of columns in the block
     in   - column indices; columns with a negative index are skipped
     v    - the values; entry (k,l) is read from v[l + k*n] when the matrix is row oriented and
            from v[k + l*m] otherwise
     isis - address of the insert mode; ADD_VALUES adds to an existing entry, any other mode
            overwrites it

   Output Parameter:
     _ierr - NOTE(review): never assigned in the visible body; failures abort through the macros
             redefined above instead -- confirm that callers do not rely on its value

   Within a row each column is located by bisection followed by a short linear scan. A column that
   is not yet present is inserted in sorted position, unless a->nonew forbids new nonzeros.
*/
506919caf8f3SSatish Balay PETSC_EXTERN void matsetvaluesseqaij_(Mat *AA,PetscInt *mm,const PetscInt im[],PetscInt *nn,const PetscInt in[],const PetscScalar v[],InsertMode *isis, PetscErrorCode *_ierr)
507081824310SBarry Smith {
507181824310SBarry Smith   Mat            A  = *AA;
507281824310SBarry Smith   PetscInt       m  = *mm, n = *nn;
507381824310SBarry Smith   InsertMode     is = *isis;
507481824310SBarry Smith   Mat_SeqAIJ     *a = (Mat_SeqAIJ*)A->data;
507581824310SBarry Smith   PetscInt       *rp,k,low,high,t,ii,row,nrow,i,col,l,rmax,N;
507681824310SBarry Smith   PetscInt       *imax,*ai,*ailen;
507781824310SBarry Smith   PetscErrorCode ierr;
507881824310SBarry Smith   PetscInt       *aj,nonew = a->nonew,lastcol = -1;
507954f21887SBarry Smith   MatScalar      *ap,value,*aa;
5080ace3abfcSBarry Smith   PetscBool      ignorezeroentries = a->ignorezeroentries;
5081ace3abfcSBarry Smith   PetscBool      roworiented       = a->roworiented;
508281824310SBarry Smith 
508381824310SBarry Smith   PetscFunctionBegin;
50844994cf47SJed Brown   MatCheckPreallocated(A,1);
  /* local copies of the CSR arrays; they are passed by name to MatSeqXAIJReallocateAIJ() below */
508581824310SBarry Smith   imax  = a->imax;
508681824310SBarry Smith   ai    = a->i;
508781824310SBarry Smith   ailen = a->ilen;
508881824310SBarry Smith   aj    = a->j;
508981824310SBarry Smith   aa    = a->a;
509081824310SBarry Smith 
509181824310SBarry Smith   for (k=0; k<m; k++) { /* loop over added rows */
509281824310SBarry Smith     row = im[k];
509381824310SBarry Smith     if (row < 0) continue;
5094cf9c20a2SJed Brown     if (PetscUnlikelyDebug(row >= A->rmap->n)) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Row too large");
    /* rp/ap: column indices and values of this row; rmax: its capacity; nrow: entries currently used */
509581824310SBarry Smith     rp   = aj + ai[row]; ap = aa + ai[row];
509681824310SBarry Smith     rmax = imax[row]; nrow = ailen[row];
    /* [low,high) is the window of the row that is searched for the next column */
509781824310SBarry Smith     low  = 0;
509881824310SBarry Smith     high = nrow;
509981824310SBarry Smith     for (l=0; l<n; l++) { /* loop over added columns */
510081824310SBarry Smith       if (in[l] < 0) continue;
5101cf9c20a2SJed Brown       if (PetscUnlikelyDebug(in[l] >= A->cmap->n)) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Column too large");
510281824310SBarry Smith       col = in[l];
51032205254eSKarl Rupp       if (roworiented) value = v[l + k*n];
51042205254eSKarl Rupp       else value = v[k + l*m];
51052205254eSKarl Rupp 
      /* adding an exact zero changes nothing, so it is skipped when zero entries are ignored */
510681824310SBarry Smith       if (value == 0.0 && ignorezeroentries && (is == ADD_VALUES)) continue;
510781824310SBarry Smith 
      /* a column not larger than the previous one restarts the search from the beginning of the
         row; otherwise low is kept from the previous column and only high is reset */
51082205254eSKarl Rupp       if (col <= lastcol) low = 0;
51092205254eSKarl Rupp       else high = nrow;
511081824310SBarry Smith       lastcol = col;
      /* bisection until the window holds at most 5 entries */
511181824310SBarry Smith       while (high-low > 5) {
511281824310SBarry Smith         t = (low+high)/2;
511381824310SBarry Smith         if (rp[t] > col) high = t;
511481824310SBarry Smith         else             low  = t;
511581824310SBarry Smith       }
      /* linear scan of the window; on exit without a match, i is the position where col belongs */
511681824310SBarry Smith       for (i=low; i<high; i++) {
511781824310SBarry Smith         if (rp[i] > col) break;
511881824310SBarry Smith         if (rp[i] == col) {
511981824310SBarry Smith           if (is == ADD_VALUES) ap[i] += value;
512081824310SBarry Smith           else                  ap[i] = value;
512181824310SBarry Smith           goto noinsert;
512281824310SBarry Smith         }
512381824310SBarry Smith       }
      /* col is not stored in this row: decide whether a new nonzero may be created */
512481824310SBarry Smith       if (value == 0.0 && ignorezeroentries) goto noinsert;
      /* nonew == 1: silently drop the new entry; nonew == -1: creating it is an error */
512581824310SBarry Smith       if (nonew == 1) goto noinsert;
5126ce94432eSBarry Smith       if (nonew == -1) SETERRABORT(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_OUTOFRANGE,"Inserting a new nonzero in the matrix");
      /* NOTE(review): macro defined outside this chunk; presumably enlarges the storage when the
         row is full (nrow >= rmax), updates aa/ai/aj/rp/ap/rmax in place and relies on locals of
         this function such as ierr and ii -- confirm in aij.h before renaming anything here */
5127fef13f97SBarry Smith       MatSeqXAIJReallocateAIJ(A,A->rmap->n,1,nrow,row,col,rmax,aa,ai,aj,rp,ap,imax,nonew,MatScalar);
      /* N is the index of the last entry before the insertion; the row and the matrix grow by one */
512881824310SBarry Smith       N = nrow++ - 1; a->nz++; high++;
512981824310SBarry Smith       /* shift up all the later entries in this row */
513081824310SBarry Smith       for (ii=N; ii>=i; ii--) {
513181824310SBarry Smith         rp[ii+1] = rp[ii];
513281824310SBarry Smith         ap[ii+1] = ap[ii];
513381824310SBarry Smith       }
513481824310SBarry Smith       rp[i] = col;
513581824310SBarry Smith       ap[i] = value;
      /* the nonzero structure changed */
5136e56f5c9eSBarry Smith       A->nonzerostate++;
513781824310SBarry Smith noinsert:;
      /* the next search starts just after the position used for this column */
513881824310SBarry Smith       low = i + 1;
513981824310SBarry Smith     }
    /* store the updated row length */
514081824310SBarry Smith     ailen[row] = nrow;
514181824310SBarry Smith   }
514281824310SBarry Smith   PetscFunctionReturnVoid();
514381824310SBarry Smith }
5144