xref: /petsc/src/mat/impls/aij/mpi/mumps/mumps.c (revision 33d57670fcdbf57d9203d482728f549b81403a0e)
11c2a3de1SBarry Smith 
2397b6df1SKris Buschelman /*
3c2b5dc30SHong Zhang     Provides an interface to the MUMPS sparse solver
4397b6df1SKris Buschelman */
551d5961aSHong Zhang 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I  "petscmat.h"  I*/
7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h>
8397b6df1SKris Buschelman 
9397b6df1SKris Buschelman EXTERN_C_BEGIN
10397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
112907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
122907cef9SHong Zhang #include <cmumps_c.h>
132907cef9SHong Zhang #else
14c6db04a5SJed Brown #include <zmumps_c.h>
152907cef9SHong Zhang #endif
162907cef9SHong Zhang #else
172907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
182907cef9SHong Zhang #include <smumps_c.h>
19397b6df1SKris Buschelman #else
20c6db04a5SJed Brown #include <dmumps_c.h>
21397b6df1SKris Buschelman #endif
222907cef9SHong Zhang #endif
23397b6df1SKris Buschelman EXTERN_C_END
/* Values assigned to the MUMPS job field (id.job) to select the phase to run */
#define JOB_INIT         -1
#define JOB_FACTSYMBOLIC 1
#define JOB_FACTNUMERIC  2
#define JOB_SOLVE        3
#define JOB_END          -2

/* calls to MUMPS: PetscMUMPS_c names the driver matching PETSc's scalar kind and precision */
#if defined(PETSC_USE_COMPLEX) && defined(PETSC_USE_REAL_SINGLE)
#define PetscMUMPS_c cmumps_c
#elif defined(PETSC_USE_COMPLEX)
#define PetscMUMPS_c zmumps_c
#elif defined(PETSC_USE_REAL_SINGLE)
#define PetscMUMPS_c smumps_c
#else
#define PetscMUMPS_c dmumps_c
#endif

/*
   Accessors that shift a 1-based index onto the underlying 0-based C arrays,
   s.t. indices match MUMPS documentation, e.g. id.ICNTL(9) reads id.icntl[8].
*/
#define ICNTL(I)  icntl[(I)-1]
#define CNTL(I)   cntl[(I)-1]
#define INFOG(I)  infog[(I)-1]
#define INFO(I)   info[(I)-1]
#define RINFOG(I) rinfog[(I)-1]
#define RINFO(I)  rinfo[(I)-1]
53397b6df1SKris Buschelman 
54397b6df1SKris Buschelman typedef struct {
55397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
562907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
572907cef9SHong Zhang   CMUMPS_STRUC_C id;
582907cef9SHong Zhang #else
59397b6df1SKris Buschelman   ZMUMPS_STRUC_C id;
602907cef9SHong Zhang #endif
612907cef9SHong Zhang #else
622907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
632907cef9SHong Zhang   SMUMPS_STRUC_C id;
64397b6df1SKris Buschelman #else
65397b6df1SKris Buschelman   DMUMPS_STRUC_C id;
66397b6df1SKris Buschelman #endif
672907cef9SHong Zhang #endif
682907cef9SHong Zhang 
69397b6df1SKris Buschelman   MatStructure matstruc;
70c1490034SHong Zhang   PetscMPIInt  myid,size;
71a5e57a09SHong Zhang   PetscInt     *irn,*jcn,nz,sym;
72397b6df1SKris Buschelman   PetscScalar  *val;
73397b6df1SKris Buschelman   MPI_Comm     comm_mumps;
74329ec9b3SHong Zhang   VecScatter   scat_rhs, scat_sol;
7564e6c443SBarry Smith   PetscBool    isAIJ,CleanUpMUMPS;
76329ec9b3SHong Zhang   Vec          b_seq,x_seq;
77a5e57a09SHong Zhang   PetscInt     ICNTL9_pre;   /* check if ICNTL(9) is changed from previous MatSolve */
782205254eSKarl Rupp 
79bf0cc555SLisandro Dalcin   PetscErrorCode (*Destroy)(Mat);
80bccb9932SShri Abhyankar   PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**);
81f0c56d0fSKris Buschelman } Mat_MUMPS;
82f0c56d0fSKris Buschelman 
8309573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*);
84b24902e0SBarry Smith 
8567877ebaSShri Abhyankar 
8667877ebaSShri Abhyankar /* MatConvertToTriples_A_B */
8767877ebaSShri Abhyankar /*convert Petsc matrix to triples: row[nz], col[nz], val[nz] */
88397b6df1SKris Buschelman /*
89397b6df1SKris Buschelman   input:
9067877ebaSShri Abhyankar     A       - matrix in aij,baij or sbaij (bs=1) format
91397b6df1SKris Buschelman     shift   - 0: C style output triple; 1: Fortran style output triple.
92bccb9932SShri Abhyankar     reuse   - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple
93bccb9932SShri Abhyankar               MAT_REUSE_MATRIX:   only the values in v array are updated
94397b6df1SKris Buschelman   output:
95397b6df1SKris Buschelman     nnz     - dim of r, c, and v (number of local nonzero entries of A)
96397b6df1SKris Buschelman     r, c, v - row and col index, matrix values (matrix triples)
97eb9baa12SBarry Smith 
  The returned values r, c, and sometimes v are obtained from a single allocation; MatDestroy_MUMPS() later frees that
  buffer with PetscFree(mumps->irn). This is not ideal code: because v is ONLY sometimes part of the mumps->irn
  allocation, the PetscMalloc() cannot easily be replaced with a PetscMalloc3().
101eb9baa12SBarry Smith 
102397b6df1SKris Buschelman  */
10316ebf90aSShri Abhyankar 
10416ebf90aSShri Abhyankar #undef __FUNCT__
10516ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij"
106bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
107b24902e0SBarry Smith {
108185f6596SHong Zhang   const PetscInt *ai,*aj,*ajj,M=A->rmap->n;
10967877ebaSShri Abhyankar   PetscInt       nz,rnz,i,j;
110dfbe8321SBarry Smith   PetscErrorCode ierr;
111c1490034SHong Zhang   PetscInt       *row,*col;
11216ebf90aSShri Abhyankar   Mat_SeqAIJ     *aa=(Mat_SeqAIJ*)A->data;
113397b6df1SKris Buschelman 
114397b6df1SKris Buschelman   PetscFunctionBegin;
11516ebf90aSShri Abhyankar   *v=aa->a;
116bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
1172205254eSKarl Rupp     nz   = aa->nz;
1182205254eSKarl Rupp     ai   = aa->i;
1192205254eSKarl Rupp     aj   = aa->j;
12016ebf90aSShri Abhyankar     *nnz = nz;
121785e854fSJed Brown     ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr);
122185f6596SHong Zhang     col  = row + nz;
123185f6596SHong Zhang 
12416ebf90aSShri Abhyankar     nz = 0;
12516ebf90aSShri Abhyankar     for (i=0; i<M; i++) {
12616ebf90aSShri Abhyankar       rnz = ai[i+1] - ai[i];
12767877ebaSShri Abhyankar       ajj = aj + ai[i];
12867877ebaSShri Abhyankar       for (j=0; j<rnz; j++) {
12967877ebaSShri Abhyankar         row[nz] = i+shift; col[nz++] = ajj[j] + shift;
13016ebf90aSShri Abhyankar       }
13116ebf90aSShri Abhyankar     }
13216ebf90aSShri Abhyankar     *r = row; *c = col;
13316ebf90aSShri Abhyankar   }
13416ebf90aSShri Abhyankar   PetscFunctionReturn(0);
13516ebf90aSShri Abhyankar }
136397b6df1SKris Buschelman 
13716ebf90aSShri Abhyankar #undef __FUNCT__
13867877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij"
139bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
14067877ebaSShri Abhyankar {
14167877ebaSShri Abhyankar   Mat_SeqBAIJ    *aa=(Mat_SeqBAIJ*)A->data;
142*33d57670SJed Brown   const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2;
143*33d57670SJed Brown   PetscInt       bs,M,nz,idx=0,rnz,i,j,k,m;
14467877ebaSShri Abhyankar   PetscErrorCode ierr;
14567877ebaSShri Abhyankar   PetscInt       *row,*col;
14667877ebaSShri Abhyankar 
14767877ebaSShri Abhyankar   PetscFunctionBegin;
148*33d57670SJed Brown   ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr);
149*33d57670SJed Brown   M = A->rmap->N/bs;
150cf3759fdSShri Abhyankar   *v = aa->a;
151bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
152cf3759fdSShri Abhyankar     ai   = aa->i; aj = aa->j;
15367877ebaSShri Abhyankar     nz   = bs2*aa->nz;
15467877ebaSShri Abhyankar     *nnz = nz;
155785e854fSJed Brown     ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr);
156185f6596SHong Zhang     col  = row + nz;
157185f6596SHong Zhang 
15867877ebaSShri Abhyankar     for (i=0; i<M; i++) {
15967877ebaSShri Abhyankar       ajj = aj + ai[i];
16067877ebaSShri Abhyankar       rnz = ai[i+1] - ai[i];
16167877ebaSShri Abhyankar       for (k=0; k<rnz; k++) {
16267877ebaSShri Abhyankar         for (j=0; j<bs; j++) {
16367877ebaSShri Abhyankar           for (m=0; m<bs; m++) {
16467877ebaSShri Abhyankar             row[idx]   = i*bs + m + shift;
165cf3759fdSShri Abhyankar             col[idx++] = bs*(ajj[k]) + j + shift;
16667877ebaSShri Abhyankar           }
16767877ebaSShri Abhyankar         }
16867877ebaSShri Abhyankar       }
16967877ebaSShri Abhyankar     }
170cf3759fdSShri Abhyankar     *r = row; *c = col;
17167877ebaSShri Abhyankar   }
17267877ebaSShri Abhyankar   PetscFunctionReturn(0);
17367877ebaSShri Abhyankar }
17467877ebaSShri Abhyankar 
17567877ebaSShri Abhyankar #undef __FUNCT__
17616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij"
177bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
17816ebf90aSShri Abhyankar {
17967877ebaSShri Abhyankar   const PetscInt *ai, *aj,*ajj,M=A->rmap->n;
18067877ebaSShri Abhyankar   PetscInt       nz,rnz,i,j;
18116ebf90aSShri Abhyankar   PetscErrorCode ierr;
18216ebf90aSShri Abhyankar   PetscInt       *row,*col;
18316ebf90aSShri Abhyankar   Mat_SeqSBAIJ   *aa=(Mat_SeqSBAIJ*)A->data;
18416ebf90aSShri Abhyankar 
18516ebf90aSShri Abhyankar   PetscFunctionBegin;
186882afa5aSHong Zhang   *v = aa->a;
187bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
1882205254eSKarl Rupp     nz   = aa->nz;
1892205254eSKarl Rupp     ai   = aa->i;
1902205254eSKarl Rupp     aj   = aa->j;
1912205254eSKarl Rupp     *v   = aa->a;
19216ebf90aSShri Abhyankar     *nnz = nz;
193785e854fSJed Brown     ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr);
194185f6596SHong Zhang     col  = row + nz;
195185f6596SHong Zhang 
19616ebf90aSShri Abhyankar     nz = 0;
19716ebf90aSShri Abhyankar     for (i=0; i<M; i++) {
19816ebf90aSShri Abhyankar       rnz = ai[i+1] - ai[i];
19967877ebaSShri Abhyankar       ajj = aj + ai[i];
20067877ebaSShri Abhyankar       for (j=0; j<rnz; j++) {
20167877ebaSShri Abhyankar         row[nz] = i+shift; col[nz++] = ajj[j] + shift;
20216ebf90aSShri Abhyankar       }
20316ebf90aSShri Abhyankar     }
20416ebf90aSShri Abhyankar     *r = row; *c = col;
20516ebf90aSShri Abhyankar   }
20616ebf90aSShri Abhyankar   PetscFunctionReturn(0);
20716ebf90aSShri Abhyankar }
20816ebf90aSShri Abhyankar 
20916ebf90aSShri Abhyankar #undef __FUNCT__
21016ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij"
211bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
21216ebf90aSShri Abhyankar {
21367877ebaSShri Abhyankar   const PetscInt    *ai,*aj,*ajj,*adiag,M=A->rmap->n;
21467877ebaSShri Abhyankar   PetscInt          nz,rnz,i,j;
21567877ebaSShri Abhyankar   const PetscScalar *av,*v1;
21616ebf90aSShri Abhyankar   PetscScalar       *val;
21716ebf90aSShri Abhyankar   PetscErrorCode    ierr;
21816ebf90aSShri Abhyankar   PetscInt          *row,*col;
21916ebf90aSShri Abhyankar   Mat_SeqSBAIJ      *aa=(Mat_SeqSBAIJ*)A->data;
22016ebf90aSShri Abhyankar 
22116ebf90aSShri Abhyankar   PetscFunctionBegin;
22216ebf90aSShri Abhyankar   ai   =aa->i; aj=aa->j;av=aa->a;
22316ebf90aSShri Abhyankar   adiag=aa->diag;
224bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
22516ebf90aSShri Abhyankar     nz   = M + (aa->nz-M)/2;
22616ebf90aSShri Abhyankar     *nnz = nz;
227185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
228185f6596SHong Zhang     col  = row + nz;
229185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
230185f6596SHong Zhang 
23116ebf90aSShri Abhyankar     nz = 0;
23216ebf90aSShri Abhyankar     for (i=0; i<M; i++) {
23316ebf90aSShri Abhyankar       rnz = ai[i+1] - adiag[i];
23467877ebaSShri Abhyankar       ajj = aj + adiag[i];
235cf3759fdSShri Abhyankar       v1  = av + adiag[i];
23667877ebaSShri Abhyankar       for (j=0; j<rnz; j++) {
23767877ebaSShri Abhyankar         row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j];
23816ebf90aSShri Abhyankar       }
23916ebf90aSShri Abhyankar     }
24016ebf90aSShri Abhyankar     *r = row; *c = col; *v = val;
241397b6df1SKris Buschelman   } else {
24216ebf90aSShri Abhyankar     nz = 0; val = *v;
24316ebf90aSShri Abhyankar     for (i=0; i <M; i++) {
24416ebf90aSShri Abhyankar       rnz = ai[i+1] - adiag[i];
24567877ebaSShri Abhyankar       ajj = aj + adiag[i];
24667877ebaSShri Abhyankar       v1  = av + adiag[i];
24767877ebaSShri Abhyankar       for (j=0; j<rnz; j++) {
24867877ebaSShri Abhyankar         val[nz++] = v1[j];
24916ebf90aSShri Abhyankar       }
25016ebf90aSShri Abhyankar     }
25116ebf90aSShri Abhyankar   }
25216ebf90aSShri Abhyankar   PetscFunctionReturn(0);
25316ebf90aSShri Abhyankar }
25416ebf90aSShri Abhyankar 
25516ebf90aSShri Abhyankar #undef __FUNCT__
25616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij"
257bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
25816ebf90aSShri Abhyankar {
25916ebf90aSShri Abhyankar   const PetscInt    *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj;
26016ebf90aSShri Abhyankar   PetscErrorCode    ierr;
26116ebf90aSShri Abhyankar   PetscInt          rstart,nz,i,j,jj,irow,countA,countB;
26216ebf90aSShri Abhyankar   PetscInt          *row,*col;
26316ebf90aSShri Abhyankar   const PetscScalar *av, *bv,*v1,*v2;
26416ebf90aSShri Abhyankar   PetscScalar       *val;
265397b6df1SKris Buschelman   Mat_MPISBAIJ      *mat = (Mat_MPISBAIJ*)A->data;
266397b6df1SKris Buschelman   Mat_SeqSBAIJ      *aa  = (Mat_SeqSBAIJ*)(mat->A)->data;
267397b6df1SKris Buschelman   Mat_SeqBAIJ       *bb  = (Mat_SeqBAIJ*)(mat->B)->data;
26816ebf90aSShri Abhyankar 
26916ebf90aSShri Abhyankar   PetscFunctionBegin;
270d0f46423SBarry Smith   ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart;
271397b6df1SKris Buschelman   av=aa->a; bv=bb->a;
272397b6df1SKris Buschelman 
2732205254eSKarl Rupp   garray = mat->garray;
2742205254eSKarl Rupp 
275bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
27616ebf90aSShri Abhyankar     nz   = aa->nz + bb->nz;
27716ebf90aSShri Abhyankar     *nnz = nz;
278185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
279185f6596SHong Zhang     col  = row + nz;
280185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
281185f6596SHong Zhang 
282397b6df1SKris Buschelman     *r = row; *c = col; *v = val;
283397b6df1SKris Buschelman   } else {
284397b6df1SKris Buschelman     row = *r; col = *c; val = *v;
285397b6df1SKris Buschelman   }
286397b6df1SKris Buschelman 
287028e57e8SHong Zhang   jj = 0; irow = rstart;
288397b6df1SKris Buschelman   for (i=0; i<m; i++) {
289397b6df1SKris Buschelman     ajj    = aj + ai[i];                 /* ptr to the beginning of this row */
290397b6df1SKris Buschelman     countA = ai[i+1] - ai[i];
291397b6df1SKris Buschelman     countB = bi[i+1] - bi[i];
292397b6df1SKris Buschelman     bjj    = bj + bi[i];
29316ebf90aSShri Abhyankar     v1     = av + ai[i];
29416ebf90aSShri Abhyankar     v2     = bv + bi[i];
295397b6df1SKris Buschelman 
296397b6df1SKris Buschelman     /* A-part */
297397b6df1SKris Buschelman     for (j=0; j<countA; j++) {
298bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
299397b6df1SKris Buschelman         row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift;
300397b6df1SKris Buschelman       }
30116ebf90aSShri Abhyankar       val[jj++] = v1[j];
302397b6df1SKris Buschelman     }
30316ebf90aSShri Abhyankar 
30416ebf90aSShri Abhyankar     /* B-part */
30516ebf90aSShri Abhyankar     for (j=0; j < countB; j++) {
306bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
307397b6df1SKris Buschelman         row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift;
308397b6df1SKris Buschelman       }
30916ebf90aSShri Abhyankar       val[jj++] = v2[j];
31016ebf90aSShri Abhyankar     }
31116ebf90aSShri Abhyankar     irow++;
31216ebf90aSShri Abhyankar   }
31316ebf90aSShri Abhyankar   PetscFunctionReturn(0);
31416ebf90aSShri Abhyankar }
31516ebf90aSShri Abhyankar 
31616ebf90aSShri Abhyankar #undef __FUNCT__
31716ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij"
318bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
31916ebf90aSShri Abhyankar {
32016ebf90aSShri Abhyankar   const PetscInt    *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj;
32116ebf90aSShri Abhyankar   PetscErrorCode    ierr;
32216ebf90aSShri Abhyankar   PetscInt          rstart,nz,i,j,jj,irow,countA,countB;
32316ebf90aSShri Abhyankar   PetscInt          *row,*col;
32416ebf90aSShri Abhyankar   const PetscScalar *av, *bv,*v1,*v2;
32516ebf90aSShri Abhyankar   PetscScalar       *val;
32616ebf90aSShri Abhyankar   Mat_MPIAIJ        *mat = (Mat_MPIAIJ*)A->data;
32716ebf90aSShri Abhyankar   Mat_SeqAIJ        *aa  = (Mat_SeqAIJ*)(mat->A)->data;
32816ebf90aSShri Abhyankar   Mat_SeqAIJ        *bb  = (Mat_SeqAIJ*)(mat->B)->data;
32916ebf90aSShri Abhyankar 
33016ebf90aSShri Abhyankar   PetscFunctionBegin;
33116ebf90aSShri Abhyankar   ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart;
33216ebf90aSShri Abhyankar   av=aa->a; bv=bb->a;
33316ebf90aSShri Abhyankar 
3342205254eSKarl Rupp   garray = mat->garray;
3352205254eSKarl Rupp 
336bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
33716ebf90aSShri Abhyankar     nz   = aa->nz + bb->nz;
33816ebf90aSShri Abhyankar     *nnz = nz;
339185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
340185f6596SHong Zhang     col  = row + nz;
341185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
342185f6596SHong Zhang 
34316ebf90aSShri Abhyankar     *r = row; *c = col; *v = val;
34416ebf90aSShri Abhyankar   } else {
34516ebf90aSShri Abhyankar     row = *r; col = *c; val = *v;
34616ebf90aSShri Abhyankar   }
34716ebf90aSShri Abhyankar 
34816ebf90aSShri Abhyankar   jj = 0; irow = rstart;
34916ebf90aSShri Abhyankar   for (i=0; i<m; i++) {
35016ebf90aSShri Abhyankar     ajj    = aj + ai[i];                 /* ptr to the beginning of this row */
35116ebf90aSShri Abhyankar     countA = ai[i+1] - ai[i];
35216ebf90aSShri Abhyankar     countB = bi[i+1] - bi[i];
35316ebf90aSShri Abhyankar     bjj    = bj + bi[i];
35416ebf90aSShri Abhyankar     v1     = av + ai[i];
35516ebf90aSShri Abhyankar     v2     = bv + bi[i];
35616ebf90aSShri Abhyankar 
35716ebf90aSShri Abhyankar     /* A-part */
35816ebf90aSShri Abhyankar     for (j=0; j<countA; j++) {
359bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
36016ebf90aSShri Abhyankar         row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift;
36116ebf90aSShri Abhyankar       }
36216ebf90aSShri Abhyankar       val[jj++] = v1[j];
36316ebf90aSShri Abhyankar     }
36416ebf90aSShri Abhyankar 
36516ebf90aSShri Abhyankar     /* B-part */
36616ebf90aSShri Abhyankar     for (j=0; j < countB; j++) {
367bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
36816ebf90aSShri Abhyankar         row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift;
36916ebf90aSShri Abhyankar       }
37016ebf90aSShri Abhyankar       val[jj++] = v2[j];
37116ebf90aSShri Abhyankar     }
37216ebf90aSShri Abhyankar     irow++;
37316ebf90aSShri Abhyankar   }
37416ebf90aSShri Abhyankar   PetscFunctionReturn(0);
37516ebf90aSShri Abhyankar }
37616ebf90aSShri Abhyankar 
37716ebf90aSShri Abhyankar #undef __FUNCT__
37867877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij"
379bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
38067877ebaSShri Abhyankar {
38167877ebaSShri Abhyankar   Mat_MPIBAIJ       *mat    = (Mat_MPIBAIJ*)A->data;
38267877ebaSShri Abhyankar   Mat_SeqBAIJ       *aa     = (Mat_SeqBAIJ*)(mat->A)->data;
38367877ebaSShri Abhyankar   Mat_SeqBAIJ       *bb     = (Mat_SeqBAIJ*)(mat->B)->data;
38467877ebaSShri Abhyankar   const PetscInt    *ai     = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj;
385d985c460SShri Abhyankar   const PetscInt    *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart;
386*33d57670SJed Brown   const PetscInt    bs2=mat->bs2;
38767877ebaSShri Abhyankar   PetscErrorCode    ierr;
388*33d57670SJed Brown   PetscInt          bs,nz,i,j,k,n,jj,irow,countA,countB,idx;
38967877ebaSShri Abhyankar   PetscInt          *row,*col;
39067877ebaSShri Abhyankar   const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2;
39167877ebaSShri Abhyankar   PetscScalar       *val;
39267877ebaSShri Abhyankar 
39367877ebaSShri Abhyankar   PetscFunctionBegin;
394*33d57670SJed Brown   ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr);
395bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
39667877ebaSShri Abhyankar     nz   = bs2*(aa->nz + bb->nz);
39767877ebaSShri Abhyankar     *nnz = nz;
398185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
399185f6596SHong Zhang     col  = row + nz;
400185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
401185f6596SHong Zhang 
40267877ebaSShri Abhyankar     *r = row; *c = col; *v = val;
40367877ebaSShri Abhyankar   } else {
40467877ebaSShri Abhyankar     row = *r; col = *c; val = *v;
40567877ebaSShri Abhyankar   }
40667877ebaSShri Abhyankar 
407d985c460SShri Abhyankar   jj = 0; irow = rstart;
40867877ebaSShri Abhyankar   for (i=0; i<mbs; i++) {
40967877ebaSShri Abhyankar     countA = ai[i+1] - ai[i];
41067877ebaSShri Abhyankar     countB = bi[i+1] - bi[i];
41167877ebaSShri Abhyankar     ajj    = aj + ai[i];
41267877ebaSShri Abhyankar     bjj    = bj + bi[i];
41367877ebaSShri Abhyankar     v1     = av + bs2*ai[i];
41467877ebaSShri Abhyankar     v2     = bv + bs2*bi[i];
41567877ebaSShri Abhyankar 
41667877ebaSShri Abhyankar     idx = 0;
41767877ebaSShri Abhyankar     /* A-part */
41867877ebaSShri Abhyankar     for (k=0; k<countA; k++) {
41967877ebaSShri Abhyankar       for (j=0; j<bs; j++) {
42067877ebaSShri Abhyankar         for (n=0; n<bs; n++) {
421bccb9932SShri Abhyankar           if (reuse == MAT_INITIAL_MATRIX) {
422d985c460SShri Abhyankar             row[jj] = irow + n + shift;
423d985c460SShri Abhyankar             col[jj] = rstart + bs*ajj[k] + j + shift;
42467877ebaSShri Abhyankar           }
42567877ebaSShri Abhyankar           val[jj++] = v1[idx++];
42667877ebaSShri Abhyankar         }
42767877ebaSShri Abhyankar       }
42867877ebaSShri Abhyankar     }
42967877ebaSShri Abhyankar 
43067877ebaSShri Abhyankar     idx = 0;
43167877ebaSShri Abhyankar     /* B-part */
43267877ebaSShri Abhyankar     for (k=0; k<countB; k++) {
43367877ebaSShri Abhyankar       for (j=0; j<bs; j++) {
43467877ebaSShri Abhyankar         for (n=0; n<bs; n++) {
435bccb9932SShri Abhyankar           if (reuse == MAT_INITIAL_MATRIX) {
436d985c460SShri Abhyankar             row[jj] = irow + n + shift;
437d985c460SShri Abhyankar             col[jj] = bs*garray[bjj[k]] + j + shift;
43867877ebaSShri Abhyankar           }
439d985c460SShri Abhyankar           val[jj++] = v2[idx++];
44067877ebaSShri Abhyankar         }
44167877ebaSShri Abhyankar       }
44267877ebaSShri Abhyankar     }
443d985c460SShri Abhyankar     irow += bs;
44467877ebaSShri Abhyankar   }
44567877ebaSShri Abhyankar   PetscFunctionReturn(0);
44667877ebaSShri Abhyankar }
44767877ebaSShri Abhyankar 
44867877ebaSShri Abhyankar #undef __FUNCT__
44916ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij"
450bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
45116ebf90aSShri Abhyankar {
45216ebf90aSShri Abhyankar   const PetscInt    *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj;
45316ebf90aSShri Abhyankar   PetscErrorCode    ierr;
454e0bace9bSHong Zhang   PetscInt          rstart,nz,nza,nzb,i,j,jj,irow,countA,countB;
45516ebf90aSShri Abhyankar   PetscInt          *row,*col;
45616ebf90aSShri Abhyankar   const PetscScalar *av, *bv,*v1,*v2;
45716ebf90aSShri Abhyankar   PetscScalar       *val;
45816ebf90aSShri Abhyankar   Mat_MPIAIJ        *mat =  (Mat_MPIAIJ*)A->data;
45916ebf90aSShri Abhyankar   Mat_SeqAIJ        *aa  =(Mat_SeqAIJ*)(mat->A)->data;
46016ebf90aSShri Abhyankar   Mat_SeqAIJ        *bb  =(Mat_SeqAIJ*)(mat->B)->data;
46116ebf90aSShri Abhyankar 
46216ebf90aSShri Abhyankar   PetscFunctionBegin;
46316ebf90aSShri Abhyankar   ai=aa->i; aj=aa->j; adiag=aa->diag;
46416ebf90aSShri Abhyankar   bi=bb->i; bj=bb->j; garray = mat->garray;
46516ebf90aSShri Abhyankar   av=aa->a; bv=bb->a;
4662205254eSKarl Rupp 
46716ebf90aSShri Abhyankar   rstart = A->rmap->rstart;
46816ebf90aSShri Abhyankar 
469bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
470e0bace9bSHong Zhang     nza = 0;    /* num of upper triangular entries in mat->A, including diagonals */
471e0bace9bSHong Zhang     nzb = 0;    /* num of upper triangular entries in mat->B */
47216ebf90aSShri Abhyankar     for (i=0; i<m; i++) {
473e0bace9bSHong Zhang       nza   += (ai[i+1] - adiag[i]);
47416ebf90aSShri Abhyankar       countB = bi[i+1] - bi[i];
47516ebf90aSShri Abhyankar       bjj    = bj + bi[i];
476e0bace9bSHong Zhang       for (j=0; j<countB; j++) {
477e0bace9bSHong Zhang         if (garray[bjj[j]] > rstart) nzb++;
478e0bace9bSHong Zhang       }
479e0bace9bSHong Zhang     }
48016ebf90aSShri Abhyankar 
481e0bace9bSHong Zhang     nz   = nza + nzb; /* total nz of upper triangular part of mat */
48216ebf90aSShri Abhyankar     *nnz = nz;
483185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
484185f6596SHong Zhang     col  = row + nz;
485185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
486185f6596SHong Zhang 
48716ebf90aSShri Abhyankar     *r = row; *c = col; *v = val;
48816ebf90aSShri Abhyankar   } else {
48916ebf90aSShri Abhyankar     row = *r; col = *c; val = *v;
49016ebf90aSShri Abhyankar   }
49116ebf90aSShri Abhyankar 
49216ebf90aSShri Abhyankar   jj = 0; irow = rstart;
49316ebf90aSShri Abhyankar   for (i=0; i<m; i++) {
49416ebf90aSShri Abhyankar     ajj    = aj + adiag[i];                 /* ptr to the beginning of the diagonal of this row */
49516ebf90aSShri Abhyankar     v1     = av + adiag[i];
49616ebf90aSShri Abhyankar     countA = ai[i+1] - adiag[i];
49716ebf90aSShri Abhyankar     countB = bi[i+1] - bi[i];
49816ebf90aSShri Abhyankar     bjj    = bj + bi[i];
49916ebf90aSShri Abhyankar     v2     = bv + bi[i];
50016ebf90aSShri Abhyankar 
50116ebf90aSShri Abhyankar     /* A-part */
50216ebf90aSShri Abhyankar     for (j=0; j<countA; j++) {
503bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
50416ebf90aSShri Abhyankar         row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift;
50516ebf90aSShri Abhyankar       }
50616ebf90aSShri Abhyankar       val[jj++] = v1[j];
50716ebf90aSShri Abhyankar     }
50816ebf90aSShri Abhyankar 
50916ebf90aSShri Abhyankar     /* B-part */
51016ebf90aSShri Abhyankar     for (j=0; j < countB; j++) {
51116ebf90aSShri Abhyankar       if (garray[bjj[j]] > rstart) {
512bccb9932SShri Abhyankar         if (reuse == MAT_INITIAL_MATRIX) {
51316ebf90aSShri Abhyankar           row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift;
51416ebf90aSShri Abhyankar         }
51516ebf90aSShri Abhyankar         val[jj++] = v2[j];
51616ebf90aSShri Abhyankar       }
517397b6df1SKris Buschelman     }
518397b6df1SKris Buschelman     irow++;
519397b6df1SKris Buschelman   }
520397b6df1SKris Buschelman   PetscFunctionReturn(0);
521397b6df1SKris Buschelman }
522397b6df1SKris Buschelman 
523397b6df1SKris Buschelman #undef __FUNCT__
5243924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS"
525dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A)
526dfbe8321SBarry Smith {
527a5e57a09SHong Zhang   Mat_MUMPS      *mumps=(Mat_MUMPS*)A->spptr;
528dfbe8321SBarry Smith   PetscErrorCode ierr;
529b24902e0SBarry Smith 
530397b6df1SKris Buschelman   PetscFunctionBegin;
531a5e57a09SHong Zhang   if (mumps->CleanUpMUMPS) {
532397b6df1SKris Buschelman     /* Terminate instance, deallocate memories */
533a5e57a09SHong Zhang     ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr);
534a5e57a09SHong Zhang     ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr);
535a5e57a09SHong Zhang     ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr);
536a5e57a09SHong Zhang     ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr);
537a5e57a09SHong Zhang     ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr);
538a5e57a09SHong Zhang     ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr);
539a5e57a09SHong Zhang     ierr = PetscFree(mumps->irn);CHKERRQ(ierr);
5402205254eSKarl Rupp 
541a5e57a09SHong Zhang     mumps->id.job = JOB_END;
542a5e57a09SHong Zhang     PetscMUMPS_c(&mumps->id);
543a5e57a09SHong Zhang     ierr = MPI_Comm_free(&(mumps->comm_mumps));CHKERRQ(ierr);
544397b6df1SKris Buschelman   }
545a5e57a09SHong Zhang   if (mumps->Destroy) {
546a5e57a09SHong Zhang     ierr = (mumps->Destroy)(A);CHKERRQ(ierr);
547bf0cc555SLisandro Dalcin   }
548bf0cc555SLisandro Dalcin   ierr = PetscFree(A->spptr);CHKERRQ(ierr);
549bf0cc555SLisandro Dalcin 
55097969023SHong Zhang   /* clear composed functions */
551bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr);
552bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr);
553bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr);
554397b6df1SKris Buschelman   PetscFunctionReturn(0);
555397b6df1SKris Buschelman }
556397b6df1SKris Buschelman 
557397b6df1SKris Buschelman #undef __FUNCT__
558f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS"
559b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x)
560b24902e0SBarry Smith {
561a5e57a09SHong Zhang   Mat_MUMPS        *mumps=(Mat_MUMPS*)A->spptr;
562d54de34fSKris Buschelman   PetscScalar      *array;
56367877ebaSShri Abhyankar   Vec              b_seq;
564329ec9b3SHong Zhang   IS               is_iden,is_petsc;
565dfbe8321SBarry Smith   PetscErrorCode   ierr;
566329ec9b3SHong Zhang   PetscInt         i;
567883f2eb9SBarry Smith   static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE;
568397b6df1SKris Buschelman 
569397b6df1SKris Buschelman   PetscFunctionBegin;
570883f2eb9SBarry Smith   ierr = PetscCitationsRegister("@article{MUMPS01,\n  author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n  title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n  journal = {SIAM Journal on Matrix Analysis and Applications},\n  volume = {23},\n  number = {1},\n  pages = {15--41},\n  year = {2001}\n}\n",&cite1);CHKERRQ(ierr);
571883f2eb9SBarry Smith   ierr = PetscCitationsRegister("@article{MUMPS02,\n  author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n  title = {Hybrid scheduling for the parallel solution of linear systems},\n  journal = {Parallel Computing},\n  volume = {32},\n  number = {2},\n  pages = {136--156},\n  year = {2006}\n}\n",&cite2);CHKERRQ(ierr);
572a5e57a09SHong Zhang   mumps->id.nrhs = 1;
573a5e57a09SHong Zhang   b_seq          = mumps->b_seq;
574a5e57a09SHong Zhang   if (mumps->size > 1) {
575329ec9b3SHong Zhang     /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */
576a5e57a09SHong Zhang     ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
577a5e57a09SHong Zhang     ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
578a5e57a09SHong Zhang     if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);}
579397b6df1SKris Buschelman   } else {  /* size == 1 */
580397b6df1SKris Buschelman     ierr = VecCopy(b,x);CHKERRQ(ierr);
581397b6df1SKris Buschelman     ierr = VecGetArray(x,&array);CHKERRQ(ierr);
582397b6df1SKris Buschelman   }
583a5e57a09SHong Zhang   if (!mumps->myid) { /* define rhs on the host */
584a5e57a09SHong Zhang     mumps->id.nrhs = 1;
585397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
5862907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
587a5e57a09SHong Zhang     mumps->id.rhs = (mumps_complex*)array;
5882907cef9SHong Zhang #else
589a5e57a09SHong Zhang     mumps->id.rhs = (mumps_double_complex*)array;
5902907cef9SHong Zhang #endif
591397b6df1SKris Buschelman #else
592a5e57a09SHong Zhang     mumps->id.rhs = array;
593397b6df1SKris Buschelman #endif
594397b6df1SKris Buschelman   }
595397b6df1SKris Buschelman 
596397b6df1SKris Buschelman   /* solve phase */
597329ec9b3SHong Zhang   /*-------------*/
598a5e57a09SHong Zhang   mumps->id.job = JOB_SOLVE;
599a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
600a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1));
601397b6df1SKris Buschelman 
602a5e57a09SHong Zhang   if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */
603a5e57a09SHong Zhang     if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) {
604a5e57a09SHong Zhang       /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */
605a5e57a09SHong Zhang       ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr);
606397b6df1SKris Buschelman     }
607a5e57a09SHong Zhang     if (!mumps->scat_sol) { /* create scatter scat_sol */
608a5e57a09SHong Zhang       ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */
609a5e57a09SHong Zhang       for (i=0; i<mumps->id.lsol_loc; i++) {
610a5e57a09SHong Zhang         mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */
611a5e57a09SHong Zhang       }
612a5e57a09SHong Zhang       ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr);  /* to */
613a5e57a09SHong Zhang       ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr);
6146bf464f9SBarry Smith       ierr = ISDestroy(&is_iden);CHKERRQ(ierr);
6156bf464f9SBarry Smith       ierr = ISDestroy(&is_petsc);CHKERRQ(ierr);
6162205254eSKarl Rupp 
617a5e57a09SHong Zhang       mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */
618397b6df1SKris Buschelman     }
619a5e57a09SHong Zhang 
620a5e57a09SHong Zhang     ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
621a5e57a09SHong Zhang     ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
622329ec9b3SHong Zhang   }
623397b6df1SKris Buschelman   PetscFunctionReturn(0);
624397b6df1SKris Buschelman }
625397b6df1SKris Buschelman 
62651d5961aSHong Zhang #undef __FUNCT__
62751d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS"
62851d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x)
62951d5961aSHong Zhang {
630a5e57a09SHong Zhang   Mat_MUMPS      *mumps=(Mat_MUMPS*)A->spptr;
63151d5961aSHong Zhang   PetscErrorCode ierr;
63251d5961aSHong Zhang 
63351d5961aSHong Zhang   PetscFunctionBegin;
634a5e57a09SHong Zhang   mumps->id.ICNTL(9) = 0;
6352205254eSKarl Rupp 
6360ad0caddSJed Brown   ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr);
6372205254eSKarl Rupp 
638a5e57a09SHong Zhang   mumps->id.ICNTL(9) = 1;
63951d5961aSHong Zhang   PetscFunctionReturn(0);
64051d5961aSHong Zhang }
64151d5961aSHong Zhang 
642e0b74bf9SHong Zhang #undef __FUNCT__
643e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS"
644e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X)
645e0b74bf9SHong Zhang {
646bda8bf91SBarry Smith   PetscErrorCode ierr;
647bda8bf91SBarry Smith   PetscBool      flg;
648bda8bf91SBarry Smith 
649e0b74bf9SHong Zhang   PetscFunctionBegin;
6500298fd71SBarry Smith   ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr);
651ce94432eSBarry Smith   if (!flg) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix");
6520298fd71SBarry Smith   ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr);
653ce94432eSBarry Smith   if (!flg) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix");
6542205254eSKarl Rupp   SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MatMatSolve_MUMPS() is not implemented yet");
655e0b74bf9SHong Zhang   PetscFunctionReturn(0);
656e0b74bf9SHong Zhang }
657e0b74bf9SHong Zhang 
658ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX)
659a58c3f20SHong Zhang /*
660a58c3f20SHong Zhang   input:
661a58c3f20SHong Zhang    F:        numeric factor
662a58c3f20SHong Zhang   output:
663a58c3f20SHong Zhang    nneg:     total number of negative pivots
664a58c3f20SHong Zhang    nzero:    0
665a58c3f20SHong Zhang    npos:     (global dimension of F) - nneg
666a58c3f20SHong Zhang */
667a58c3f20SHong Zhang 
668a58c3f20SHong Zhang #undef __FUNCT__
669a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS"
670dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos)
671a58c3f20SHong Zhang {
672a5e57a09SHong Zhang   Mat_MUMPS      *mumps =(Mat_MUMPS*)F->spptr;
673dfbe8321SBarry Smith   PetscErrorCode ierr;
674c1490034SHong Zhang   PetscMPIInt    size;
675a58c3f20SHong Zhang 
676a58c3f20SHong Zhang   PetscFunctionBegin;
677ce94432eSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr);
678bcb30aebSHong Zhang   /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */
679a5e57a09SHong Zhang   if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13));
680a58c3f20SHong Zhang   if (nneg) {
681a5e57a09SHong Zhang     if (!mumps->myid) {
682a5e57a09SHong Zhang       *nneg = mumps->id.INFOG(12);
683a58c3f20SHong Zhang     }
684a5e57a09SHong Zhang     ierr = MPI_Bcast(nneg,1,MPI_INT,0,mumps->comm_mumps);CHKERRQ(ierr);
685a58c3f20SHong Zhang   }
686a58c3f20SHong Zhang   if (nzero) *nzero = 0;
687d0f46423SBarry Smith   if (npos)  *npos  = F->rmap->N - (*nneg);
688a58c3f20SHong Zhang   PetscFunctionReturn(0);
689a58c3f20SHong Zhang }
690ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */
691a58c3f20SHong Zhang 
692397b6df1SKris Buschelman #undef __FUNCT__
693f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS"
6940481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info)
695af281ebdSHong Zhang {
696a5e57a09SHong Zhang   Mat_MUMPS      *mumps =(Mat_MUMPS*)(F)->spptr;
6976849ba73SBarry Smith   PetscErrorCode ierr;
698e09efc27SHong Zhang   Mat            F_diag;
699ace3abfcSBarry Smith   PetscBool      isMPIAIJ;
700397b6df1SKris Buschelman 
701397b6df1SKris Buschelman   PetscFunctionBegin;
702a5e57a09SHong Zhang   ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr);
703397b6df1SKris Buschelman 
704397b6df1SKris Buschelman   /* numerical factorization phase */
705329ec9b3SHong Zhang   /*-------------------------------*/
706a5e57a09SHong Zhang   mumps->id.job = JOB_FACTNUMERIC;
707a5e57a09SHong Zhang   if (!mumps->id.ICNTL(18)) {
708a5e57a09SHong Zhang     if (!mumps->myid) {
709397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
7102907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
711a5e57a09SHong Zhang       mumps->id.a = (mumps_complex*)mumps->val;
7122907cef9SHong Zhang #else
713a5e57a09SHong Zhang       mumps->id.a = (mumps_double_complex*)mumps->val;
7142907cef9SHong Zhang #endif
715397b6df1SKris Buschelman #else
716a5e57a09SHong Zhang       mumps->id.a = mumps->val;
717397b6df1SKris Buschelman #endif
718397b6df1SKris Buschelman     }
719397b6df1SKris Buschelman   } else {
720397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
7212907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
722a5e57a09SHong Zhang     mumps->id.a_loc = (mumps_complex*)mumps->val;
7232907cef9SHong Zhang #else
724a5e57a09SHong Zhang     mumps->id.a_loc = (mumps_double_complex*)mumps->val;
7252907cef9SHong Zhang #endif
726397b6df1SKris Buschelman #else
727a5e57a09SHong Zhang     mumps->id.a_loc = mumps->val;
728397b6df1SKris Buschelman #endif
729397b6df1SKris Buschelman   }
730a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
731a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) {
732a5e57a09SHong Zhang     if (mumps->id.INFO(1) == -13) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",mumps->id.INFO(2));
733a5e57a09SHong Zhang     else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2));
734397b6df1SKris Buschelman   }
735a5e57a09SHong Zhang   if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"  mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16));
736397b6df1SKris Buschelman 
737a5e57a09SHong Zhang   if (mumps->size > 1) {
738251f4c67SDmitry Karpeev     ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr);
7392205254eSKarl Rupp     if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A;
7402205254eSKarl Rupp     else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A;
741e09efc27SHong Zhang     F_diag->assembled = PETSC_TRUE;
742a5e57a09SHong Zhang     if (mumps->scat_sol) {
743a5e57a09SHong Zhang       ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr);
744a5e57a09SHong Zhang       ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr);
745a5e57a09SHong Zhang       ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr);
746329ec9b3SHong Zhang     }
7478ada1bb4SHong Zhang   }
748dcd589f8SShri Abhyankar   (F)->assembled      = PETSC_TRUE;
749a5e57a09SHong Zhang   mumps->matstruc     = SAME_NONZERO_PATTERN;
750a5e57a09SHong Zhang   mumps->CleanUpMUMPS = PETSC_TRUE;
75167877ebaSShri Abhyankar 
752a5e57a09SHong Zhang   if (mumps->size > 1) {
75367877ebaSShri Abhyankar     /* distributed solution */
754a5e57a09SHong Zhang     if (!mumps->scat_sol) {
75567877ebaSShri Abhyankar       /* Create x_seq=sol_loc for repeated use */
75667877ebaSShri Abhyankar       PetscInt    lsol_loc;
75767877ebaSShri Abhyankar       PetscScalar *sol_loc;
7582205254eSKarl Rupp 
759a5e57a09SHong Zhang       lsol_loc = mumps->id.INFO(23); /* length of sol_loc */
7602205254eSKarl Rupp 
761dcca6d9dSJed Brown       ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr);
7622205254eSKarl Rupp 
763a5e57a09SHong Zhang       mumps->id.lsol_loc = lsol_loc;
76467877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
7652907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
766a5e57a09SHong Zhang       mumps->id.sol_loc = (mumps_complex*)sol_loc;
7672907cef9SHong Zhang #else
768a5e57a09SHong Zhang       mumps->id.sol_loc = (mumps_double_complex*)sol_loc;
7692907cef9SHong Zhang #endif
77067877ebaSShri Abhyankar #else
771a5e57a09SHong Zhang       mumps->id.sol_loc = sol_loc;
77267877ebaSShri Abhyankar #endif
773a5e57a09SHong Zhang       ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr);
77467877ebaSShri Abhyankar     }
77567877ebaSShri Abhyankar   }
776397b6df1SKris Buschelman   PetscFunctionReturn(0);
777397b6df1SKris Buschelman }
778397b6df1SKris Buschelman 
7799a2535b5SHong Zhang /* Sets MUMPS options from the options database */
780dcd589f8SShri Abhyankar #undef __FUNCT__
7819a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions"
7829a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A)
783dcd589f8SShri Abhyankar {
7849a2535b5SHong Zhang   Mat_MUMPS      *mumps = (Mat_MUMPS*)F->spptr;
785dcd589f8SShri Abhyankar   PetscErrorCode ierr;
786dcd589f8SShri Abhyankar   PetscInt       icntl;
787ace3abfcSBarry Smith   PetscBool      flg;
788dcd589f8SShri Abhyankar 
789dcd589f8SShri Abhyankar   PetscFunctionBegin;
790ce94432eSBarry Smith   ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr);
7919a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr);
7929a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(1) = icntl;
7939a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr);
7949a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(2) = icntl;
7959a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr);
7969a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(3) = icntl;
797dcd589f8SShri Abhyankar 
7989a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr);
7999a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(4) = icntl;
8009a2535b5SHong Zhang   if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */
8019a2535b5SHong Zhang 
8029a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permuting and/or scaling the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr);
8039a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(6) = icntl;
8049a2535b5SHong Zhang 
8059a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): matrix ordering (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr);
806dcd589f8SShri Abhyankar   if (flg) {
8072205254eSKarl Rupp     if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n");
8082205254eSKarl Rupp     else mumps->id.ICNTL(7) = icntl;
809dcd589f8SShri Abhyankar   }
810e0b74bf9SHong Zhang 
8110298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr);
8120298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr);
8130298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to the linear system solved (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr);
8140298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): efficiency control: defines the ordering strategy with scaling constraints (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr);
8150298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): efficiency control: with or without ScaLAPACK","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr);
8160298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage of estimated workspace increase","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr);
8170298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr);
8189a2535b5SHong Zhang 
8190298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core facility (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr);
8200298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr);
8210298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr);
8229a2535b5SHong Zhang   if (mumps->id.ICNTL(24)) {
8239a2535b5SHong Zhang     mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */
824d7ebd59bSHong Zhang   }
825d7ebd59bSHong Zhang 
8260298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): computation of a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr);
8270298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): Schur options for right-hand side or solution vector","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr);
8280298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): experimental parameter","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr);
8290298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr);
8300298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr);
8310298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr);
8320298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): factors can be discarded in the solve phase","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr);
8330298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr);
834dcd589f8SShri Abhyankar 
8350298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr);
8360298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr);
8370298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr);
8380298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr);
8390298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr);
840e5bb22a1SHong Zhang 
8410298fd71SBarry Smith   ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL);
842dcd589f8SShri Abhyankar   PetscOptionsEnd();
843dcd589f8SShri Abhyankar   PetscFunctionReturn(0);
844dcd589f8SShri Abhyankar }
845dcd589f8SShri Abhyankar 
846dcd589f8SShri Abhyankar #undef __FUNCT__
847dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS"
848f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps)
849dcd589f8SShri Abhyankar {
850dcd589f8SShri Abhyankar   PetscErrorCode ierr;
851dcd589f8SShri Abhyankar 
852dcd589f8SShri Abhyankar   PetscFunctionBegin;
853ce94432eSBarry Smith   ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid);
854ce94432eSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr);
855ce94432eSBarry Smith   ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr);
8562205254eSKarl Rupp 
857f697e70eSHong Zhang   mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps);
858f697e70eSHong Zhang 
859f697e70eSHong Zhang   mumps->id.job = JOB_INIT;
860f697e70eSHong Zhang   mumps->id.par = 1;  /* host participates factorizaton and solve */
861f697e70eSHong Zhang   mumps->id.sym = mumps->sym;
8622907cef9SHong Zhang   PetscMUMPS_c(&mumps->id);
863f697e70eSHong Zhang 
864f697e70eSHong Zhang   mumps->CleanUpMUMPS = PETSC_FALSE;
8650298fd71SBarry Smith   mumps->scat_rhs     = NULL;
8660298fd71SBarry Smith   mumps->scat_sol     = NULL;
8679a2535b5SHong Zhang 
86870544d5fSHong Zhang   /* set PETSc-MUMPS default options - override MUMPS default */
8699a2535b5SHong Zhang   mumps->id.ICNTL(3) = 0;
8709a2535b5SHong Zhang   mumps->id.ICNTL(4) = 0;
8719a2535b5SHong Zhang   if (mumps->size == 1) {
8729a2535b5SHong Zhang     mumps->id.ICNTL(18) = 0;   /* centralized assembled matrix input */
8739a2535b5SHong Zhang   } else {
8749a2535b5SHong Zhang     mumps->id.ICNTL(18) = 3;   /* distributed assembled matrix input */
87570544d5fSHong Zhang     mumps->id.ICNTL(21) = 1;   /* distributed solution */
8769a2535b5SHong Zhang   }
877dcd589f8SShri Abhyankar   PetscFunctionReturn(0);
878dcd589f8SShri Abhyankar }
879dcd589f8SShri Abhyankar 
880a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */
881397b6df1SKris Buschelman #undef __FUNCT__
882f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS"
8830481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info)
884b24902e0SBarry Smith {
885a5e57a09SHong Zhang   Mat_MUMPS      *mumps = (Mat_MUMPS*)F->spptr;
886dcd589f8SShri Abhyankar   PetscErrorCode ierr;
88767877ebaSShri Abhyankar   Vec            b;
88867877ebaSShri Abhyankar   IS             is_iden;
88967877ebaSShri Abhyankar   const PetscInt M = A->rmap->N;
890397b6df1SKris Buschelman 
891397b6df1SKris Buschelman   PetscFunctionBegin;
892a5e57a09SHong Zhang   mumps->matstruc = DIFFERENT_NONZERO_PATTERN;
893dcd589f8SShri Abhyankar 
8949a2535b5SHong Zhang   /* Set MUMPS options from the options database */
8959a2535b5SHong Zhang   ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr);
896dcd589f8SShri Abhyankar 
897a5e57a09SHong Zhang   ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr);
898dcd589f8SShri Abhyankar 
89967877ebaSShri Abhyankar   /* analysis phase */
90067877ebaSShri Abhyankar   /*----------------*/
901a5e57a09SHong Zhang   mumps->id.job = JOB_FACTSYMBOLIC;
902a5e57a09SHong Zhang   mumps->id.n   = M;
903a5e57a09SHong Zhang   switch (mumps->id.ICNTL(18)) {
90467877ebaSShri Abhyankar   case 0:  /* centralized assembled matrix input */
905a5e57a09SHong Zhang     if (!mumps->myid) {
906a5e57a09SHong Zhang       mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn;
907a5e57a09SHong Zhang       if (mumps->id.ICNTL(6)>1) {
90867877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
9092907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
910a5e57a09SHong Zhang         mumps->id.a = (mumps_complex*)mumps->val;
9112907cef9SHong Zhang #else
912a5e57a09SHong Zhang         mumps->id.a = (mumps_double_complex*)mumps->val;
9132907cef9SHong Zhang #endif
91467877ebaSShri Abhyankar #else
915a5e57a09SHong Zhang         mumps->id.a = mumps->val;
91667877ebaSShri Abhyankar #endif
91767877ebaSShri Abhyankar       }
918a5e57a09SHong Zhang       if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */
9195248a706SHong Zhang         /*
9205248a706SHong Zhang         PetscBool      flag;
9215248a706SHong Zhang         ierr = ISEqual(r,c,&flag);CHKERRQ(ierr);
9225248a706SHong Zhang         if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm");
9235248a706SHong Zhang         ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF);
9245248a706SHong Zhang          */
925a5e57a09SHong Zhang         if (!mumps->myid) {
926e0b74bf9SHong Zhang           const PetscInt *idx;
927e0b74bf9SHong Zhang           PetscInt       i,*perm_in;
9282205254eSKarl Rupp 
929785e854fSJed Brown           ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr);
930e0b74bf9SHong Zhang           ierr = ISGetIndices(r,&idx);CHKERRQ(ierr);
9312205254eSKarl Rupp 
932a5e57a09SHong Zhang           mumps->id.perm_in = perm_in;
933e0b74bf9SHong Zhang           for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! */
934e0b74bf9SHong Zhang           ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr);
935e0b74bf9SHong Zhang         }
936e0b74bf9SHong Zhang       }
93767877ebaSShri Abhyankar     }
93867877ebaSShri Abhyankar     break;
93967877ebaSShri Abhyankar   case 3:  /* distributed assembled matrix input (size>1) */
940a5e57a09SHong Zhang     mumps->id.nz_loc = mumps->nz;
941a5e57a09SHong Zhang     mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn;
942a5e57a09SHong Zhang     if (mumps->id.ICNTL(6)>1) {
94367877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
9442907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
945a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_complex*)mumps->val;
9462907cef9SHong Zhang #else
947a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_double_complex*)mumps->val;
9482907cef9SHong Zhang #endif
94967877ebaSShri Abhyankar #else
950a5e57a09SHong Zhang       mumps->id.a_loc = mumps->val;
95167877ebaSShri Abhyankar #endif
95267877ebaSShri Abhyankar     }
95367877ebaSShri Abhyankar     /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */
954a5e57a09SHong Zhang     if (!mumps->myid) {
955a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr);
95667877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr);
95767877ebaSShri Abhyankar     } else {
958a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr);
95967877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr);
96067877ebaSShri Abhyankar     }
961c0dedaeaSBarry Smith     ierr = MatGetVecs(A,NULL,&b);CHKERRQ(ierr);
962a5e57a09SHong Zhang     ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr);
9636bf464f9SBarry Smith     ierr = ISDestroy(&is_iden);CHKERRQ(ierr);
9646bf464f9SBarry Smith     ierr = VecDestroy(&b);CHKERRQ(ierr);
96567877ebaSShri Abhyankar     break;
96667877ebaSShri Abhyankar   }
967a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
968a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1));
96967877ebaSShri Abhyankar 
970719d5645SBarry Smith   F->ops->lufactornumeric = MatFactorNumeric_MUMPS;
971dcd589f8SShri Abhyankar   F->ops->solve           = MatSolve_MUMPS;
97251d5961aSHong Zhang   F->ops->solvetranspose  = MatSolveTranspose_MUMPS;
97317f96c7aSHong Zhang   F->ops->matsolve        = 0;  /* use MatMatSolve_Basic() until mumps supports distributed rhs */
974b24902e0SBarry Smith   PetscFunctionReturn(0);
975b24902e0SBarry Smith }
976b24902e0SBarry Smith 
977450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */
978450b117fSShri Abhyankar #undef __FUNCT__
979450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS"
980450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info)
981450b117fSShri Abhyankar {
982a5e57a09SHong Zhang   Mat_MUMPS      *mumps = (Mat_MUMPS*)F->spptr;
983dcd589f8SShri Abhyankar   PetscErrorCode ierr;
98467877ebaSShri Abhyankar   Vec            b;
98567877ebaSShri Abhyankar   IS             is_iden;
98667877ebaSShri Abhyankar   const PetscInt M = A->rmap->N;
987450b117fSShri Abhyankar 
988450b117fSShri Abhyankar   PetscFunctionBegin;
989a5e57a09SHong Zhang   mumps->matstruc = DIFFERENT_NONZERO_PATTERN;
990dcd589f8SShri Abhyankar 
9919a2535b5SHong Zhang   /* Set MUMPS options from the options database */
9929a2535b5SHong Zhang   ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr);
993dcd589f8SShri Abhyankar 
994a5e57a09SHong Zhang   ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr);
99567877ebaSShri Abhyankar 
99667877ebaSShri Abhyankar   /* analysis phase */
99767877ebaSShri Abhyankar   /*----------------*/
998a5e57a09SHong Zhang   mumps->id.job = JOB_FACTSYMBOLIC;
999a5e57a09SHong Zhang   mumps->id.n   = M;
1000a5e57a09SHong Zhang   switch (mumps->id.ICNTL(18)) {
100167877ebaSShri Abhyankar   case 0:  /* centralized assembled matrix input */
1002a5e57a09SHong Zhang     if (!mumps->myid) {
1003a5e57a09SHong Zhang       mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn;
1004a5e57a09SHong Zhang       if (mumps->id.ICNTL(6)>1) {
100567877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
10062907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
1007a5e57a09SHong Zhang         mumps->id.a = (mumps_complex*)mumps->val;
10082907cef9SHong Zhang #else
1009a5e57a09SHong Zhang         mumps->id.a = (mumps_double_complex*)mumps->val;
10102907cef9SHong Zhang #endif
101167877ebaSShri Abhyankar #else
1012a5e57a09SHong Zhang         mumps->id.a = mumps->val;
101367877ebaSShri Abhyankar #endif
101467877ebaSShri Abhyankar       }
101567877ebaSShri Abhyankar     }
101667877ebaSShri Abhyankar     break;
101767877ebaSShri Abhyankar   case 3:  /* distributed assembled matrix input (size>1) */
1018a5e57a09SHong Zhang     mumps->id.nz_loc = mumps->nz;
1019a5e57a09SHong Zhang     mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn;
1020a5e57a09SHong Zhang     if (mumps->id.ICNTL(6)>1) {
102167877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
10222907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
1023a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_complex*)mumps->val;
10242907cef9SHong Zhang #else
1025a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_double_complex*)mumps->val;
10262907cef9SHong Zhang #endif
102767877ebaSShri Abhyankar #else
1028a5e57a09SHong Zhang       mumps->id.a_loc = mumps->val;
102967877ebaSShri Abhyankar #endif
103067877ebaSShri Abhyankar     }
103167877ebaSShri Abhyankar     /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */
1032a5e57a09SHong Zhang     if (!mumps->myid) {
1033a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr);
103467877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr);
103567877ebaSShri Abhyankar     } else {
1036a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr);
103767877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr);
103867877ebaSShri Abhyankar     }
1039c0dedaeaSBarry Smith     ierr = MatGetVecs(A,NULL,&b);CHKERRQ(ierr);
1040a5e57a09SHong Zhang     ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr);
10416bf464f9SBarry Smith     ierr = ISDestroy(&is_iden);CHKERRQ(ierr);
10426bf464f9SBarry Smith     ierr = VecDestroy(&b);CHKERRQ(ierr);
104367877ebaSShri Abhyankar     break;
104467877ebaSShri Abhyankar   }
1045a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
1046a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1));
104767877ebaSShri Abhyankar 
1048450b117fSShri Abhyankar   F->ops->lufactornumeric = MatFactorNumeric_MUMPS;
1049dcd589f8SShri Abhyankar   F->ops->solve           = MatSolve_MUMPS;
105051d5961aSHong Zhang   F->ops->solvetranspose  = MatSolveTranspose_MUMPS;
1051450b117fSShri Abhyankar   PetscFunctionReturn(0);
1052450b117fSShri Abhyankar }
1053b24902e0SBarry Smith 
1054141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */
1055397b6df1SKris Buschelman #undef __FUNCT__
105667877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS"
105767877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info)
1058b24902e0SBarry Smith {
1059a5e57a09SHong Zhang   Mat_MUMPS      *mumps = (Mat_MUMPS*)F->spptr;
1060dcd589f8SShri Abhyankar   PetscErrorCode ierr;
106167877ebaSShri Abhyankar   Vec            b;
106267877ebaSShri Abhyankar   IS             is_iden;
106367877ebaSShri Abhyankar   const PetscInt M = A->rmap->N;
1064397b6df1SKris Buschelman 
1065397b6df1SKris Buschelman   PetscFunctionBegin;
1066a5e57a09SHong Zhang   mumps->matstruc = DIFFERENT_NONZERO_PATTERN;
1067dcd589f8SShri Abhyankar 
10689a2535b5SHong Zhang   /* Set MUMPS options from the options database */
10699a2535b5SHong Zhang   ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr);
1070dcd589f8SShri Abhyankar 
1071a5e57a09SHong Zhang   ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr);
1072dcd589f8SShri Abhyankar 
107367877ebaSShri Abhyankar   /* analysis phase */
107467877ebaSShri Abhyankar   /*----------------*/
1075a5e57a09SHong Zhang   mumps->id.job = JOB_FACTSYMBOLIC;
1076a5e57a09SHong Zhang   mumps->id.n   = M;
1077a5e57a09SHong Zhang   switch (mumps->id.ICNTL(18)) {
107867877ebaSShri Abhyankar   case 0:  /* centralized assembled matrix input */
1079a5e57a09SHong Zhang     if (!mumps->myid) {
1080a5e57a09SHong Zhang       mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn;
1081a5e57a09SHong Zhang       if (mumps->id.ICNTL(6)>1) {
108267877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
10832907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
1084a5e57a09SHong Zhang         mumps->id.a = (mumps_complex*)mumps->val;
10852907cef9SHong Zhang #else
1086a5e57a09SHong Zhang         mumps->id.a = (mumps_double_complex*)mumps->val;
10872907cef9SHong Zhang #endif
108867877ebaSShri Abhyankar #else
1089a5e57a09SHong Zhang         mumps->id.a = mumps->val;
109067877ebaSShri Abhyankar #endif
109167877ebaSShri Abhyankar       }
109267877ebaSShri Abhyankar     }
109367877ebaSShri Abhyankar     break;
109467877ebaSShri Abhyankar   case 3:  /* distributed assembled matrix input (size>1) */
1095a5e57a09SHong Zhang     mumps->id.nz_loc = mumps->nz;
1096a5e57a09SHong Zhang     mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn;
1097a5e57a09SHong Zhang     if (mumps->id.ICNTL(6)>1) {
109867877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
10992907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
1100a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_complex*)mumps->val;
11012907cef9SHong Zhang #else
1102a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_double_complex*)mumps->val;
11032907cef9SHong Zhang #endif
110467877ebaSShri Abhyankar #else
1105a5e57a09SHong Zhang       mumps->id.a_loc = mumps->val;
110667877ebaSShri Abhyankar #endif
110767877ebaSShri Abhyankar     }
110867877ebaSShri Abhyankar     /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */
1109a5e57a09SHong Zhang     if (!mumps->myid) {
1110a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr);
111167877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr);
111267877ebaSShri Abhyankar     } else {
1113a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr);
111467877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr);
111567877ebaSShri Abhyankar     }
1116c0dedaeaSBarry Smith     ierr = MatGetVecs(A,NULL,&b);CHKERRQ(ierr);
1117a5e57a09SHong Zhang     ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr);
11186bf464f9SBarry Smith     ierr = ISDestroy(&is_iden);CHKERRQ(ierr);
11196bf464f9SBarry Smith     ierr = VecDestroy(&b);CHKERRQ(ierr);
112067877ebaSShri Abhyankar     break;
112167877ebaSShri Abhyankar   }
1122a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
1123a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1));
112467877ebaSShri Abhyankar 
11252792810eSHong Zhang   F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS;
1126dcd589f8SShri Abhyankar   F->ops->solve                 = MatSolve_MUMPS;
112751d5961aSHong Zhang   F->ops->solvetranspose        = MatSolve_MUMPS;
112830c107b7SHong Zhang   F->ops->matsolve              = 0; /* use MatMatSolve_Basic() until mumps supports distributed rhs */
1129db4efbfdSBarry Smith #if !defined(PETSC_USE_COMPLEX)
113005aa0992SJose Roman   F->ops->getinertia = MatGetInertia_SBAIJMUMPS;
113105aa0992SJose Roman #else
11320298fd71SBarry Smith   F->ops->getinertia = NULL;
1133db4efbfdSBarry Smith #endif
1134b24902e0SBarry Smith   PetscFunctionReturn(0);
1135b24902e0SBarry Smith }
1136b24902e0SBarry Smith 
1137397b6df1SKris Buschelman #undef __FUNCT__
113864e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS"
113964e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer)
114074ed9c26SBarry Smith {
1141f6c57405SHong Zhang   PetscErrorCode    ierr;
114264e6c443SBarry Smith   PetscBool         iascii;
114364e6c443SBarry Smith   PetscViewerFormat format;
1144a5e57a09SHong Zhang   Mat_MUMPS         *mumps=(Mat_MUMPS*)A->spptr;
1145f6c57405SHong Zhang 
1146f6c57405SHong Zhang   PetscFunctionBegin;
114764e6c443SBarry Smith   /* check if matrix is mumps type */
114864e6c443SBarry Smith   if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0);
114964e6c443SBarry Smith 
1150251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr);
115164e6c443SBarry Smith   if (iascii) {
115264e6c443SBarry Smith     ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr);
115364e6c443SBarry Smith     if (format == PETSC_VIEWER_ASCII_INFO) {
115464e6c443SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr);
1155a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  SYM (matrix type):                   %d \n",mumps->id.sym);CHKERRQ(ierr);
1156a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  PAR (host participation):            %d \n",mumps->id.par);CHKERRQ(ierr);
1157a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(1) (output for error):         %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr);
1158a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr);
1159a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(3) (output for global info):   %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr);
1160a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(4) (level of printing):        %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr);
1161a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(5) (input mat struct):         %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr);
1162a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(6) (matrix prescaling):        %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr);
1163a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr);
1164a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(8) (scalling strategy):        %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr);
1165a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(10) (max num of refinements):  %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr);
1166a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(11) (error analysis):          %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr);
1167a5e57a09SHong Zhang       if (mumps->id.ICNTL(11)>0) {
1168a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(4) (inf norm of input mat):        %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr);
1169a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(5) (inf norm of solution):         %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr);
1170a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(6) (inf norm of residual):         %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr);
1171a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr);
1172a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(9) (error estimate):               %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr);
1173a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr);
1174f6c57405SHong Zhang       }
1175a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(12) (efficiency control):                         %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr);
1176a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(13) (efficiency control):                         %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr);
1177a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr);
1178f6c57405SHong Zhang       /* ICNTL(15-17) not used */
1179a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(18) (input mat struct):                           %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr);
1180a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(19) (Shur complement info):                       %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr);
1181a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(20) (rhs sparse pattern):                         %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr);
1182a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(21) (somumpstion struct):                            %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr);
1183a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(22) (in-core/out-of-core facility):               %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr);
1184a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr);
1185c0165424SHong Zhang 
1186a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(24) (detection of null pivot rows):               %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr);
1187a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(25) (computation of a null space basis):          %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr);
1188a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(26) (Schur options for rhs or solution):          %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr);
1189a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(27) (experimental parameter):                     %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr);
1190a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(28) (use parallel or sequential ordering):        %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr);
1191a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(29) (parallel ordering):                          %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr);
119242179a6aSHong Zhang 
1193a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(30) (user-specified set of entries in inv(A)):    %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr);
1194a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(31) (factors is discarded in the solve phase):    %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr);
1195a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(33) (compute determinant):                        %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr);
1196f6c57405SHong Zhang 
1197a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(1) (relative pivoting threshold):      %g \n",mumps->id.CNTL(1));CHKERRQ(ierr);
1198a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr);
1199a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(3) (absomumpste pivoting threshold):      %g \n",mumps->id.CNTL(3));CHKERRQ(ierr);
1200a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(4) (vamumpse of static pivoting):         %g \n",mumps->id.CNTL(4));CHKERRQ(ierr);
1201a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(5) (fixation for null pivots):         %g \n",mumps->id.CNTL(5));CHKERRQ(ierr);
1202f6c57405SHong Zhang 
1203f6c57405SHong Zhang       /* infomation local to each processor */
120434ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr);
12057b23a99aSBarry Smith       ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
1206a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr);
120734ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
120834ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr);
1209a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d]  %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr);
121034ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
121134ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr);
1212a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d]  %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr);
121334ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
1214f6c57405SHong Zhang 
121534ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr);
1216a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"  [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr);
121734ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
1218f6c57405SHong Zhang 
121934ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr);
1220a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr);
122134ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
1222f6c57405SHong Zhang 
122334ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr);
1224a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr);
122534ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
12267b23a99aSBarry Smith       ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr);
1227f6c57405SHong Zhang 
1228a5e57a09SHong Zhang       if (!mumps->myid) { /* information from the host */
1229a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr);
1230a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr);
1231a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr);
1232a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr);
1233f6c57405SHong Zhang 
1234a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr);
1235a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr);
1236a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr);
1237a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr);
1238a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr);
1239a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr);
1240a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr);
1241a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr);
1242a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr);
1243a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr);
1244a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr);
1245a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr);
1246a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr);
1247a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr);
1248a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr);
1249a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr);
1250a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr);
1251a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr);
1252a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr);
1253a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr);
1254a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr);
1255a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr);
1256a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr);
1257f6c57405SHong Zhang       }
1258f6c57405SHong Zhang     }
1259cb828f0fSHong Zhang   }
1260f6c57405SHong Zhang   PetscFunctionReturn(0);
1261f6c57405SHong Zhang }
1262f6c57405SHong Zhang 
126335bd34faSBarry Smith #undef __FUNCT__
126435bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS"
126535bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info)
126635bd34faSBarry Smith {
1267cb828f0fSHong Zhang   Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr;
126835bd34faSBarry Smith 
126935bd34faSBarry Smith   PetscFunctionBegin;
127035bd34faSBarry Smith   info->block_size        = 1.0;
1271cb828f0fSHong Zhang   info->nz_allocated      = mumps->id.INFOG(20);
1272cb828f0fSHong Zhang   info->nz_used           = mumps->id.INFOG(20);
127335bd34faSBarry Smith   info->nz_unneeded       = 0.0;
127435bd34faSBarry Smith   info->assemblies        = 0.0;
127535bd34faSBarry Smith   info->mallocs           = 0.0;
127635bd34faSBarry Smith   info->memory            = 0.0;
127735bd34faSBarry Smith   info->fill_ratio_given  = 0;
127835bd34faSBarry Smith   info->fill_ratio_needed = 0;
127935bd34faSBarry Smith   info->factor_mallocs    = 0;
128035bd34faSBarry Smith   PetscFunctionReturn(0);
128135bd34faSBarry Smith }
128235bd34faSBarry Smith 
12835ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/
12845ccb76cbSHong Zhang #undef __FUNCT__
12855ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS"
12865ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival)
12875ccb76cbSHong Zhang {
1288a5e57a09SHong Zhang   Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr;
12895ccb76cbSHong Zhang 
12905ccb76cbSHong Zhang   PetscFunctionBegin;
1291a5e57a09SHong Zhang   mumps->id.ICNTL(icntl) = ival;
12925ccb76cbSHong Zhang   PetscFunctionReturn(0);
12935ccb76cbSHong Zhang }
12945ccb76cbSHong Zhang 
12955ccb76cbSHong Zhang #undef __FUNCT__
12965ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl"
12975ccb76cbSHong Zhang /*@
12985ccb76cbSHong Zhang   MatMumpsSetIcntl - Set MUMPS parameter ICNTL()
12995ccb76cbSHong Zhang 
13005ccb76cbSHong Zhang    Logically Collective on Mat
13015ccb76cbSHong Zhang 
13025ccb76cbSHong Zhang    Input Parameters:
13035ccb76cbSHong Zhang +  F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface
13045ccb76cbSHong Zhang .  icntl - index of MUMPS parameter array ICNTL()
13055ccb76cbSHong Zhang -  ival - value of MUMPS ICNTL(icntl)
13065ccb76cbSHong Zhang 
13075ccb76cbSHong Zhang   Options Database:
13085ccb76cbSHong Zhang .   -mat_mumps_icntl_<icntl> <ival>
13095ccb76cbSHong Zhang 
13105ccb76cbSHong Zhang    Level: beginner
13115ccb76cbSHong Zhang 
13125ccb76cbSHong Zhang    References: MUMPS Users' Guide
13135ccb76cbSHong Zhang 
13145ccb76cbSHong Zhang .seealso: MatGetFactor()
13155ccb76cbSHong Zhang @*/
13165ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival)
13175ccb76cbSHong Zhang {
13185ccb76cbSHong Zhang   PetscErrorCode ierr;
13195ccb76cbSHong Zhang 
13205ccb76cbSHong Zhang   PetscFunctionBegin;
13215ccb76cbSHong Zhang   PetscValidLogicalCollectiveInt(F,icntl,2);
13225ccb76cbSHong Zhang   PetscValidLogicalCollectiveInt(F,ival,3);
13235ccb76cbSHong Zhang   ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr);
13245ccb76cbSHong Zhang   PetscFunctionReturn(0);
13255ccb76cbSHong Zhang }
13265ccb76cbSHong Zhang 
13278928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/
13288928b65cSHong Zhang #undef __FUNCT__
13298928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS"
13308928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val)
13318928b65cSHong Zhang {
13328928b65cSHong Zhang   Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr;
13338928b65cSHong Zhang 
13348928b65cSHong Zhang   PetscFunctionBegin;
13358928b65cSHong Zhang   mumps->id.CNTL(icntl) = val;
13368928b65cSHong Zhang   PetscFunctionReturn(0);
13378928b65cSHong Zhang }
13388928b65cSHong Zhang 
13398928b65cSHong Zhang #undef __FUNCT__
13408928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl"
13418928b65cSHong Zhang /*@
13428928b65cSHong Zhang   MatMumpsSetCntl - Set MUMPS parameter CNTL()
13438928b65cSHong Zhang 
13448928b65cSHong Zhang    Logically Collective on Mat
13458928b65cSHong Zhang 
13468928b65cSHong Zhang    Input Parameters:
13478928b65cSHong Zhang +  F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface
13488928b65cSHong Zhang .  icntl - index of MUMPS parameter array CNTL()
13498928b65cSHong Zhang -  val - value of MUMPS CNTL(icntl)
13508928b65cSHong Zhang 
13518928b65cSHong Zhang   Options Database:
13528928b65cSHong Zhang .   -mat_mumps_cntl_<icntl> <val>
13538928b65cSHong Zhang 
13548928b65cSHong Zhang    Level: beginner
13558928b65cSHong Zhang 
13568928b65cSHong Zhang    References: MUMPS Users' Guide
13578928b65cSHong Zhang 
13588928b65cSHong Zhang .seealso: MatGetFactor()
13598928b65cSHong Zhang @*/
13608928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val)
13618928b65cSHong Zhang {
13628928b65cSHong Zhang   PetscErrorCode ierr;
13638928b65cSHong Zhang 
13648928b65cSHong Zhang   PetscFunctionBegin;
13658928b65cSHong Zhang   PetscValidLogicalCollectiveInt(F,icntl,2);
13668928b65cSHong Zhang   PetscValidLogicalCollectiveInt(F,val,3);
13678928b65cSHong Zhang   ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr);
13688928b65cSHong Zhang   PetscFunctionReturn(0);
13698928b65cSHong Zhang }
13708928b65cSHong Zhang 
/*MC
  MATSOLVERMUMPS -  A matrix type providing direct solvers (LU and Cholesky) for
  distributed and sequential matrices via the external package MUMPS.

  Works with MATAIJ and MATSBAIJ matrices

  Options Database Keys:
+ -mat_mumps_icntl_4 <0,...,4> - print level
. -mat_mumps_icntl_6 <0,...,7> - matrix prescaling options (see MUMPS User's Guide)
. -mat_mumps_icntl_7 <0,...,7> - matrix orderings (see MUMPS User's Guide)
. -mat_mumps_icntl_9 <1,2> - A or A^T x=b to be solved: 1 denotes A, 2 denotes A^T
. -mat_mumps_icntl_10 <n> - maximum number of iterative refinements
. -mat_mumps_icntl_11 <n> - error analysis, a positive value returns statistics during -ksp_view
. -mat_mumps_icntl_12 <n> - efficiency control (see MUMPS User's Guide)
. -mat_mumps_icntl_13 <n> - efficiency control (see MUMPS User's Guide)
. -mat_mumps_icntl_14 <n> - percentage of estimated workspace increase (see MUMPS User's Guide)
. -mat_mumps_icntl_15 <n> - efficiency control (see MUMPS User's Guide)
. -mat_mumps_cntl_1 <delta> - relative pivoting threshold
. -mat_mumps_cntl_2 <tol> - stopping criterion for refinement
- -mat_mumps_cntl_3 <adelta> - absolute pivoting threshold

  Level: beginner

.seealso: PCFactorSetMatSolverPackage(), MatSolverPackage

M*/
139724b6179bSKris Buschelman 
139835bd34faSBarry Smith #undef __FUNCT__
139935bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps"
1400f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type)
140135bd34faSBarry Smith {
140235bd34faSBarry Smith   PetscFunctionBegin;
14032692d6eeSBarry Smith   *type = MATSOLVERMUMPS;
140435bd34faSBarry Smith   PetscFunctionReturn(0);
140535bd34faSBarry Smith }
140635bd34faSBarry Smith 
1407bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */
14082877fffaSHong Zhang #undef __FUNCT__
1409bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps"
14108cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F)
14112877fffaSHong Zhang {
14122877fffaSHong Zhang   Mat            B;
14132877fffaSHong Zhang   PetscErrorCode ierr;
14142877fffaSHong Zhang   Mat_MUMPS      *mumps;
1415ace3abfcSBarry Smith   PetscBool      isSeqAIJ;
14162877fffaSHong Zhang 
14172877fffaSHong Zhang   PetscFunctionBegin;
14182877fffaSHong Zhang   /* Create the factorization matrix */
1419251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr);
1420ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr);
14212877fffaSHong Zhang   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
14222877fffaSHong Zhang   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
1423bccb9932SShri Abhyankar   if (isSeqAIJ) {
14240298fd71SBarry Smith     ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr);
1425bccb9932SShri Abhyankar   } else {
14260298fd71SBarry Smith     ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr);
1427bccb9932SShri Abhyankar   }
14282877fffaSHong Zhang 
1429b00a9115SJed Brown   ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr);
14302205254eSKarl Rupp 
14312877fffaSHong Zhang   B->ops->view    = MatView_MUMPS;
143235bd34faSBarry Smith   B->ops->getinfo = MatGetInfo_MUMPS;
14332205254eSKarl Rupp 
1434bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr);
1435bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr);
1436bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr);
1437450b117fSShri Abhyankar   if (ftype == MAT_FACTOR_LU) {
1438450b117fSShri Abhyankar     B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS;
1439d5f3da31SBarry Smith     B->factortype            = MAT_FACTOR_LU;
1440bccb9932SShri Abhyankar     if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij;
1441bccb9932SShri Abhyankar     else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij;
1442746480a1SHong Zhang     mumps->sym = 0;
1443dcd589f8SShri Abhyankar   } else {
144467877ebaSShri Abhyankar     B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS;
1445450b117fSShri Abhyankar     B->factortype                  = MAT_FACTOR_CHOLESKY;
1446bccb9932SShri Abhyankar     if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij;
1447bccb9932SShri Abhyankar     else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij;
14486fdc2a6dSBarry Smith     if (A->spd_set && A->spd) mumps->sym = 1;
14496fdc2a6dSBarry Smith     else                      mumps->sym = 2;
1450450b117fSShri Abhyankar   }
14512877fffaSHong Zhang 
14522877fffaSHong Zhang   mumps->isAIJ    = PETSC_TRUE;
1453bf0cc555SLisandro Dalcin   mumps->Destroy  = B->ops->destroy;
14542877fffaSHong Zhang   B->ops->destroy = MatDestroy_MUMPS;
14552877fffaSHong Zhang   B->spptr        = (void*)mumps;
14562205254eSKarl Rupp 
1457f697e70eSHong Zhang   ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr);
1458746480a1SHong Zhang 
14592877fffaSHong Zhang   *F = B;
14602877fffaSHong Zhang   PetscFunctionReturn(0);
14612877fffaSHong Zhang }
14622877fffaSHong Zhang 
1463bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */
14642877fffaSHong Zhang #undef __FUNCT__
1465bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps"
14668cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F)
14672877fffaSHong Zhang {
14682877fffaSHong Zhang   Mat            B;
14692877fffaSHong Zhang   PetscErrorCode ierr;
14702877fffaSHong Zhang   Mat_MUMPS      *mumps;
1471ace3abfcSBarry Smith   PetscBool      isSeqSBAIJ;
14722877fffaSHong Zhang 
14732877fffaSHong Zhang   PetscFunctionBegin;
1474ce94432eSBarry Smith   if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix");
1475ce94432eSBarry Smith   if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead");
1476251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr);
14772877fffaSHong Zhang   /* Create the factorization matrix */
1478ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr);
14792877fffaSHong Zhang   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
14802877fffaSHong Zhang   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
1481b00a9115SJed Brown   ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr);
1482bccb9932SShri Abhyankar   if (isSeqSBAIJ) {
14830298fd71SBarry Smith     ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr);
14842205254eSKarl Rupp 
148516ebf90aSShri Abhyankar     mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij;
1486dcd589f8SShri Abhyankar   } else {
14870298fd71SBarry Smith     ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr);
14882205254eSKarl Rupp 
1489bccb9932SShri Abhyankar     mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij;
1490bccb9932SShri Abhyankar   }
1491bccb9932SShri Abhyankar 
149267877ebaSShri Abhyankar   B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS;
1493bccb9932SShri Abhyankar   B->ops->view                   = MatView_MUMPS;
14942205254eSKarl Rupp 
1495bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr);
1496bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl);CHKERRQ(ierr);
1497bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl);CHKERRQ(ierr);
14982205254eSKarl Rupp 
1499f4762488SHong Zhang   B->factortype = MAT_FACTOR_CHOLESKY;
15006fdc2a6dSBarry Smith   if (A->spd_set && A->spd) mumps->sym = 1;
15016fdc2a6dSBarry Smith   else                      mumps->sym = 2;
1502a214ac2aSShri Abhyankar 
1503bccb9932SShri Abhyankar   mumps->isAIJ    = PETSC_FALSE;
1504bf0cc555SLisandro Dalcin   mumps->Destroy  = B->ops->destroy;
1505f3c0ef26SHong Zhang   B->ops->destroy = MatDestroy_MUMPS;
15062877fffaSHong Zhang   B->spptr        = (void*)mumps;
15072205254eSKarl Rupp 
1508f697e70eSHong Zhang   ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr);
1509746480a1SHong Zhang 
15102877fffaSHong Zhang   *F = B;
15112877fffaSHong Zhang   PetscFunctionReturn(0);
15122877fffaSHong Zhang }
151397969023SHong Zhang 
1514450b117fSShri Abhyankar #undef __FUNCT__
1515bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps"
15168cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F)
151767877ebaSShri Abhyankar {
151867877ebaSShri Abhyankar   Mat            B;
151967877ebaSShri Abhyankar   PetscErrorCode ierr;
152067877ebaSShri Abhyankar   Mat_MUMPS      *mumps;
1521ace3abfcSBarry Smith   PetscBool      isSeqBAIJ;
152267877ebaSShri Abhyankar 
152367877ebaSShri Abhyankar   PetscFunctionBegin;
152467877ebaSShri Abhyankar   /* Create the factorization matrix */
1525251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr);
1526ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr);
152767877ebaSShri Abhyankar   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
152867877ebaSShri Abhyankar   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
1529bccb9932SShri Abhyankar   if (isSeqBAIJ) {
15300298fd71SBarry Smith     ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr);
1531bccb9932SShri Abhyankar   } else {
15320298fd71SBarry Smith     ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr);
1533bccb9932SShri Abhyankar   }
1534450b117fSShri Abhyankar 
1535b00a9115SJed Brown   ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr);
1536450b117fSShri Abhyankar   if (ftype == MAT_FACTOR_LU) {
1537450b117fSShri Abhyankar     B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS;
1538450b117fSShri Abhyankar     B->factortype            = MAT_FACTOR_LU;
1539bccb9932SShri Abhyankar     if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij;
1540bccb9932SShri Abhyankar     else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij;
1541746480a1SHong Zhang     mumps->sym = 0;
1542f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n");
1543bccb9932SShri Abhyankar 
1544450b117fSShri Abhyankar   B->ops->view = MatView_MUMPS;
15452205254eSKarl Rupp 
1546bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr);
1547bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr);
1548bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr);
1549450b117fSShri Abhyankar 
1550450b117fSShri Abhyankar   mumps->isAIJ    = PETSC_TRUE;
1551bf0cc555SLisandro Dalcin   mumps->Destroy  = B->ops->destroy;
1552450b117fSShri Abhyankar   B->ops->destroy = MatDestroy_MUMPS;
1553450b117fSShri Abhyankar   B->spptr        = (void*)mumps;
15542205254eSKarl Rupp 
1555f697e70eSHong Zhang   ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr);
1556746480a1SHong Zhang 
1557450b117fSShri Abhyankar   *F = B;
1558450b117fSShri Abhyankar   PetscFunctionReturn(0);
1559450b117fSShri Abhyankar }
1560a214ac2aSShri Abhyankar 
1561