xref: /petsc/src/mat/impls/aij/mpi/mumps/mumps.c (revision eb9baa12dd270b0fce613d417379d2060a8326f8)
11c2a3de1SBarry Smith 
2397b6df1SKris Buschelman /*
3c2b5dc30SHong Zhang     Provides an interface to the MUMPS sparse solver
4397b6df1SKris Buschelman */
551d5961aSHong Zhang 
6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I  "petscmat.h"  I*/
7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h>
8397b6df1SKris Buschelman 
9397b6df1SKris Buschelman EXTERN_C_BEGIN
10397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
112907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
122907cef9SHong Zhang #include <cmumps_c.h>
132907cef9SHong Zhang #else
14c6db04a5SJed Brown #include <zmumps_c.h>
152907cef9SHong Zhang #endif
162907cef9SHong Zhang #else
172907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
182907cef9SHong Zhang #include <smumps_c.h>
19397b6df1SKris Buschelman #else
20c6db04a5SJed Brown #include <dmumps_c.h>
21397b6df1SKris Buschelman #endif
222907cef9SHong Zhang #endif
23397b6df1SKris Buschelman EXTERN_C_END
24397b6df1SKris Buschelman #define JOB_INIT -1
253d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1
263d472b54SHong Zhang #define JOB_FACTNUMERIC 2
273d472b54SHong Zhang #define JOB_SOLVE 3
28397b6df1SKris Buschelman #define JOB_END -2
293d472b54SHong Zhang 
302907cef9SHong Zhang /* calls to MUMPS */
312907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX)
322907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
332907cef9SHong Zhang #define PetscMUMPS_c cmumps_c
342907cef9SHong Zhang #else
352907cef9SHong Zhang #define PetscMUMPS_c zmumps_c
362907cef9SHong Zhang #endif
372907cef9SHong Zhang #else
382907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
392907cef9SHong Zhang #define PetscMUMPS_c smumps_c
402907cef9SHong Zhang #else
412907cef9SHong Zhang #define PetscMUMPS_c dmumps_c
422907cef9SHong Zhang #endif
432907cef9SHong Zhang #endif
442907cef9SHong Zhang 
453d472b54SHong Zhang 
46397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */
47397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1]
48397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1]
49397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1]
50a7aca84bSHong Zhang #define INFO(I) info[(I)-1]
51397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1]
52adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1]
53397b6df1SKris Buschelman 
54397b6df1SKris Buschelman typedef struct {
55397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
562907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
572907cef9SHong Zhang   CMUMPS_STRUC_C id;
582907cef9SHong Zhang #else
59397b6df1SKris Buschelman   ZMUMPS_STRUC_C id;
602907cef9SHong Zhang #endif
612907cef9SHong Zhang #else
622907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
632907cef9SHong Zhang   SMUMPS_STRUC_C id;
64397b6df1SKris Buschelman #else
65397b6df1SKris Buschelman   DMUMPS_STRUC_C id;
66397b6df1SKris Buschelman #endif
672907cef9SHong Zhang #endif
682907cef9SHong Zhang 
69397b6df1SKris Buschelman   MatStructure matstruc;
70c1490034SHong Zhang   PetscMPIInt  myid,size;
71a5e57a09SHong Zhang   PetscInt     *irn,*jcn,nz,sym;
72397b6df1SKris Buschelman   PetscScalar  *val;
73397b6df1SKris Buschelman   MPI_Comm     comm_mumps;
74329ec9b3SHong Zhang   VecScatter   scat_rhs, scat_sol;
7564e6c443SBarry Smith   PetscBool    isAIJ,CleanUpMUMPS;
76329ec9b3SHong Zhang   Vec          b_seq,x_seq;
77a5e57a09SHong Zhang   PetscInt     ICNTL9_pre;   /* check if ICNTL(9) is changed from previous MatSolve */
782205254eSKarl Rupp 
79bf0cc555SLisandro Dalcin   PetscErrorCode (*Destroy)(Mat);
80bccb9932SShri Abhyankar   PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**);
81f0c56d0fSKris Buschelman } Mat_MUMPS;
82f0c56d0fSKris Buschelman 
8309573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*);
84b24902e0SBarry Smith 
8567877ebaSShri Abhyankar 
8667877ebaSShri Abhyankar /* MatConvertToTriples_A_B */
8767877ebaSShri Abhyankar /*convert Petsc matrix to triples: row[nz], col[nz], val[nz] */
88397b6df1SKris Buschelman /*
89397b6df1SKris Buschelman   input:
9067877ebaSShri Abhyankar     A       - matrix in aij,baij or sbaij (bs=1) format
91397b6df1SKris Buschelman     shift   - 0: C style output triple; 1: Fortran style output triple.
92bccb9932SShri Abhyankar     reuse   - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple
93bccb9932SShri Abhyankar               MAT_REUSE_MATRIX:   only the values in v array are updated
94397b6df1SKris Buschelman   output:
95397b6df1SKris Buschelman     nnz     - dim of r, c, and v (number of local nonzero entries of A)
96397b6df1SKris Buschelman     r, c, v - row and col index, matrix values (matrix triples)
97*eb9baa12SBarry Smith 
98*eb9baa12SBarry Smith   The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is
99*eb9baa12SBarry Smith   freed with PetscFree((mumps->irn);  This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means
100*eb9baa12SBarry Smith   that the PetscMalloc() cannot easily be replaced with a PetscMalloc3().
101*eb9baa12SBarry Smith 
102397b6df1SKris Buschelman  */
10316ebf90aSShri Abhyankar 
10416ebf90aSShri Abhyankar #undef __FUNCT__
10516ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij"
106bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
107b24902e0SBarry Smith {
108185f6596SHong Zhang   const PetscInt *ai,*aj,*ajj,M=A->rmap->n;
10967877ebaSShri Abhyankar   PetscInt       nz,rnz,i,j;
110dfbe8321SBarry Smith   PetscErrorCode ierr;
111c1490034SHong Zhang   PetscInt       *row,*col;
11216ebf90aSShri Abhyankar   Mat_SeqAIJ     *aa=(Mat_SeqAIJ*)A->data;
113397b6df1SKris Buschelman 
114397b6df1SKris Buschelman   PetscFunctionBegin;
11516ebf90aSShri Abhyankar   *v=aa->a;
116bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
1172205254eSKarl Rupp     nz   = aa->nz;
1182205254eSKarl Rupp     ai   = aa->i;
1192205254eSKarl Rupp     aj   = aa->j;
12016ebf90aSShri Abhyankar     *nnz = nz;
121185f6596SHong Zhang     ierr = PetscMalloc(2*nz*sizeof(PetscInt), &row);CHKERRQ(ierr);
122185f6596SHong Zhang     col  = row + nz;
123185f6596SHong Zhang 
12416ebf90aSShri Abhyankar     nz = 0;
12516ebf90aSShri Abhyankar     for (i=0; i<M; i++) {
12616ebf90aSShri Abhyankar       rnz = ai[i+1] - ai[i];
12767877ebaSShri Abhyankar       ajj = aj + ai[i];
12867877ebaSShri Abhyankar       for (j=0; j<rnz; j++) {
12967877ebaSShri Abhyankar         row[nz] = i+shift; col[nz++] = ajj[j] + shift;
13016ebf90aSShri Abhyankar       }
13116ebf90aSShri Abhyankar     }
13216ebf90aSShri Abhyankar     *r = row; *c = col;
13316ebf90aSShri Abhyankar   }
13416ebf90aSShri Abhyankar   PetscFunctionReturn(0);
13516ebf90aSShri Abhyankar }
136397b6df1SKris Buschelman 
13716ebf90aSShri Abhyankar #undef __FUNCT__
13867877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij"
139bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
14067877ebaSShri Abhyankar {
14167877ebaSShri Abhyankar   Mat_SeqBAIJ    *aa=(Mat_SeqBAIJ*)A->data;
14267877ebaSShri Abhyankar   const PetscInt *ai,*aj,*ajj,bs=A->rmap->bs,bs2=aa->bs2,M=A->rmap->N/bs;
1430ad0caddSJed Brown   PetscInt       nz,idx=0,rnz,i,j,k,m;
14467877ebaSShri Abhyankar   PetscErrorCode ierr;
14567877ebaSShri Abhyankar   PetscInt       *row,*col;
14667877ebaSShri Abhyankar 
14767877ebaSShri Abhyankar   PetscFunctionBegin;
148cf3759fdSShri Abhyankar   *v = aa->a;
149bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
150cf3759fdSShri Abhyankar     ai   = aa->i; aj = aa->j;
15167877ebaSShri Abhyankar     nz   = bs2*aa->nz;
15267877ebaSShri Abhyankar     *nnz = nz;
153185f6596SHong Zhang     ierr = PetscMalloc(2*nz*sizeof(PetscInt), &row);CHKERRQ(ierr);
154185f6596SHong Zhang     col  = row + nz;
155185f6596SHong Zhang 
15667877ebaSShri Abhyankar     for (i=0; i<M; i++) {
15767877ebaSShri Abhyankar       ajj = aj + ai[i];
15867877ebaSShri Abhyankar       rnz = ai[i+1] - ai[i];
15967877ebaSShri Abhyankar       for (k=0; k<rnz; k++) {
16067877ebaSShri Abhyankar         for (j=0; j<bs; j++) {
16167877ebaSShri Abhyankar           for (m=0; m<bs; m++) {
16267877ebaSShri Abhyankar             row[idx]   = i*bs + m + shift;
163cf3759fdSShri Abhyankar             col[idx++] = bs*(ajj[k]) + j + shift;
16467877ebaSShri Abhyankar           }
16567877ebaSShri Abhyankar         }
16667877ebaSShri Abhyankar       }
16767877ebaSShri Abhyankar     }
168cf3759fdSShri Abhyankar     *r = row; *c = col;
16967877ebaSShri Abhyankar   }
17067877ebaSShri Abhyankar   PetscFunctionReturn(0);
17167877ebaSShri Abhyankar }
17267877ebaSShri Abhyankar 
17367877ebaSShri Abhyankar #undef __FUNCT__
17416ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij"
175bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
17616ebf90aSShri Abhyankar {
17767877ebaSShri Abhyankar   const PetscInt *ai, *aj,*ajj,M=A->rmap->n;
17867877ebaSShri Abhyankar   PetscInt       nz,rnz,i,j;
17916ebf90aSShri Abhyankar   PetscErrorCode ierr;
18016ebf90aSShri Abhyankar   PetscInt       *row,*col;
18116ebf90aSShri Abhyankar   Mat_SeqSBAIJ   *aa=(Mat_SeqSBAIJ*)A->data;
18216ebf90aSShri Abhyankar 
18316ebf90aSShri Abhyankar   PetscFunctionBegin;
184882afa5aSHong Zhang   *v = aa->a;
185bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
1862205254eSKarl Rupp     nz   = aa->nz;
1872205254eSKarl Rupp     ai   = aa->i;
1882205254eSKarl Rupp     aj   = aa->j;
1892205254eSKarl Rupp     *v   = aa->a;
19016ebf90aSShri Abhyankar     *nnz = nz;
191185f6596SHong Zhang     ierr = PetscMalloc(2*nz*sizeof(PetscInt), &row);CHKERRQ(ierr);
192185f6596SHong Zhang     col  = row + nz;
193185f6596SHong Zhang 
19416ebf90aSShri Abhyankar     nz = 0;
19516ebf90aSShri Abhyankar     for (i=0; i<M; i++) {
19616ebf90aSShri Abhyankar       rnz = ai[i+1] - ai[i];
19767877ebaSShri Abhyankar       ajj = aj + ai[i];
19867877ebaSShri Abhyankar       for (j=0; j<rnz; j++) {
19967877ebaSShri Abhyankar         row[nz] = i+shift; col[nz++] = ajj[j] + shift;
20016ebf90aSShri Abhyankar       }
20116ebf90aSShri Abhyankar     }
20216ebf90aSShri Abhyankar     *r = row; *c = col;
20316ebf90aSShri Abhyankar   }
20416ebf90aSShri Abhyankar   PetscFunctionReturn(0);
20516ebf90aSShri Abhyankar }
20616ebf90aSShri Abhyankar 
20716ebf90aSShri Abhyankar #undef __FUNCT__
20816ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij"
209bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
21016ebf90aSShri Abhyankar {
21167877ebaSShri Abhyankar   const PetscInt    *ai,*aj,*ajj,*adiag,M=A->rmap->n;
21267877ebaSShri Abhyankar   PetscInt          nz,rnz,i,j;
21367877ebaSShri Abhyankar   const PetscScalar *av,*v1;
21416ebf90aSShri Abhyankar   PetscScalar       *val;
21516ebf90aSShri Abhyankar   PetscErrorCode    ierr;
21616ebf90aSShri Abhyankar   PetscInt          *row,*col;
21716ebf90aSShri Abhyankar   Mat_SeqSBAIJ      *aa=(Mat_SeqSBAIJ*)A->data;
21816ebf90aSShri Abhyankar 
21916ebf90aSShri Abhyankar   PetscFunctionBegin;
22016ebf90aSShri Abhyankar   ai   =aa->i; aj=aa->j;av=aa->a;
22116ebf90aSShri Abhyankar   adiag=aa->diag;
222bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
22316ebf90aSShri Abhyankar     nz   = M + (aa->nz-M)/2;
22416ebf90aSShri Abhyankar     *nnz = nz;
225185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
226185f6596SHong Zhang     col  = row + nz;
227185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
228185f6596SHong Zhang 
22916ebf90aSShri Abhyankar     nz = 0;
23016ebf90aSShri Abhyankar     for (i=0; i<M; i++) {
23116ebf90aSShri Abhyankar       rnz = ai[i+1] - adiag[i];
23267877ebaSShri Abhyankar       ajj = aj + adiag[i];
233cf3759fdSShri Abhyankar       v1  = av + adiag[i];
23467877ebaSShri Abhyankar       for (j=0; j<rnz; j++) {
23567877ebaSShri Abhyankar         row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j];
23616ebf90aSShri Abhyankar       }
23716ebf90aSShri Abhyankar     }
23816ebf90aSShri Abhyankar     *r = row; *c = col; *v = val;
239397b6df1SKris Buschelman   } else {
24016ebf90aSShri Abhyankar     nz = 0; val = *v;
24116ebf90aSShri Abhyankar     for (i=0; i <M; i++) {
24216ebf90aSShri Abhyankar       rnz = ai[i+1] - adiag[i];
24367877ebaSShri Abhyankar       ajj = aj + adiag[i];
24467877ebaSShri Abhyankar       v1  = av + adiag[i];
24567877ebaSShri Abhyankar       for (j=0; j<rnz; j++) {
24667877ebaSShri Abhyankar         val[nz++] = v1[j];
24716ebf90aSShri Abhyankar       }
24816ebf90aSShri Abhyankar     }
24916ebf90aSShri Abhyankar   }
25016ebf90aSShri Abhyankar   PetscFunctionReturn(0);
25116ebf90aSShri Abhyankar }
25216ebf90aSShri Abhyankar 
25316ebf90aSShri Abhyankar #undef __FUNCT__
25416ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij"
255bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
25616ebf90aSShri Abhyankar {
25716ebf90aSShri Abhyankar   const PetscInt    *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj;
25816ebf90aSShri Abhyankar   PetscErrorCode    ierr;
25916ebf90aSShri Abhyankar   PetscInt          rstart,nz,i,j,jj,irow,countA,countB;
26016ebf90aSShri Abhyankar   PetscInt          *row,*col;
26116ebf90aSShri Abhyankar   const PetscScalar *av, *bv,*v1,*v2;
26216ebf90aSShri Abhyankar   PetscScalar       *val;
263397b6df1SKris Buschelman   Mat_MPISBAIJ      *mat = (Mat_MPISBAIJ*)A->data;
264397b6df1SKris Buschelman   Mat_SeqSBAIJ      *aa  = (Mat_SeqSBAIJ*)(mat->A)->data;
265397b6df1SKris Buschelman   Mat_SeqBAIJ       *bb  = (Mat_SeqBAIJ*)(mat->B)->data;
26616ebf90aSShri Abhyankar 
26716ebf90aSShri Abhyankar   PetscFunctionBegin;
268d0f46423SBarry Smith   ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart;
269397b6df1SKris Buschelman   av=aa->a; bv=bb->a;
270397b6df1SKris Buschelman 
2712205254eSKarl Rupp   garray = mat->garray;
2722205254eSKarl Rupp 
273bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
27416ebf90aSShri Abhyankar     nz   = aa->nz + bb->nz;
27516ebf90aSShri Abhyankar     *nnz = nz;
276185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
277185f6596SHong Zhang     col  = row + nz;
278185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
279185f6596SHong Zhang 
280397b6df1SKris Buschelman     *r = row; *c = col; *v = val;
281397b6df1SKris Buschelman   } else {
282397b6df1SKris Buschelman     row = *r; col = *c; val = *v;
283397b6df1SKris Buschelman   }
284397b6df1SKris Buschelman 
285028e57e8SHong Zhang   jj = 0; irow = rstart;
286397b6df1SKris Buschelman   for (i=0; i<m; i++) {
287397b6df1SKris Buschelman     ajj    = aj + ai[i];                 /* ptr to the beginning of this row */
288397b6df1SKris Buschelman     countA = ai[i+1] - ai[i];
289397b6df1SKris Buschelman     countB = bi[i+1] - bi[i];
290397b6df1SKris Buschelman     bjj    = bj + bi[i];
29116ebf90aSShri Abhyankar     v1     = av + ai[i];
29216ebf90aSShri Abhyankar     v2     = bv + bi[i];
293397b6df1SKris Buschelman 
294397b6df1SKris Buschelman     /* A-part */
295397b6df1SKris Buschelman     for (j=0; j<countA; j++) {
296bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
297397b6df1SKris Buschelman         row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift;
298397b6df1SKris Buschelman       }
29916ebf90aSShri Abhyankar       val[jj++] = v1[j];
300397b6df1SKris Buschelman     }
30116ebf90aSShri Abhyankar 
30216ebf90aSShri Abhyankar     /* B-part */
30316ebf90aSShri Abhyankar     for (j=0; j < countB; j++) {
304bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
305397b6df1SKris Buschelman         row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift;
306397b6df1SKris Buschelman       }
30716ebf90aSShri Abhyankar       val[jj++] = v2[j];
30816ebf90aSShri Abhyankar     }
30916ebf90aSShri Abhyankar     irow++;
31016ebf90aSShri Abhyankar   }
31116ebf90aSShri Abhyankar   PetscFunctionReturn(0);
31216ebf90aSShri Abhyankar }
31316ebf90aSShri Abhyankar 
31416ebf90aSShri Abhyankar #undef __FUNCT__
31516ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij"
316bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
31716ebf90aSShri Abhyankar {
31816ebf90aSShri Abhyankar   const PetscInt    *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj;
31916ebf90aSShri Abhyankar   PetscErrorCode    ierr;
32016ebf90aSShri Abhyankar   PetscInt          rstart,nz,i,j,jj,irow,countA,countB;
32116ebf90aSShri Abhyankar   PetscInt          *row,*col;
32216ebf90aSShri Abhyankar   const PetscScalar *av, *bv,*v1,*v2;
32316ebf90aSShri Abhyankar   PetscScalar       *val;
32416ebf90aSShri Abhyankar   Mat_MPIAIJ        *mat = (Mat_MPIAIJ*)A->data;
32516ebf90aSShri Abhyankar   Mat_SeqAIJ        *aa  = (Mat_SeqAIJ*)(mat->A)->data;
32616ebf90aSShri Abhyankar   Mat_SeqAIJ        *bb  = (Mat_SeqAIJ*)(mat->B)->data;
32716ebf90aSShri Abhyankar 
32816ebf90aSShri Abhyankar   PetscFunctionBegin;
32916ebf90aSShri Abhyankar   ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart;
33016ebf90aSShri Abhyankar   av=aa->a; bv=bb->a;
33116ebf90aSShri Abhyankar 
3322205254eSKarl Rupp   garray = mat->garray;
3332205254eSKarl Rupp 
334bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
33516ebf90aSShri Abhyankar     nz   = aa->nz + bb->nz;
33616ebf90aSShri Abhyankar     *nnz = nz;
337185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
338185f6596SHong Zhang     col  = row + nz;
339185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
340185f6596SHong Zhang 
34116ebf90aSShri Abhyankar     *r = row; *c = col; *v = val;
34216ebf90aSShri Abhyankar   } else {
34316ebf90aSShri Abhyankar     row = *r; col = *c; val = *v;
34416ebf90aSShri Abhyankar   }
34516ebf90aSShri Abhyankar 
34616ebf90aSShri Abhyankar   jj = 0; irow = rstart;
34716ebf90aSShri Abhyankar   for (i=0; i<m; i++) {
34816ebf90aSShri Abhyankar     ajj    = aj + ai[i];                 /* ptr to the beginning of this row */
34916ebf90aSShri Abhyankar     countA = ai[i+1] - ai[i];
35016ebf90aSShri Abhyankar     countB = bi[i+1] - bi[i];
35116ebf90aSShri Abhyankar     bjj    = bj + bi[i];
35216ebf90aSShri Abhyankar     v1     = av + ai[i];
35316ebf90aSShri Abhyankar     v2     = bv + bi[i];
35416ebf90aSShri Abhyankar 
35516ebf90aSShri Abhyankar     /* A-part */
35616ebf90aSShri Abhyankar     for (j=0; j<countA; j++) {
357bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
35816ebf90aSShri Abhyankar         row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift;
35916ebf90aSShri Abhyankar       }
36016ebf90aSShri Abhyankar       val[jj++] = v1[j];
36116ebf90aSShri Abhyankar     }
36216ebf90aSShri Abhyankar 
36316ebf90aSShri Abhyankar     /* B-part */
36416ebf90aSShri Abhyankar     for (j=0; j < countB; j++) {
365bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
36616ebf90aSShri Abhyankar         row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift;
36716ebf90aSShri Abhyankar       }
36816ebf90aSShri Abhyankar       val[jj++] = v2[j];
36916ebf90aSShri Abhyankar     }
37016ebf90aSShri Abhyankar     irow++;
37116ebf90aSShri Abhyankar   }
37216ebf90aSShri Abhyankar   PetscFunctionReturn(0);
37316ebf90aSShri Abhyankar }
37416ebf90aSShri Abhyankar 
37516ebf90aSShri Abhyankar #undef __FUNCT__
37667877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij"
377bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
37867877ebaSShri Abhyankar {
37967877ebaSShri Abhyankar   Mat_MPIBAIJ       *mat    = (Mat_MPIBAIJ*)A->data;
38067877ebaSShri Abhyankar   Mat_SeqBAIJ       *aa     = (Mat_SeqBAIJ*)(mat->A)->data;
38167877ebaSShri Abhyankar   Mat_SeqBAIJ       *bb     = (Mat_SeqBAIJ*)(mat->B)->data;
38267877ebaSShri Abhyankar   const PetscInt    *ai     = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj;
383d985c460SShri Abhyankar   const PetscInt    *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart;
38467877ebaSShri Abhyankar   const PetscInt    bs      = A->rmap->bs,bs2=mat->bs2;
38567877ebaSShri Abhyankar   PetscErrorCode    ierr;
38667877ebaSShri Abhyankar   PetscInt          nz,i,j,k,n,jj,irow,countA,countB,idx;
38767877ebaSShri Abhyankar   PetscInt          *row,*col;
38867877ebaSShri Abhyankar   const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2;
38967877ebaSShri Abhyankar   PetscScalar       *val;
39067877ebaSShri Abhyankar 
39167877ebaSShri Abhyankar   PetscFunctionBegin;
392bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
39367877ebaSShri Abhyankar     nz   = bs2*(aa->nz + bb->nz);
39467877ebaSShri Abhyankar     *nnz = nz;
395185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
396185f6596SHong Zhang     col  = row + nz;
397185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
398185f6596SHong Zhang 
39967877ebaSShri Abhyankar     *r = row; *c = col; *v = val;
40067877ebaSShri Abhyankar   } else {
40167877ebaSShri Abhyankar     row = *r; col = *c; val = *v;
40267877ebaSShri Abhyankar   }
40367877ebaSShri Abhyankar 
404d985c460SShri Abhyankar   jj = 0; irow = rstart;
40567877ebaSShri Abhyankar   for (i=0; i<mbs; i++) {
40667877ebaSShri Abhyankar     countA = ai[i+1] - ai[i];
40767877ebaSShri Abhyankar     countB = bi[i+1] - bi[i];
40867877ebaSShri Abhyankar     ajj    = aj + ai[i];
40967877ebaSShri Abhyankar     bjj    = bj + bi[i];
41067877ebaSShri Abhyankar     v1     = av + bs2*ai[i];
41167877ebaSShri Abhyankar     v2     = bv + bs2*bi[i];
41267877ebaSShri Abhyankar 
41367877ebaSShri Abhyankar     idx = 0;
41467877ebaSShri Abhyankar     /* A-part */
41567877ebaSShri Abhyankar     for (k=0; k<countA; k++) {
41667877ebaSShri Abhyankar       for (j=0; j<bs; j++) {
41767877ebaSShri Abhyankar         for (n=0; n<bs; n++) {
418bccb9932SShri Abhyankar           if (reuse == MAT_INITIAL_MATRIX) {
419d985c460SShri Abhyankar             row[jj] = irow + n + shift;
420d985c460SShri Abhyankar             col[jj] = rstart + bs*ajj[k] + j + shift;
42167877ebaSShri Abhyankar           }
42267877ebaSShri Abhyankar           val[jj++] = v1[idx++];
42367877ebaSShri Abhyankar         }
42467877ebaSShri Abhyankar       }
42567877ebaSShri Abhyankar     }
42667877ebaSShri Abhyankar 
42767877ebaSShri Abhyankar     idx = 0;
42867877ebaSShri Abhyankar     /* B-part */
42967877ebaSShri Abhyankar     for (k=0; k<countB; k++) {
43067877ebaSShri Abhyankar       for (j=0; j<bs; j++) {
43167877ebaSShri Abhyankar         for (n=0; n<bs; n++) {
432bccb9932SShri Abhyankar           if (reuse == MAT_INITIAL_MATRIX) {
433d985c460SShri Abhyankar             row[jj] = irow + n + shift;
434d985c460SShri Abhyankar             col[jj] = bs*garray[bjj[k]] + j + shift;
43567877ebaSShri Abhyankar           }
436d985c460SShri Abhyankar           val[jj++] = v2[idx++];
43767877ebaSShri Abhyankar         }
43867877ebaSShri Abhyankar       }
43967877ebaSShri Abhyankar     }
440d985c460SShri Abhyankar     irow += bs;
44167877ebaSShri Abhyankar   }
44267877ebaSShri Abhyankar   PetscFunctionReturn(0);
44367877ebaSShri Abhyankar }
44467877ebaSShri Abhyankar 
44567877ebaSShri Abhyankar #undef __FUNCT__
44616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij"
447bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v)
44816ebf90aSShri Abhyankar {
44916ebf90aSShri Abhyankar   const PetscInt    *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj;
45016ebf90aSShri Abhyankar   PetscErrorCode    ierr;
451e0bace9bSHong Zhang   PetscInt          rstart,nz,nza,nzb,i,j,jj,irow,countA,countB;
45216ebf90aSShri Abhyankar   PetscInt          *row,*col;
45316ebf90aSShri Abhyankar   const PetscScalar *av, *bv,*v1,*v2;
45416ebf90aSShri Abhyankar   PetscScalar       *val;
45516ebf90aSShri Abhyankar   Mat_MPIAIJ        *mat =  (Mat_MPIAIJ*)A->data;
45616ebf90aSShri Abhyankar   Mat_SeqAIJ        *aa  =(Mat_SeqAIJ*)(mat->A)->data;
45716ebf90aSShri Abhyankar   Mat_SeqAIJ        *bb  =(Mat_SeqAIJ*)(mat->B)->data;
45816ebf90aSShri Abhyankar 
45916ebf90aSShri Abhyankar   PetscFunctionBegin;
46016ebf90aSShri Abhyankar   ai=aa->i; aj=aa->j; adiag=aa->diag;
46116ebf90aSShri Abhyankar   bi=bb->i; bj=bb->j; garray = mat->garray;
46216ebf90aSShri Abhyankar   av=aa->a; bv=bb->a;
4632205254eSKarl Rupp 
46416ebf90aSShri Abhyankar   rstart = A->rmap->rstart;
46516ebf90aSShri Abhyankar 
466bccb9932SShri Abhyankar   if (reuse == MAT_INITIAL_MATRIX) {
467e0bace9bSHong Zhang     nza = 0;    /* num of upper triangular entries in mat->A, including diagonals */
468e0bace9bSHong Zhang     nzb = 0;    /* num of upper triangular entries in mat->B */
46916ebf90aSShri Abhyankar     for (i=0; i<m; i++) {
470e0bace9bSHong Zhang       nza   += (ai[i+1] - adiag[i]);
47116ebf90aSShri Abhyankar       countB = bi[i+1] - bi[i];
47216ebf90aSShri Abhyankar       bjj    = bj + bi[i];
473e0bace9bSHong Zhang       for (j=0; j<countB; j++) {
474e0bace9bSHong Zhang         if (garray[bjj[j]] > rstart) nzb++;
475e0bace9bSHong Zhang       }
476e0bace9bSHong Zhang     }
47716ebf90aSShri Abhyankar 
478e0bace9bSHong Zhang     nz   = nza + nzb; /* total nz of upper triangular part of mat */
47916ebf90aSShri Abhyankar     *nnz = nz;
480185f6596SHong Zhang     ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr);
481185f6596SHong Zhang     col  = row + nz;
482185f6596SHong Zhang     val  = (PetscScalar*)(col + nz);
483185f6596SHong Zhang 
48416ebf90aSShri Abhyankar     *r = row; *c = col; *v = val;
48516ebf90aSShri Abhyankar   } else {
48616ebf90aSShri Abhyankar     row = *r; col = *c; val = *v;
48716ebf90aSShri Abhyankar   }
48816ebf90aSShri Abhyankar 
48916ebf90aSShri Abhyankar   jj = 0; irow = rstart;
49016ebf90aSShri Abhyankar   for (i=0; i<m; i++) {
49116ebf90aSShri Abhyankar     ajj    = aj + adiag[i];                 /* ptr to the beginning of the diagonal of this row */
49216ebf90aSShri Abhyankar     v1     = av + adiag[i];
49316ebf90aSShri Abhyankar     countA = ai[i+1] - adiag[i];
49416ebf90aSShri Abhyankar     countB = bi[i+1] - bi[i];
49516ebf90aSShri Abhyankar     bjj    = bj + bi[i];
49616ebf90aSShri Abhyankar     v2     = bv + bi[i];
49716ebf90aSShri Abhyankar 
49816ebf90aSShri Abhyankar     /* A-part */
49916ebf90aSShri Abhyankar     for (j=0; j<countA; j++) {
500bccb9932SShri Abhyankar       if (reuse == MAT_INITIAL_MATRIX) {
50116ebf90aSShri Abhyankar         row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift;
50216ebf90aSShri Abhyankar       }
50316ebf90aSShri Abhyankar       val[jj++] = v1[j];
50416ebf90aSShri Abhyankar     }
50516ebf90aSShri Abhyankar 
50616ebf90aSShri Abhyankar     /* B-part */
50716ebf90aSShri Abhyankar     for (j=0; j < countB; j++) {
50816ebf90aSShri Abhyankar       if (garray[bjj[j]] > rstart) {
509bccb9932SShri Abhyankar         if (reuse == MAT_INITIAL_MATRIX) {
51016ebf90aSShri Abhyankar           row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift;
51116ebf90aSShri Abhyankar         }
51216ebf90aSShri Abhyankar         val[jj++] = v2[j];
51316ebf90aSShri Abhyankar       }
514397b6df1SKris Buschelman     }
515397b6df1SKris Buschelman     irow++;
516397b6df1SKris Buschelman   }
517397b6df1SKris Buschelman   PetscFunctionReturn(0);
518397b6df1SKris Buschelman }
519397b6df1SKris Buschelman 
520397b6df1SKris Buschelman #undef __FUNCT__
5213924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS"
522dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A)
523dfbe8321SBarry Smith {
524a5e57a09SHong Zhang   Mat_MUMPS      *mumps=(Mat_MUMPS*)A->spptr;
525dfbe8321SBarry Smith   PetscErrorCode ierr;
526b24902e0SBarry Smith 
527397b6df1SKris Buschelman   PetscFunctionBegin;
528a5e57a09SHong Zhang   if (mumps->CleanUpMUMPS) {
529397b6df1SKris Buschelman     /* Terminate instance, deallocate memories */
530a5e57a09SHong Zhang     ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr);
531a5e57a09SHong Zhang     ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr);
532a5e57a09SHong Zhang     ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr);
533a5e57a09SHong Zhang     ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr);
534a5e57a09SHong Zhang     ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr);
535a5e57a09SHong Zhang     ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr);
536a5e57a09SHong Zhang     ierr = PetscFree(mumps->irn);CHKERRQ(ierr);
5372205254eSKarl Rupp 
538a5e57a09SHong Zhang     mumps->id.job = JOB_END;
539a5e57a09SHong Zhang     PetscMUMPS_c(&mumps->id);
540a5e57a09SHong Zhang     ierr = MPI_Comm_free(&(mumps->comm_mumps));CHKERRQ(ierr);
541397b6df1SKris Buschelman   }
542a5e57a09SHong Zhang   if (mumps->Destroy) {
543a5e57a09SHong Zhang     ierr = (mumps->Destroy)(A);CHKERRQ(ierr);
544bf0cc555SLisandro Dalcin   }
545bf0cc555SLisandro Dalcin   ierr = PetscFree(A->spptr);CHKERRQ(ierr);
546bf0cc555SLisandro Dalcin 
54797969023SHong Zhang   /* clear composed functions */
548bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr);
549bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr);
550bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr);
551397b6df1SKris Buschelman   PetscFunctionReturn(0);
552397b6df1SKris Buschelman }
553397b6df1SKris Buschelman 
554397b6df1SKris Buschelman #undef __FUNCT__
555f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS"
556b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x)
557b24902e0SBarry Smith {
558a5e57a09SHong Zhang   Mat_MUMPS        *mumps=(Mat_MUMPS*)A->spptr;
559d54de34fSKris Buschelman   PetscScalar      *array;
56067877ebaSShri Abhyankar   Vec              b_seq;
561329ec9b3SHong Zhang   IS               is_iden,is_petsc;
562dfbe8321SBarry Smith   PetscErrorCode   ierr;
563329ec9b3SHong Zhang   PetscInt         i;
564883f2eb9SBarry Smith   static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE;
565397b6df1SKris Buschelman 
566397b6df1SKris Buschelman   PetscFunctionBegin;
567883f2eb9SBarry Smith   ierr = PetscCitationsRegister("@article{MUMPS01,\n  author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n  title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n  journal = {SIAM Journal on Matrix Analysis and Applications},\n  volume = {23},\n  number = {1},\n  pages = {15--41},\n  year = {2001}\n}\n",&cite1);CHKERRQ(ierr);
568883f2eb9SBarry Smith   ierr = PetscCitationsRegister("@article{MUMPS02,\n  author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n  title = {Hybrid scheduling for the parallel solution of linear systems},\n  journal = {Parallel Computing},\n  volume = {32},\n  number = {2},\n  pages = {136--156},\n  year = {2006}\n}\n",&cite2);CHKERRQ(ierr);
569a5e57a09SHong Zhang   mumps->id.nrhs = 1;
570a5e57a09SHong Zhang   b_seq          = mumps->b_seq;
571a5e57a09SHong Zhang   if (mumps->size > 1) {
572329ec9b3SHong Zhang     /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */
573a5e57a09SHong Zhang     ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
574a5e57a09SHong Zhang     ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
575a5e57a09SHong Zhang     if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);}
576397b6df1SKris Buschelman   } else {  /* size == 1 */
577397b6df1SKris Buschelman     ierr = VecCopy(b,x);CHKERRQ(ierr);
578397b6df1SKris Buschelman     ierr = VecGetArray(x,&array);CHKERRQ(ierr);
579397b6df1SKris Buschelman   }
580a5e57a09SHong Zhang   if (!mumps->myid) { /* define rhs on the host */
581a5e57a09SHong Zhang     mumps->id.nrhs = 1;
582397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
5832907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
584a5e57a09SHong Zhang     mumps->id.rhs = (mumps_complex*)array;
5852907cef9SHong Zhang #else
586a5e57a09SHong Zhang     mumps->id.rhs = (mumps_double_complex*)array;
5872907cef9SHong Zhang #endif
588397b6df1SKris Buschelman #else
589a5e57a09SHong Zhang     mumps->id.rhs = array;
590397b6df1SKris Buschelman #endif
591397b6df1SKris Buschelman   }
592397b6df1SKris Buschelman 
593397b6df1SKris Buschelman   /* solve phase */
594329ec9b3SHong Zhang   /*-------------*/
595a5e57a09SHong Zhang   mumps->id.job = JOB_SOLVE;
596a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
597a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1));
598397b6df1SKris Buschelman 
599a5e57a09SHong Zhang   if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */
600a5e57a09SHong Zhang     if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) {
601a5e57a09SHong Zhang       /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */
602a5e57a09SHong Zhang       ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr);
603397b6df1SKris Buschelman     }
604a5e57a09SHong Zhang     if (!mumps->scat_sol) { /* create scatter scat_sol */
605a5e57a09SHong Zhang       ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */
606a5e57a09SHong Zhang       for (i=0; i<mumps->id.lsol_loc; i++) {
607a5e57a09SHong Zhang         mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */
608a5e57a09SHong Zhang       }
609a5e57a09SHong Zhang       ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr);  /* to */
610a5e57a09SHong Zhang       ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr);
6116bf464f9SBarry Smith       ierr = ISDestroy(&is_iden);CHKERRQ(ierr);
6126bf464f9SBarry Smith       ierr = ISDestroy(&is_petsc);CHKERRQ(ierr);
6132205254eSKarl Rupp 
614a5e57a09SHong Zhang       mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */
615397b6df1SKris Buschelman     }
616a5e57a09SHong Zhang 
617a5e57a09SHong Zhang     ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
618a5e57a09SHong Zhang     ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
619329ec9b3SHong Zhang   }
620397b6df1SKris Buschelman   PetscFunctionReturn(0);
621397b6df1SKris Buschelman }
622397b6df1SKris Buschelman 
62351d5961aSHong Zhang #undef __FUNCT__
62451d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS"
62551d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x)
62651d5961aSHong Zhang {
627a5e57a09SHong Zhang   Mat_MUMPS      *mumps=(Mat_MUMPS*)A->spptr;
62851d5961aSHong Zhang   PetscErrorCode ierr;
62951d5961aSHong Zhang 
63051d5961aSHong Zhang   PetscFunctionBegin;
631a5e57a09SHong Zhang   mumps->id.ICNTL(9) = 0;
6322205254eSKarl Rupp 
6330ad0caddSJed Brown   ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr);
6342205254eSKarl Rupp 
635a5e57a09SHong Zhang   mumps->id.ICNTL(9) = 1;
63651d5961aSHong Zhang   PetscFunctionReturn(0);
63751d5961aSHong Zhang }
63851d5961aSHong Zhang 
639e0b74bf9SHong Zhang #undef __FUNCT__
640e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS"
641e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X)
642e0b74bf9SHong Zhang {
643bda8bf91SBarry Smith   PetscErrorCode ierr;
644bda8bf91SBarry Smith   PetscBool      flg;
645bda8bf91SBarry Smith 
646e0b74bf9SHong Zhang   PetscFunctionBegin;
6470298fd71SBarry Smith   ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr);
648ce94432eSBarry Smith   if (!flg) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix");
6490298fd71SBarry Smith   ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr);
650ce94432eSBarry Smith   if (!flg) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix");
6512205254eSKarl Rupp   SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MatMatSolve_MUMPS() is not implemented yet");
652e0b74bf9SHong Zhang   PetscFunctionReturn(0);
653e0b74bf9SHong Zhang }
654e0b74bf9SHong Zhang 
655ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX)
656a58c3f20SHong Zhang /*
657a58c3f20SHong Zhang   input:
658a58c3f20SHong Zhang    F:        numeric factor
659a58c3f20SHong Zhang   output:
660a58c3f20SHong Zhang    nneg:     total number of negative pivots
661a58c3f20SHong Zhang    nzero:    0
662a58c3f20SHong Zhang    npos:     (global dimension of F) - nneg
663a58c3f20SHong Zhang */
664a58c3f20SHong Zhang 
665a58c3f20SHong Zhang #undef __FUNCT__
666a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS"
667dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos)
668a58c3f20SHong Zhang {
669a5e57a09SHong Zhang   Mat_MUMPS      *mumps =(Mat_MUMPS*)F->spptr;
670dfbe8321SBarry Smith   PetscErrorCode ierr;
671c1490034SHong Zhang   PetscMPIInt    size;
672a58c3f20SHong Zhang 
673a58c3f20SHong Zhang   PetscFunctionBegin;
674ce94432eSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr);
675bcb30aebSHong Zhang   /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */
676a5e57a09SHong Zhang   if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13));
677a58c3f20SHong Zhang   if (nneg) {
678a5e57a09SHong Zhang     if (!mumps->myid) {
679a5e57a09SHong Zhang       *nneg = mumps->id.INFOG(12);
680a58c3f20SHong Zhang     }
681a5e57a09SHong Zhang     ierr = MPI_Bcast(nneg,1,MPI_INT,0,mumps->comm_mumps);CHKERRQ(ierr);
682a58c3f20SHong Zhang   }
683a58c3f20SHong Zhang   if (nzero) *nzero = 0;
684d0f46423SBarry Smith   if (npos)  *npos  = F->rmap->N - (*nneg);
685a58c3f20SHong Zhang   PetscFunctionReturn(0);
686a58c3f20SHong Zhang }
687ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */
688a58c3f20SHong Zhang 
689397b6df1SKris Buschelman #undef __FUNCT__
690f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS"
6910481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info)
692af281ebdSHong Zhang {
693a5e57a09SHong Zhang   Mat_MUMPS      *mumps =(Mat_MUMPS*)(F)->spptr;
6946849ba73SBarry Smith   PetscErrorCode ierr;
695e09efc27SHong Zhang   Mat            F_diag;
696ace3abfcSBarry Smith   PetscBool      isMPIAIJ;
697397b6df1SKris Buschelman 
698397b6df1SKris Buschelman   PetscFunctionBegin;
699a5e57a09SHong Zhang   ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr);
700397b6df1SKris Buschelman 
701397b6df1SKris Buschelman   /* numerical factorization phase */
702329ec9b3SHong Zhang   /*-------------------------------*/
703a5e57a09SHong Zhang   mumps->id.job = JOB_FACTNUMERIC;
704a5e57a09SHong Zhang   if (!mumps->id.ICNTL(18)) {
705a5e57a09SHong Zhang     if (!mumps->myid) {
706397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
7072907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
708a5e57a09SHong Zhang       mumps->id.a = (mumps_complex*)mumps->val;
7092907cef9SHong Zhang #else
710a5e57a09SHong Zhang       mumps->id.a = (mumps_double_complex*)mumps->val;
7112907cef9SHong Zhang #endif
712397b6df1SKris Buschelman #else
713a5e57a09SHong Zhang       mumps->id.a = mumps->val;
714397b6df1SKris Buschelman #endif
715397b6df1SKris Buschelman     }
716397b6df1SKris Buschelman   } else {
717397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX)
7182907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
719a5e57a09SHong Zhang     mumps->id.a_loc = (mumps_complex*)mumps->val;
7202907cef9SHong Zhang #else
721a5e57a09SHong Zhang     mumps->id.a_loc = (mumps_double_complex*)mumps->val;
7222907cef9SHong Zhang #endif
723397b6df1SKris Buschelman #else
724a5e57a09SHong Zhang     mumps->id.a_loc = mumps->val;
725397b6df1SKris Buschelman #endif
726397b6df1SKris Buschelman   }
727a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
728a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) {
729a5e57a09SHong Zhang     if (mumps->id.INFO(1) == -13) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",mumps->id.INFO(2));
730a5e57a09SHong Zhang     else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2));
731397b6df1SKris Buschelman   }
732a5e57a09SHong Zhang   if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"  mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16));
733397b6df1SKris Buschelman 
734a5e57a09SHong Zhang   if (mumps->size > 1) {
735251f4c67SDmitry Karpeev     ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr);
7362205254eSKarl Rupp     if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A;
7372205254eSKarl Rupp     else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A;
738e09efc27SHong Zhang     F_diag->assembled = PETSC_TRUE;
739a5e57a09SHong Zhang     if (mumps->scat_sol) {
740a5e57a09SHong Zhang       ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr);
741a5e57a09SHong Zhang       ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr);
742a5e57a09SHong Zhang       ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr);
743329ec9b3SHong Zhang     }
7448ada1bb4SHong Zhang   }
745dcd589f8SShri Abhyankar   (F)->assembled      = PETSC_TRUE;
746a5e57a09SHong Zhang   mumps->matstruc     = SAME_NONZERO_PATTERN;
747a5e57a09SHong Zhang   mumps->CleanUpMUMPS = PETSC_TRUE;
74867877ebaSShri Abhyankar 
749a5e57a09SHong Zhang   if (mumps->size > 1) {
75067877ebaSShri Abhyankar     /* distributed solution */
751a5e57a09SHong Zhang     if (!mumps->scat_sol) {
75267877ebaSShri Abhyankar       /* Create x_seq=sol_loc for repeated use */
75367877ebaSShri Abhyankar       PetscInt    lsol_loc;
75467877ebaSShri Abhyankar       PetscScalar *sol_loc;
7552205254eSKarl Rupp 
756a5e57a09SHong Zhang       lsol_loc = mumps->id.INFO(23); /* length of sol_loc */
7572205254eSKarl Rupp 
758a5e57a09SHong Zhang       ierr = PetscMalloc2(lsol_loc,PetscScalar,&sol_loc,lsol_loc,PetscInt,&mumps->id.isol_loc);CHKERRQ(ierr);
7592205254eSKarl Rupp 
760a5e57a09SHong Zhang       mumps->id.lsol_loc = lsol_loc;
76167877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
7622907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
763a5e57a09SHong Zhang       mumps->id.sol_loc = (mumps_complex*)sol_loc;
7642907cef9SHong Zhang #else
765a5e57a09SHong Zhang       mumps->id.sol_loc = (mumps_double_complex*)sol_loc;
7662907cef9SHong Zhang #endif
76767877ebaSShri Abhyankar #else
768a5e57a09SHong Zhang       mumps->id.sol_loc = sol_loc;
76967877ebaSShri Abhyankar #endif
770a5e57a09SHong Zhang       ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr);
77167877ebaSShri Abhyankar     }
77267877ebaSShri Abhyankar   }
773397b6df1SKris Buschelman   PetscFunctionReturn(0);
774397b6df1SKris Buschelman }
775397b6df1SKris Buschelman 
7769a2535b5SHong Zhang /* Sets MUMPS options from the options database */
777dcd589f8SShri Abhyankar #undef __FUNCT__
7789a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions"
7799a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A)
780dcd589f8SShri Abhyankar {
7819a2535b5SHong Zhang   Mat_MUMPS      *mumps = (Mat_MUMPS*)F->spptr;
782dcd589f8SShri Abhyankar   PetscErrorCode ierr;
783dcd589f8SShri Abhyankar   PetscInt       icntl;
784ace3abfcSBarry Smith   PetscBool      flg;
785dcd589f8SShri Abhyankar 
786dcd589f8SShri Abhyankar   PetscFunctionBegin;
787ce94432eSBarry Smith   ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr);
7889a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr);
7899a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(1) = icntl;
7909a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr);
7919a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(2) = icntl;
7929a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr);
7939a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(3) = icntl;
794dcd589f8SShri Abhyankar 
7959a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr);
7969a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(4) = icntl;
7979a2535b5SHong Zhang   if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */
7989a2535b5SHong Zhang 
7999a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permuting and/or scaling the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr);
8009a2535b5SHong Zhang   if (flg) mumps->id.ICNTL(6) = icntl;
8019a2535b5SHong Zhang 
8029a2535b5SHong Zhang   ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): matrix ordering (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr);
803dcd589f8SShri Abhyankar   if (flg) {
8042205254eSKarl Rupp     if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n");
8052205254eSKarl Rupp     else mumps->id.ICNTL(7) = icntl;
806dcd589f8SShri Abhyankar   }
807e0b74bf9SHong Zhang 
8080298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr);
8090298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr);
8100298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to the linear system solved (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr);
8110298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): efficiency control: defines the ordering strategy with scaling constraints (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr);
8120298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): efficiency control: with or without ScaLAPACK","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr);
8130298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage of estimated workspace increase","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr);
8140298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr);
8159a2535b5SHong Zhang 
8160298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core facility (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr);
8170298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr);
8180298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr);
8199a2535b5SHong Zhang   if (mumps->id.ICNTL(24)) {
8209a2535b5SHong Zhang     mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */
821d7ebd59bSHong Zhang   }
822d7ebd59bSHong Zhang 
8230298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): computation of a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr);
8240298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): Schur options for right-hand side or solution vector","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr);
8250298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): experimental parameter","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr);
8260298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr);
8270298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr);
8280298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr);
8290298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): factors can be discarded in the solve phase","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr);
8300298fd71SBarry Smith   ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr);
831dcd589f8SShri Abhyankar 
8320298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr);
8330298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr);
8340298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr);
8350298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr);
8360298fd71SBarry Smith   ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr);
837e5bb22a1SHong Zhang 
8380298fd71SBarry Smith   ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL);
839dcd589f8SShri Abhyankar   PetscOptionsEnd();
840dcd589f8SShri Abhyankar   PetscFunctionReturn(0);
841dcd589f8SShri Abhyankar }
842dcd589f8SShri Abhyankar 
843dcd589f8SShri Abhyankar #undef __FUNCT__
844dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS"
845f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps)
846dcd589f8SShri Abhyankar {
847dcd589f8SShri Abhyankar   PetscErrorCode ierr;
848dcd589f8SShri Abhyankar 
849dcd589f8SShri Abhyankar   PetscFunctionBegin;
850ce94432eSBarry Smith   ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid);
851ce94432eSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr);
852ce94432eSBarry Smith   ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr);
8532205254eSKarl Rupp 
854f697e70eSHong Zhang   mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps);
855f697e70eSHong Zhang 
856f697e70eSHong Zhang   mumps->id.job = JOB_INIT;
857f697e70eSHong Zhang   mumps->id.par = 1;  /* host participates factorizaton and solve */
858f697e70eSHong Zhang   mumps->id.sym = mumps->sym;
8592907cef9SHong Zhang   PetscMUMPS_c(&mumps->id);
860f697e70eSHong Zhang 
861f697e70eSHong Zhang   mumps->CleanUpMUMPS = PETSC_FALSE;
8620298fd71SBarry Smith   mumps->scat_rhs     = NULL;
8630298fd71SBarry Smith   mumps->scat_sol     = NULL;
8649a2535b5SHong Zhang 
86570544d5fSHong Zhang   /* set PETSc-MUMPS default options - override MUMPS default */
8669a2535b5SHong Zhang   mumps->id.ICNTL(3) = 0;
8679a2535b5SHong Zhang   mumps->id.ICNTL(4) = 0;
8689a2535b5SHong Zhang   if (mumps->size == 1) {
8699a2535b5SHong Zhang     mumps->id.ICNTL(18) = 0;   /* centralized assembled matrix input */
8709a2535b5SHong Zhang   } else {
8719a2535b5SHong Zhang     mumps->id.ICNTL(18) = 3;   /* distributed assembled matrix input */
87270544d5fSHong Zhang     mumps->id.ICNTL(21) = 1;   /* distributed solution */
8739a2535b5SHong Zhang   }
874dcd589f8SShri Abhyankar   PetscFunctionReturn(0);
875dcd589f8SShri Abhyankar }
876dcd589f8SShri Abhyankar 
877a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */
878397b6df1SKris Buschelman #undef __FUNCT__
879f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS"
8800481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info)
881b24902e0SBarry Smith {
882a5e57a09SHong Zhang   Mat_MUMPS      *mumps = (Mat_MUMPS*)F->spptr;
883dcd589f8SShri Abhyankar   PetscErrorCode ierr;
88467877ebaSShri Abhyankar   Vec            b;
88567877ebaSShri Abhyankar   IS             is_iden;
88667877ebaSShri Abhyankar   const PetscInt M = A->rmap->N;
887397b6df1SKris Buschelman 
888397b6df1SKris Buschelman   PetscFunctionBegin;
889a5e57a09SHong Zhang   mumps->matstruc = DIFFERENT_NONZERO_PATTERN;
890dcd589f8SShri Abhyankar 
8919a2535b5SHong Zhang   /* Set MUMPS options from the options database */
8929a2535b5SHong Zhang   ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr);
893dcd589f8SShri Abhyankar 
894a5e57a09SHong Zhang   ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr);
895dcd589f8SShri Abhyankar 
89667877ebaSShri Abhyankar   /* analysis phase */
89767877ebaSShri Abhyankar   /*----------------*/
898a5e57a09SHong Zhang   mumps->id.job = JOB_FACTSYMBOLIC;
899a5e57a09SHong Zhang   mumps->id.n   = M;
900a5e57a09SHong Zhang   switch (mumps->id.ICNTL(18)) {
90167877ebaSShri Abhyankar   case 0:  /* centralized assembled matrix input */
902a5e57a09SHong Zhang     if (!mumps->myid) {
903a5e57a09SHong Zhang       mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn;
904a5e57a09SHong Zhang       if (mumps->id.ICNTL(6)>1) {
90567877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
9062907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
907a5e57a09SHong Zhang         mumps->id.a = (mumps_complex*)mumps->val;
9082907cef9SHong Zhang #else
909a5e57a09SHong Zhang         mumps->id.a = (mumps_double_complex*)mumps->val;
9102907cef9SHong Zhang #endif
91167877ebaSShri Abhyankar #else
912a5e57a09SHong Zhang         mumps->id.a = mumps->val;
91367877ebaSShri Abhyankar #endif
91467877ebaSShri Abhyankar       }
915a5e57a09SHong Zhang       if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */
9165248a706SHong Zhang         /*
9175248a706SHong Zhang         PetscBool      flag;
9185248a706SHong Zhang         ierr = ISEqual(r,c,&flag);CHKERRQ(ierr);
9195248a706SHong Zhang         if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm");
9205248a706SHong Zhang         ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF);
9215248a706SHong Zhang          */
922a5e57a09SHong Zhang         if (!mumps->myid) {
923e0b74bf9SHong Zhang           const PetscInt *idx;
924e0b74bf9SHong Zhang           PetscInt       i,*perm_in;
9252205254eSKarl Rupp 
926e0b74bf9SHong Zhang           ierr = PetscMalloc(M*sizeof(PetscInt),&perm_in);CHKERRQ(ierr);
927e0b74bf9SHong Zhang           ierr = ISGetIndices(r,&idx);CHKERRQ(ierr);
9282205254eSKarl Rupp 
929a5e57a09SHong Zhang           mumps->id.perm_in = perm_in;
930e0b74bf9SHong Zhang           for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! */
931e0b74bf9SHong Zhang           ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr);
932e0b74bf9SHong Zhang         }
933e0b74bf9SHong Zhang       }
93467877ebaSShri Abhyankar     }
93567877ebaSShri Abhyankar     break;
93667877ebaSShri Abhyankar   case 3:  /* distributed assembled matrix input (size>1) */
937a5e57a09SHong Zhang     mumps->id.nz_loc = mumps->nz;
938a5e57a09SHong Zhang     mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn;
939a5e57a09SHong Zhang     if (mumps->id.ICNTL(6)>1) {
94067877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
9412907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
942a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_complex*)mumps->val;
9432907cef9SHong Zhang #else
944a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_double_complex*)mumps->val;
9452907cef9SHong Zhang #endif
94667877ebaSShri Abhyankar #else
947a5e57a09SHong Zhang       mumps->id.a_loc = mumps->val;
94867877ebaSShri Abhyankar #endif
94967877ebaSShri Abhyankar     }
95067877ebaSShri Abhyankar     /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */
951a5e57a09SHong Zhang     if (!mumps->myid) {
952a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr);
95367877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr);
95467877ebaSShri Abhyankar     } else {
955a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr);
95667877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr);
95767877ebaSShri Abhyankar     }
958ce94432eSBarry Smith     ierr = VecCreate(PetscObjectComm((PetscObject)A),&b);CHKERRQ(ierr);
95967877ebaSShri Abhyankar     ierr = VecSetSizes(b,A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr);
96067877ebaSShri Abhyankar     ierr = VecSetFromOptions(b);CHKERRQ(ierr);
96167877ebaSShri Abhyankar 
962a5e57a09SHong Zhang     ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr);
9636bf464f9SBarry Smith     ierr = ISDestroy(&is_iden);CHKERRQ(ierr);
9646bf464f9SBarry Smith     ierr = VecDestroy(&b);CHKERRQ(ierr);
96567877ebaSShri Abhyankar     break;
96667877ebaSShri Abhyankar   }
967a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
968a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1));
96967877ebaSShri Abhyankar 
970719d5645SBarry Smith   F->ops->lufactornumeric = MatFactorNumeric_MUMPS;
971dcd589f8SShri Abhyankar   F->ops->solve           = MatSolve_MUMPS;
97251d5961aSHong Zhang   F->ops->solvetranspose  = MatSolveTranspose_MUMPS;
97317f96c7aSHong Zhang   F->ops->matsolve        = 0;  /* use MatMatSolve_Basic() until mumps supports distributed rhs */
974b24902e0SBarry Smith   PetscFunctionReturn(0);
975b24902e0SBarry Smith }
976b24902e0SBarry Smith 
977450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */
978450b117fSShri Abhyankar #undef __FUNCT__
979450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS"
980450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info)
981450b117fSShri Abhyankar {
982a5e57a09SHong Zhang   Mat_MUMPS      *mumps = (Mat_MUMPS*)F->spptr;
983dcd589f8SShri Abhyankar   PetscErrorCode ierr;
98467877ebaSShri Abhyankar   Vec            b;
98567877ebaSShri Abhyankar   IS             is_iden;
98667877ebaSShri Abhyankar   const PetscInt M = A->rmap->N;
987450b117fSShri Abhyankar 
988450b117fSShri Abhyankar   PetscFunctionBegin;
989a5e57a09SHong Zhang   mumps->matstruc = DIFFERENT_NONZERO_PATTERN;
990dcd589f8SShri Abhyankar 
9919a2535b5SHong Zhang   /* Set MUMPS options from the options database */
9929a2535b5SHong Zhang   ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr);
993dcd589f8SShri Abhyankar 
994a5e57a09SHong Zhang   ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr);
99567877ebaSShri Abhyankar 
99667877ebaSShri Abhyankar   /* analysis phase */
99767877ebaSShri Abhyankar   /*----------------*/
998a5e57a09SHong Zhang   mumps->id.job = JOB_FACTSYMBOLIC;
999a5e57a09SHong Zhang   mumps->id.n   = M;
1000a5e57a09SHong Zhang   switch (mumps->id.ICNTL(18)) {
100167877ebaSShri Abhyankar   case 0:  /* centralized assembled matrix input */
1002a5e57a09SHong Zhang     if (!mumps->myid) {
1003a5e57a09SHong Zhang       mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn;
1004a5e57a09SHong Zhang       if (mumps->id.ICNTL(6)>1) {
100567877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
10062907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
1007a5e57a09SHong Zhang         mumps->id.a = (mumps_complex*)mumps->val;
10082907cef9SHong Zhang #else
1009a5e57a09SHong Zhang         mumps->id.a = (mumps_double_complex*)mumps->val;
10102907cef9SHong Zhang #endif
101167877ebaSShri Abhyankar #else
1012a5e57a09SHong Zhang         mumps->id.a = mumps->val;
101367877ebaSShri Abhyankar #endif
101467877ebaSShri Abhyankar       }
101567877ebaSShri Abhyankar     }
101667877ebaSShri Abhyankar     break;
101767877ebaSShri Abhyankar   case 3:  /* distributed assembled matrix input (size>1) */
1018a5e57a09SHong Zhang     mumps->id.nz_loc = mumps->nz;
1019a5e57a09SHong Zhang     mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn;
1020a5e57a09SHong Zhang     if (mumps->id.ICNTL(6)>1) {
102167877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
10222907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
1023a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_complex*)mumps->val;
10242907cef9SHong Zhang #else
1025a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_double_complex*)mumps->val;
10262907cef9SHong Zhang #endif
102767877ebaSShri Abhyankar #else
1028a5e57a09SHong Zhang       mumps->id.a_loc = mumps->val;
102967877ebaSShri Abhyankar #endif
103067877ebaSShri Abhyankar     }
103167877ebaSShri Abhyankar     /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */
1032a5e57a09SHong Zhang     if (!mumps->myid) {
1033a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr);
103467877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr);
103567877ebaSShri Abhyankar     } else {
1036a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr);
103767877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr);
103867877ebaSShri Abhyankar     }
1039ce94432eSBarry Smith     ierr = VecCreate(PetscObjectComm((PetscObject)A),&b);CHKERRQ(ierr);
104067877ebaSShri Abhyankar     ierr = VecSetSizes(b,A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr);
104167877ebaSShri Abhyankar     ierr = VecSetFromOptions(b);CHKERRQ(ierr);
104267877ebaSShri Abhyankar 
1043a5e57a09SHong Zhang     ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr);
10446bf464f9SBarry Smith     ierr = ISDestroy(&is_iden);CHKERRQ(ierr);
10456bf464f9SBarry Smith     ierr = VecDestroy(&b);CHKERRQ(ierr);
104667877ebaSShri Abhyankar     break;
104767877ebaSShri Abhyankar   }
1048a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
1049a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1));
105067877ebaSShri Abhyankar 
1051450b117fSShri Abhyankar   F->ops->lufactornumeric = MatFactorNumeric_MUMPS;
1052dcd589f8SShri Abhyankar   F->ops->solve           = MatSolve_MUMPS;
105351d5961aSHong Zhang   F->ops->solvetranspose  = MatSolveTranspose_MUMPS;
1054450b117fSShri Abhyankar   PetscFunctionReturn(0);
1055450b117fSShri Abhyankar }
1056b24902e0SBarry Smith 
1057141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */
1058397b6df1SKris Buschelman #undef __FUNCT__
105967877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS"
106067877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info)
1061b24902e0SBarry Smith {
1062a5e57a09SHong Zhang   Mat_MUMPS      *mumps = (Mat_MUMPS*)F->spptr;
1063dcd589f8SShri Abhyankar   PetscErrorCode ierr;
106467877ebaSShri Abhyankar   Vec            b;
106567877ebaSShri Abhyankar   IS             is_iden;
106667877ebaSShri Abhyankar   const PetscInt M = A->rmap->N;
1067397b6df1SKris Buschelman 
1068397b6df1SKris Buschelman   PetscFunctionBegin;
1069a5e57a09SHong Zhang   mumps->matstruc = DIFFERENT_NONZERO_PATTERN;
1070dcd589f8SShri Abhyankar 
10719a2535b5SHong Zhang   /* Set MUMPS options from the options database */
10729a2535b5SHong Zhang   ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr);
1073dcd589f8SShri Abhyankar 
1074a5e57a09SHong Zhang   ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr);
1075dcd589f8SShri Abhyankar 
107667877ebaSShri Abhyankar   /* analysis phase */
107767877ebaSShri Abhyankar   /*----------------*/
1078a5e57a09SHong Zhang   mumps->id.job = JOB_FACTSYMBOLIC;
1079a5e57a09SHong Zhang   mumps->id.n   = M;
1080a5e57a09SHong Zhang   switch (mumps->id.ICNTL(18)) {
108167877ebaSShri Abhyankar   case 0:  /* centralized assembled matrix input */
1082a5e57a09SHong Zhang     if (!mumps->myid) {
1083a5e57a09SHong Zhang       mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn;
1084a5e57a09SHong Zhang       if (mumps->id.ICNTL(6)>1) {
108567877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
10862907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
1087a5e57a09SHong Zhang         mumps->id.a = (mumps_complex*)mumps->val;
10882907cef9SHong Zhang #else
1089a5e57a09SHong Zhang         mumps->id.a = (mumps_double_complex*)mumps->val;
10902907cef9SHong Zhang #endif
109167877ebaSShri Abhyankar #else
1092a5e57a09SHong Zhang         mumps->id.a = mumps->val;
109367877ebaSShri Abhyankar #endif
109467877ebaSShri Abhyankar       }
109567877ebaSShri Abhyankar     }
109667877ebaSShri Abhyankar     break;
109767877ebaSShri Abhyankar   case 3:  /* distributed assembled matrix input (size>1) */
1098a5e57a09SHong Zhang     mumps->id.nz_loc = mumps->nz;
1099a5e57a09SHong Zhang     mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn;
1100a5e57a09SHong Zhang     if (mumps->id.ICNTL(6)>1) {
110167877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX)
11022907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE)
1103a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_complex*)mumps->val;
11042907cef9SHong Zhang #else
1105a5e57a09SHong Zhang       mumps->id.a_loc = (mumps_double_complex*)mumps->val;
11062907cef9SHong Zhang #endif
110767877ebaSShri Abhyankar #else
1108a5e57a09SHong Zhang       mumps->id.a_loc = mumps->val;
110967877ebaSShri Abhyankar #endif
111067877ebaSShri Abhyankar     }
111167877ebaSShri Abhyankar     /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */
1112a5e57a09SHong Zhang     if (!mumps->myid) {
1113a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr);
111467877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr);
111567877ebaSShri Abhyankar     } else {
1116a5e57a09SHong Zhang       ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr);
111767877ebaSShri Abhyankar       ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr);
111867877ebaSShri Abhyankar     }
1119ce94432eSBarry Smith     ierr = VecCreate(PetscObjectComm((PetscObject)A),&b);CHKERRQ(ierr);
112067877ebaSShri Abhyankar     ierr = VecSetSizes(b,A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr);
112167877ebaSShri Abhyankar     ierr = VecSetFromOptions(b);CHKERRQ(ierr);
112267877ebaSShri Abhyankar 
1123a5e57a09SHong Zhang     ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr);
11246bf464f9SBarry Smith     ierr = ISDestroy(&is_iden);CHKERRQ(ierr);
11256bf464f9SBarry Smith     ierr = VecDestroy(&b);CHKERRQ(ierr);
112667877ebaSShri Abhyankar     break;
112767877ebaSShri Abhyankar   }
1128a5e57a09SHong Zhang   PetscMUMPS_c(&mumps->id);
1129a5e57a09SHong Zhang   if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1));
113067877ebaSShri Abhyankar 
11312792810eSHong Zhang   F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS;
1132dcd589f8SShri Abhyankar   F->ops->solve                 = MatSolve_MUMPS;
113351d5961aSHong Zhang   F->ops->solvetranspose        = MatSolve_MUMPS;
113430c107b7SHong Zhang   F->ops->matsolve              = 0; /* use MatMatSolve_Basic() until mumps supports distributed rhs */
1135db4efbfdSBarry Smith #if !defined(PETSC_USE_COMPLEX)
113605aa0992SJose Roman   F->ops->getinertia = MatGetInertia_SBAIJMUMPS;
113705aa0992SJose Roman #else
11380298fd71SBarry Smith   F->ops->getinertia = NULL;
1139db4efbfdSBarry Smith #endif
1140b24902e0SBarry Smith   PetscFunctionReturn(0);
1141b24902e0SBarry Smith }
1142b24902e0SBarry Smith 
1143397b6df1SKris Buschelman #undef __FUNCT__
114464e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS"
114564e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer)
114674ed9c26SBarry Smith {
1147f6c57405SHong Zhang   PetscErrorCode    ierr;
114864e6c443SBarry Smith   PetscBool         iascii;
114964e6c443SBarry Smith   PetscViewerFormat format;
1150a5e57a09SHong Zhang   Mat_MUMPS         *mumps=(Mat_MUMPS*)A->spptr;
1151f6c57405SHong Zhang 
1152f6c57405SHong Zhang   PetscFunctionBegin;
115364e6c443SBarry Smith   /* check if matrix is mumps type */
115464e6c443SBarry Smith   if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0);
115564e6c443SBarry Smith 
1156251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr);
115764e6c443SBarry Smith   if (iascii) {
115864e6c443SBarry Smith     ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr);
115964e6c443SBarry Smith     if (format == PETSC_VIEWER_ASCII_INFO) {
116064e6c443SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr);
1161a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  SYM (matrix type):                   %d \n",mumps->id.sym);CHKERRQ(ierr);
1162a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  PAR (host participation):            %d \n",mumps->id.par);CHKERRQ(ierr);
1163a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(1) (output for error):         %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr);
1164a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr);
1165a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(3) (output for global info):   %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr);
1166a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(4) (level of printing):        %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr);
1167a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(5) (input mat struct):         %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr);
1168a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(6) (matrix prescaling):        %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr);
1169a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr);
1170a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(8) (scalling strategy):        %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr);
1171a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(10) (max num of refinements):  %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr);
1172a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(11) (error analysis):          %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr);
1173a5e57a09SHong Zhang       if (mumps->id.ICNTL(11)>0) {
1174a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(4) (inf norm of input mat):        %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr);
1175a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(5) (inf norm of solution):         %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr);
1176a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(6) (inf norm of residual):         %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr);
1177a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr);
1178a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(9) (error estimate):               %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr);
1179a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"    RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr);
1180f6c57405SHong Zhang       }
1181a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(12) (efficiency control):                         %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr);
1182a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(13) (efficiency control):                         %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr);
1183a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr);
1184f6c57405SHong Zhang       /* ICNTL(15-17) not used */
1185a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(18) (input mat struct):                           %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr);
1186a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(19) (Shur complement info):                       %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr);
1187a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(20) (rhs sparse pattern):                         %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr);
1188a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(21) (somumpstion struct):                            %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr);
1189a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(22) (in-core/out-of-core facility):               %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr);
1190a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr);
1191c0165424SHong Zhang 
1192a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(24) (detection of null pivot rows):               %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr);
1193a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(25) (computation of a null space basis):          %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr);
1194a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(26) (Schur options for rhs or solution):          %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr);
1195a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(27) (experimental parameter):                     %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr);
1196a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(28) (use parallel or sequential ordering):        %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr);
1197a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(29) (parallel ordering):                          %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr);
119842179a6aSHong Zhang 
1199a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(30) (user-specified set of entries in inv(A)):    %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr);
1200a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(31) (factors is discarded in the solve phase):    %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr);
1201a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  ICNTL(33) (compute determinant):                        %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr);
1202f6c57405SHong Zhang 
1203a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(1) (relative pivoting threshold):      %g \n",mumps->id.CNTL(1));CHKERRQ(ierr);
1204a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr);
1205a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(3) (absomumpste pivoting threshold):      %g \n",mumps->id.CNTL(3));CHKERRQ(ierr);
1206a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(4) (vamumpse of static pivoting):         %g \n",mumps->id.CNTL(4));CHKERRQ(ierr);
1207a5e57a09SHong Zhang       ierr = PetscViewerASCIIPrintf(viewer,"  CNTL(5) (fixation for null pivots):         %g \n",mumps->id.CNTL(5));CHKERRQ(ierr);
1208f6c57405SHong Zhang 
1209f6c57405SHong Zhang       /* infomation local to each processor */
121034ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr);
12117b23a99aSBarry Smith       ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
1212a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr);
121334ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
121434ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr);
1215a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d]  %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr);
121634ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
121734ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr);
1218a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d]  %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr);
121934ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
1220f6c57405SHong Zhang 
122134ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr);
1222a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"  [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr);
122334ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
1224f6c57405SHong Zhang 
122534ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr);
1226a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr);
122734ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
1228f6c57405SHong Zhang 
122934ed7027SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer, "  INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr);
1230a5e57a09SHong Zhang       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"    [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr);
123134ed7027SBarry Smith       ierr = PetscViewerFlush(viewer);
12327b23a99aSBarry Smith       ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr);
1233f6c57405SHong Zhang 
1234a5e57a09SHong Zhang       if (!mumps->myid) { /* information from the host */
1235a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr);
1236a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr);
1237a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr);
1238a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr);
1239f6c57405SHong Zhang 
1240a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr);
1241a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr);
1242a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr);
1243a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr);
1244a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr);
1245a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr);
1246a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr);
1247a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr);
1248a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr);
1249a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr);
1250a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr);
1251a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr);
1252a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr);
1253a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr);
1254a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr);
1255a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr);
1256a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr);
1257a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr);
1258a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr);
1259a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr);
1260a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr);
1261a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr);
1262a5e57a09SHong Zhang         ierr = PetscViewerASCIIPrintf(viewer,"  INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr);
1263f6c57405SHong Zhang       }
1264f6c57405SHong Zhang     }
1265cb828f0fSHong Zhang   }
1266f6c57405SHong Zhang   PetscFunctionReturn(0);
1267f6c57405SHong Zhang }
1268f6c57405SHong Zhang 
126935bd34faSBarry Smith #undef __FUNCT__
127035bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS"
127135bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info)
127235bd34faSBarry Smith {
1273cb828f0fSHong Zhang   Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr;
127435bd34faSBarry Smith 
127535bd34faSBarry Smith   PetscFunctionBegin;
127635bd34faSBarry Smith   info->block_size        = 1.0;
1277cb828f0fSHong Zhang   info->nz_allocated      = mumps->id.INFOG(20);
1278cb828f0fSHong Zhang   info->nz_used           = mumps->id.INFOG(20);
127935bd34faSBarry Smith   info->nz_unneeded       = 0.0;
128035bd34faSBarry Smith   info->assemblies        = 0.0;
128135bd34faSBarry Smith   info->mallocs           = 0.0;
128235bd34faSBarry Smith   info->memory            = 0.0;
128335bd34faSBarry Smith   info->fill_ratio_given  = 0;
128435bd34faSBarry Smith   info->fill_ratio_needed = 0;
128535bd34faSBarry Smith   info->factor_mallocs    = 0;
128635bd34faSBarry Smith   PetscFunctionReturn(0);
128735bd34faSBarry Smith }
128835bd34faSBarry Smith 
12895ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/
12905ccb76cbSHong Zhang #undef __FUNCT__
12915ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS"
12925ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival)
12935ccb76cbSHong Zhang {
1294a5e57a09SHong Zhang   Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr;
12955ccb76cbSHong Zhang 
12965ccb76cbSHong Zhang   PetscFunctionBegin;
1297a5e57a09SHong Zhang   mumps->id.ICNTL(icntl) = ival;
12985ccb76cbSHong Zhang   PetscFunctionReturn(0);
12995ccb76cbSHong Zhang }
13005ccb76cbSHong Zhang 
13015ccb76cbSHong Zhang #undef __FUNCT__
13025ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl"
13035ccb76cbSHong Zhang /*@
13045ccb76cbSHong Zhang   MatMumpsSetIcntl - Set MUMPS parameter ICNTL()
13055ccb76cbSHong Zhang 
13065ccb76cbSHong Zhang    Logically Collective on Mat
13075ccb76cbSHong Zhang 
13085ccb76cbSHong Zhang    Input Parameters:
13095ccb76cbSHong Zhang +  F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface
13105ccb76cbSHong Zhang .  icntl - index of MUMPS parameter array ICNTL()
13115ccb76cbSHong Zhang -  ival - value of MUMPS ICNTL(icntl)
13125ccb76cbSHong Zhang 
13135ccb76cbSHong Zhang   Options Database:
13145ccb76cbSHong Zhang .   -mat_mumps_icntl_<icntl> <ival>
13155ccb76cbSHong Zhang 
13165ccb76cbSHong Zhang    Level: beginner
13175ccb76cbSHong Zhang 
13185ccb76cbSHong Zhang    References: MUMPS Users' Guide
13195ccb76cbSHong Zhang 
13205ccb76cbSHong Zhang .seealso: MatGetFactor()
13215ccb76cbSHong Zhang @*/
13225ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival)
13235ccb76cbSHong Zhang {
13245ccb76cbSHong Zhang   PetscErrorCode ierr;
13255ccb76cbSHong Zhang 
13265ccb76cbSHong Zhang   PetscFunctionBegin;
13275ccb76cbSHong Zhang   PetscValidLogicalCollectiveInt(F,icntl,2);
13285ccb76cbSHong Zhang   PetscValidLogicalCollectiveInt(F,ival,3);
13295ccb76cbSHong Zhang   ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr);
13305ccb76cbSHong Zhang   PetscFunctionReturn(0);
13315ccb76cbSHong Zhang }
13325ccb76cbSHong Zhang 
13338928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/
13348928b65cSHong Zhang #undef __FUNCT__
13358928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS"
13368928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val)
13378928b65cSHong Zhang {
13388928b65cSHong Zhang   Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr;
13398928b65cSHong Zhang 
13408928b65cSHong Zhang   PetscFunctionBegin;
13418928b65cSHong Zhang   mumps->id.CNTL(icntl) = val;
13428928b65cSHong Zhang   PetscFunctionReturn(0);
13438928b65cSHong Zhang }
13448928b65cSHong Zhang 
13458928b65cSHong Zhang #undef __FUNCT__
13468928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl"
13478928b65cSHong Zhang /*@
13488928b65cSHong Zhang   MatMumpsSetCntl - Set MUMPS parameter CNTL()
13498928b65cSHong Zhang 
13508928b65cSHong Zhang    Logically Collective on Mat
13518928b65cSHong Zhang 
13528928b65cSHong Zhang    Input Parameters:
13538928b65cSHong Zhang +  F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface
13548928b65cSHong Zhang .  icntl - index of MUMPS parameter array CNTL()
13558928b65cSHong Zhang -  val - value of MUMPS CNTL(icntl)
13568928b65cSHong Zhang 
13578928b65cSHong Zhang   Options Database:
13588928b65cSHong Zhang .   -mat_mumps_cntl_<icntl> <val>
13598928b65cSHong Zhang 
13608928b65cSHong Zhang    Level: beginner
13618928b65cSHong Zhang 
13628928b65cSHong Zhang    References: MUMPS Users' Guide
13638928b65cSHong Zhang 
13648928b65cSHong Zhang .seealso: MatGetFactor()
13658928b65cSHong Zhang @*/
13668928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val)
13678928b65cSHong Zhang {
13688928b65cSHong Zhang   PetscErrorCode ierr;
13698928b65cSHong Zhang 
13708928b65cSHong Zhang   PetscFunctionBegin;
13718928b65cSHong Zhang   PetscValidLogicalCollectiveInt(F,icntl,2);
13728928b65cSHong Zhang   PetscValidLogicalCollectiveInt(F,val,3);
13738928b65cSHong Zhang   ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr);
13748928b65cSHong Zhang   PetscFunctionReturn(0);
13758928b65cSHong Zhang }
13768928b65cSHong Zhang 
137724b6179bSKris Buschelman /*MC
13782692d6eeSBarry Smith   MATSOLVERMUMPS -  A matrix type providing direct solvers (LU and Cholesky) for
137924b6179bSKris Buschelman   distributed and sequential matrices via the external package MUMPS.
138024b6179bSKris Buschelman 
138141c8de11SBarry Smith   Works with MATAIJ and MATSBAIJ matrices
138224b6179bSKris Buschelman 
138324b6179bSKris Buschelman   Options Database Keys:
1384fb8376fbSHong Zhang + -mat_mumps_icntl_4 <0,...,4> - print level
138524b6179bSKris Buschelman . -mat_mumps_icntl_6 <0,...,7> - matrix prescaling options (see MUMPS User's Guide)
138664e6c443SBarry Smith . -mat_mumps_icntl_7 <0,...,7> - matrix orderings (see MUMPS User's Guidec)
138724b6179bSKris Buschelman . -mat_mumps_icntl_9 <1,2> - A or A^T x=b to be solved: 1 denotes A, 2 denotes A^T
138824b6179bSKris Buschelman . -mat_mumps_icntl_10 <n> - maximum number of iterative refinements
138994b7f48cSBarry Smith . -mat_mumps_icntl_11 <n> - error analysis, a positive value returns statistics during -ksp_view
139024b6179bSKris Buschelman . -mat_mumps_icntl_12 <n> - efficiency control (see MUMPS User's Guide)
139124b6179bSKris Buschelman . -mat_mumps_icntl_13 <n> - efficiency control (see MUMPS User's Guide)
139224b6179bSKris Buschelman . -mat_mumps_icntl_14 <n> - efficiency control (see MUMPS User's Guide)
139324b6179bSKris Buschelman . -mat_mumps_icntl_15 <n> - efficiency control (see MUMPS User's Guide)
139424b6179bSKris Buschelman . -mat_mumps_cntl_1 <delta> - relative pivoting threshold
139524b6179bSKris Buschelman . -mat_mumps_cntl_2 <tol> - stopping criterion for refinement
139624b6179bSKris Buschelman - -mat_mumps_cntl_3 <adelta> - absolute pivoting threshold
139724b6179bSKris Buschelman 
139824b6179bSKris Buschelman   Level: beginner
139924b6179bSKris Buschelman 
140041c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage
140141c8de11SBarry Smith 
140224b6179bSKris Buschelman M*/
140324b6179bSKris Buschelman 
140435bd34faSBarry Smith #undef __FUNCT__
140535bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps"
1406f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type)
140735bd34faSBarry Smith {
140835bd34faSBarry Smith   PetscFunctionBegin;
14092692d6eeSBarry Smith   *type = MATSOLVERMUMPS;
141035bd34faSBarry Smith   PetscFunctionReturn(0);
141135bd34faSBarry Smith }
141235bd34faSBarry Smith 
1413bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */
14142877fffaSHong Zhang #undef __FUNCT__
1415bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps"
14168cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F)
14172877fffaSHong Zhang {
14182877fffaSHong Zhang   Mat            B;
14192877fffaSHong Zhang   PetscErrorCode ierr;
14202877fffaSHong Zhang   Mat_MUMPS      *mumps;
1421ace3abfcSBarry Smith   PetscBool      isSeqAIJ;
14222877fffaSHong Zhang 
14232877fffaSHong Zhang   PetscFunctionBegin;
14242877fffaSHong Zhang   /* Create the factorization matrix */
1425251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr);
1426ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr);
14272877fffaSHong Zhang   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
14282877fffaSHong Zhang   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
1429bccb9932SShri Abhyankar   if (isSeqAIJ) {
14300298fd71SBarry Smith     ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr);
1431bccb9932SShri Abhyankar   } else {
14320298fd71SBarry Smith     ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr);
1433bccb9932SShri Abhyankar   }
14342877fffaSHong Zhang 
143516ebf90aSShri Abhyankar   ierr = PetscNewLog(B,Mat_MUMPS,&mumps);CHKERRQ(ierr);
14362205254eSKarl Rupp 
14372877fffaSHong Zhang   B->ops->view    = MatView_MUMPS;
143835bd34faSBarry Smith   B->ops->getinfo = MatGetInfo_MUMPS;
14392205254eSKarl Rupp 
1440bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr);
1441bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr);
1442bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr);
1443450b117fSShri Abhyankar   if (ftype == MAT_FACTOR_LU) {
1444450b117fSShri Abhyankar     B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS;
1445d5f3da31SBarry Smith     B->factortype            = MAT_FACTOR_LU;
1446bccb9932SShri Abhyankar     if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij;
1447bccb9932SShri Abhyankar     else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij;
1448746480a1SHong Zhang     mumps->sym = 0;
1449dcd589f8SShri Abhyankar   } else {
145067877ebaSShri Abhyankar     B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS;
1451450b117fSShri Abhyankar     B->factortype                  = MAT_FACTOR_CHOLESKY;
1452bccb9932SShri Abhyankar     if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij;
1453bccb9932SShri Abhyankar     else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij;
14546fdc2a6dSBarry Smith     if (A->spd_set && A->spd) mumps->sym = 1;
14556fdc2a6dSBarry Smith     else                      mumps->sym = 2;
1456450b117fSShri Abhyankar   }
14572877fffaSHong Zhang 
14582877fffaSHong Zhang   mumps->isAIJ    = PETSC_TRUE;
1459bf0cc555SLisandro Dalcin   mumps->Destroy  = B->ops->destroy;
14602877fffaSHong Zhang   B->ops->destroy = MatDestroy_MUMPS;
14612877fffaSHong Zhang   B->spptr        = (void*)mumps;
14622205254eSKarl Rupp 
1463f697e70eSHong Zhang   ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr);
1464746480a1SHong Zhang 
14652877fffaSHong Zhang   *F = B;
14662877fffaSHong Zhang   PetscFunctionReturn(0);
14672877fffaSHong Zhang }
14682877fffaSHong Zhang 
1469bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */
14702877fffaSHong Zhang #undef __FUNCT__
1471bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps"
14728cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F)
14732877fffaSHong Zhang {
14742877fffaSHong Zhang   Mat            B;
14752877fffaSHong Zhang   PetscErrorCode ierr;
14762877fffaSHong Zhang   Mat_MUMPS      *mumps;
1477ace3abfcSBarry Smith   PetscBool      isSeqSBAIJ;
14782877fffaSHong Zhang 
14792877fffaSHong Zhang   PetscFunctionBegin;
1480ce94432eSBarry Smith   if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix");
1481ce94432eSBarry Smith   if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead");
1482251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr);
14832877fffaSHong Zhang   /* Create the factorization matrix */
1484ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr);
14852877fffaSHong Zhang   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
14862877fffaSHong Zhang   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
148716ebf90aSShri Abhyankar   ierr = PetscNewLog(B,Mat_MUMPS,&mumps);CHKERRQ(ierr);
1488bccb9932SShri Abhyankar   if (isSeqSBAIJ) {
14890298fd71SBarry Smith     ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr);
14902205254eSKarl Rupp 
149116ebf90aSShri Abhyankar     mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij;
1492dcd589f8SShri Abhyankar   } else {
14930298fd71SBarry Smith     ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr);
14942205254eSKarl Rupp 
1495bccb9932SShri Abhyankar     mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij;
1496bccb9932SShri Abhyankar   }
1497bccb9932SShri Abhyankar 
149867877ebaSShri Abhyankar   B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS;
1499bccb9932SShri Abhyankar   B->ops->view                   = MatView_MUMPS;
15002205254eSKarl Rupp 
1501bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr);
1502bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl);CHKERRQ(ierr);
1503bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl);CHKERRQ(ierr);
15042205254eSKarl Rupp 
1505f4762488SHong Zhang   B->factortype = MAT_FACTOR_CHOLESKY;
15066fdc2a6dSBarry Smith   if (A->spd_set && A->spd) mumps->sym = 1;
15076fdc2a6dSBarry Smith   else                      mumps->sym = 2;
1508a214ac2aSShri Abhyankar 
1509bccb9932SShri Abhyankar   mumps->isAIJ    = PETSC_FALSE;
1510bf0cc555SLisandro Dalcin   mumps->Destroy  = B->ops->destroy;
1511f3c0ef26SHong Zhang   B->ops->destroy = MatDestroy_MUMPS;
15122877fffaSHong Zhang   B->spptr        = (void*)mumps;
15132205254eSKarl Rupp 
1514f697e70eSHong Zhang   ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr);
1515746480a1SHong Zhang 
15162877fffaSHong Zhang   *F = B;
15172877fffaSHong Zhang   PetscFunctionReturn(0);
15182877fffaSHong Zhang }
151997969023SHong Zhang 
1520450b117fSShri Abhyankar #undef __FUNCT__
1521bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps"
15228cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F)
152367877ebaSShri Abhyankar {
152467877ebaSShri Abhyankar   Mat            B;
152567877ebaSShri Abhyankar   PetscErrorCode ierr;
152667877ebaSShri Abhyankar   Mat_MUMPS      *mumps;
1527ace3abfcSBarry Smith   PetscBool      isSeqBAIJ;
152867877ebaSShri Abhyankar 
152967877ebaSShri Abhyankar   PetscFunctionBegin;
153067877ebaSShri Abhyankar   /* Create the factorization matrix */
1531251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr);
1532ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr);
153367877ebaSShri Abhyankar   ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr);
153467877ebaSShri Abhyankar   ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr);
1535bccb9932SShri Abhyankar   if (isSeqBAIJ) {
15360298fd71SBarry Smith     ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr);
1537bccb9932SShri Abhyankar   } else {
15380298fd71SBarry Smith     ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr);
1539bccb9932SShri Abhyankar   }
1540450b117fSShri Abhyankar 
154167877ebaSShri Abhyankar   ierr = PetscNewLog(B,Mat_MUMPS,&mumps);CHKERRQ(ierr);
1542450b117fSShri Abhyankar   if (ftype == MAT_FACTOR_LU) {
1543450b117fSShri Abhyankar     B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS;
1544450b117fSShri Abhyankar     B->factortype            = MAT_FACTOR_LU;
1545bccb9932SShri Abhyankar     if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij;
1546bccb9932SShri Abhyankar     else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij;
1547746480a1SHong Zhang     mumps->sym = 0;
1548f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n");
1549bccb9932SShri Abhyankar 
1550450b117fSShri Abhyankar   B->ops->view = MatView_MUMPS;
15512205254eSKarl Rupp 
1552bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr);
1553bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr);
1554bdf89e91SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr);
1555450b117fSShri Abhyankar 
1556450b117fSShri Abhyankar   mumps->isAIJ    = PETSC_TRUE;
1557bf0cc555SLisandro Dalcin   mumps->Destroy  = B->ops->destroy;
1558450b117fSShri Abhyankar   B->ops->destroy = MatDestroy_MUMPS;
1559450b117fSShri Abhyankar   B->spptr        = (void*)mumps;
15602205254eSKarl Rupp 
1561f697e70eSHong Zhang   ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr);
1562746480a1SHong Zhang 
1563450b117fSShri Abhyankar   *F = B;
1564450b117fSShri Abhyankar   PetscFunctionReturn(0);
1565450b117fSShri Abhyankar }
1566a214ac2aSShri Abhyankar 
1567