11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8397b6df1SKris Buschelman 9397b6df1SKris Buschelman EXTERN_C_BEGIN 10397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 11c6db04a5SJed Brown #include <zmumps_c.h> 12397b6df1SKris Buschelman #else 13c6db04a5SJed Brown #include <dmumps_c.h> 14397b6df1SKris Buschelman #endif 15397b6df1SKris Buschelman EXTERN_C_END 16397b6df1SKris Buschelman #define JOB_INIT -1 173d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 183d472b54SHong Zhang #define JOB_FACTNUMERIC 2 193d472b54SHong Zhang #define JOB_SOLVE 3 20397b6df1SKris Buschelman #define JOB_END -2 213d472b54SHong Zhang 223d472b54SHong Zhang 23397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 24397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 25397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 26397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 27a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 28397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 29adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 30397b6df1SKris Buschelman 31397b6df1SKris Buschelman typedef struct { 32397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 33397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 34397b6df1SKris Buschelman #else 35397b6df1SKris Buschelman DMUMPS_STRUC_C id; 36397b6df1SKris Buschelman #endif 37397b6df1SKris Buschelman MatStructure matstruc; 38c1490034SHong Zhang PetscMPIInt myid,size; 3916ebf90aSShri Abhyankar PetscInt *irn,*jcn,nz,sym,nSolve; 40397b6df1SKris Buschelman PetscScalar *val; 41397b6df1SKris Buschelman MPI_Comm comm_mumps; 42329ec9b3SHong Zhang VecScatter scat_rhs, scat_sol; 4364e6c443SBarry Smith PetscBool isAIJ,CleanUpMUMPS; 44329ec9b3SHong Zhang Vec 
b_seq,x_seq; 45bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 46bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 47f0c56d0fSKris Buschelman } Mat_MUMPS; 48f0c56d0fSKris Buschelman 4909573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 50b24902e0SBarry Smith 5167877ebaSShri Abhyankar 5267877ebaSShri Abhyankar /* MatConvertToTriples_A_B */ 5367877ebaSShri Abhyankar /*convert Petsc matrix to triples: row[nz], col[nz], val[nz] */ 54397b6df1SKris Buschelman /* 55397b6df1SKris Buschelman input: 5667877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 57397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 58bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 59bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 60397b6df1SKris Buschelman output: 61397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 62397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 63397b6df1SKris Buschelman */ 6416ebf90aSShri Abhyankar 6516ebf90aSShri Abhyankar #undef __FUNCT__ 6616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 67bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 68b24902e0SBarry Smith { 69185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 7067877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 71dfbe8321SBarry Smith PetscErrorCode ierr; 72c1490034SHong Zhang PetscInt *row,*col; 7316ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 74397b6df1SKris Buschelman 75397b6df1SKris Buschelman PetscFunctionBegin; 7616ebf90aSShri Abhyankar *v=aa->a; 77bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 7816ebf90aSShri Abhyankar nz = 
aa->nz; ai = aa->i; aj = aa->j; 7916ebf90aSShri Abhyankar *nnz = nz; 80185f6596SHong Zhang ierr = PetscMalloc(2*nz*sizeof(PetscInt), &row);CHKERRQ(ierr); 81185f6596SHong Zhang col = row + nz; 82185f6596SHong Zhang 8316ebf90aSShri Abhyankar nz = 0; 8416ebf90aSShri Abhyankar for(i=0; i<M; i++) { 8516ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 8667877ebaSShri Abhyankar ajj = aj + ai[i]; 8767877ebaSShri Abhyankar for(j=0; j<rnz; j++) { 8867877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 8916ebf90aSShri Abhyankar } 9016ebf90aSShri Abhyankar } 9116ebf90aSShri Abhyankar *r = row; *c = col; 9216ebf90aSShri Abhyankar } 9316ebf90aSShri Abhyankar PetscFunctionReturn(0); 9416ebf90aSShri Abhyankar } 95397b6df1SKris Buschelman 9616ebf90aSShri Abhyankar #undef __FUNCT__ 9767877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 98bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 9967877ebaSShri Abhyankar { 10067877ebaSShri Abhyankar Mat_SeqBAIJ *aa=(Mat_SeqBAIJ*)A->data; 10167877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,bs=A->rmap->bs,bs2=aa->bs2,M=A->rmap->N/bs; 1020ad0caddSJed Brown PetscInt nz,idx=0,rnz,i,j,k,m; 10367877ebaSShri Abhyankar PetscErrorCode ierr; 10467877ebaSShri Abhyankar PetscInt *row,*col; 10567877ebaSShri Abhyankar 10667877ebaSShri Abhyankar PetscFunctionBegin; 107cf3759fdSShri Abhyankar *v = aa->a; 108bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 109cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 11067877ebaSShri Abhyankar nz = bs2*aa->nz; 11167877ebaSShri Abhyankar *nnz = nz; 112185f6596SHong Zhang ierr = PetscMalloc(2*nz*sizeof(PetscInt), &row);CHKERRQ(ierr); 113185f6596SHong Zhang col = row + nz; 114185f6596SHong Zhang 11567877ebaSShri Abhyankar for(i=0; i<M; i++) { 11667877ebaSShri Abhyankar ajj = aj + ai[i]; 11767877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 11867877ebaSShri Abhyankar for(k=0; 
k<rnz; k++) { 11967877ebaSShri Abhyankar for(j=0; j<bs; j++) { 12067877ebaSShri Abhyankar for(m=0; m<bs; m++) { 12167877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 122cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 12367877ebaSShri Abhyankar } 12467877ebaSShri Abhyankar } 12567877ebaSShri Abhyankar } 12667877ebaSShri Abhyankar } 127cf3759fdSShri Abhyankar *r = row; *c = col; 12867877ebaSShri Abhyankar } 12967877ebaSShri Abhyankar PetscFunctionReturn(0); 13067877ebaSShri Abhyankar } 13167877ebaSShri Abhyankar 13267877ebaSShri Abhyankar #undef __FUNCT__ 13316ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 134bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 13516ebf90aSShri Abhyankar { 13667877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 13767877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 13816ebf90aSShri Abhyankar PetscErrorCode ierr; 13916ebf90aSShri Abhyankar PetscInt *row,*col; 14016ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 14116ebf90aSShri Abhyankar 14216ebf90aSShri Abhyankar PetscFunctionBegin; 143bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 14416ebf90aSShri Abhyankar nz = aa->nz;ai=aa->i; aj=aa->j;*v=aa->a; 14516ebf90aSShri Abhyankar *nnz = nz; 146185f6596SHong Zhang ierr = PetscMalloc(2*nz*sizeof(PetscInt), &row);CHKERRQ(ierr); 147185f6596SHong Zhang col = row + nz; 148185f6596SHong Zhang 14916ebf90aSShri Abhyankar nz = 0; 15016ebf90aSShri Abhyankar for(i=0; i<M; i++) { 15116ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 15267877ebaSShri Abhyankar ajj = aj + ai[i]; 15367877ebaSShri Abhyankar for(j=0; j<rnz; j++) { 15467877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 15516ebf90aSShri Abhyankar } 15616ebf90aSShri Abhyankar } 15716ebf90aSShri Abhyankar *r = row; *c = col; 15816ebf90aSShri Abhyankar } 15916ebf90aSShri Abhyankar 
PetscFunctionReturn(0); 16016ebf90aSShri Abhyankar } 16116ebf90aSShri Abhyankar 16216ebf90aSShri Abhyankar #undef __FUNCT__ 16316ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 164bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 16516ebf90aSShri Abhyankar { 16667877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 16767877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 16867877ebaSShri Abhyankar const PetscScalar *av,*v1; 16916ebf90aSShri Abhyankar PetscScalar *val; 17016ebf90aSShri Abhyankar PetscErrorCode ierr; 17116ebf90aSShri Abhyankar PetscInt *row,*col; 17216ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 17316ebf90aSShri Abhyankar 17416ebf90aSShri Abhyankar PetscFunctionBegin; 17516ebf90aSShri Abhyankar ai=aa->i; aj=aa->j;av=aa->a; 17616ebf90aSShri Abhyankar adiag=aa->diag; 177bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 17816ebf90aSShri Abhyankar nz = M + (aa->nz-M)/2; 17916ebf90aSShri Abhyankar *nnz = nz; 180185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 181185f6596SHong Zhang col = row + nz; 182185f6596SHong Zhang val = (PetscScalar*)(col + nz); 183185f6596SHong Zhang 18416ebf90aSShri Abhyankar nz = 0; 18516ebf90aSShri Abhyankar for(i=0; i<M; i++) { 18616ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 18767877ebaSShri Abhyankar ajj = aj + adiag[i]; 188cf3759fdSShri Abhyankar v1 = av + adiag[i]; 18967877ebaSShri Abhyankar for(j=0; j<rnz; j++) { 19067877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 19116ebf90aSShri Abhyankar } 19216ebf90aSShri Abhyankar } 19316ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 194397b6df1SKris Buschelman } else { 19516ebf90aSShri Abhyankar nz = 0; val = *v; 19616ebf90aSShri Abhyankar for(i=0; i <M; i++) { 19716ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 
19867877ebaSShri Abhyankar ajj = aj + adiag[i]; 19967877ebaSShri Abhyankar v1 = av + adiag[i]; 20067877ebaSShri Abhyankar for(j=0; j<rnz; j++) { 20167877ebaSShri Abhyankar val[nz++] = v1[j]; 20216ebf90aSShri Abhyankar } 20316ebf90aSShri Abhyankar } 20416ebf90aSShri Abhyankar } 20516ebf90aSShri Abhyankar PetscFunctionReturn(0); 20616ebf90aSShri Abhyankar } 20716ebf90aSShri Abhyankar 20816ebf90aSShri Abhyankar #undef __FUNCT__ 20916ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 210bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 21116ebf90aSShri Abhyankar { 21216ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 21316ebf90aSShri Abhyankar PetscErrorCode ierr; 21416ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 21516ebf90aSShri Abhyankar PetscInt *row,*col; 21616ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 21716ebf90aSShri Abhyankar PetscScalar *val; 218397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 219397b6df1SKris Buschelman Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)(mat->A)->data; 220397b6df1SKris Buschelman Mat_SeqBAIJ *bb=(Mat_SeqBAIJ*)(mat->B)->data; 22116ebf90aSShri Abhyankar 22216ebf90aSShri Abhyankar PetscFunctionBegin; 223d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 224397b6df1SKris Buschelman garray = mat->garray; 225397b6df1SKris Buschelman av=aa->a; bv=bb->a; 226397b6df1SKris Buschelman 227bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 22816ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 22916ebf90aSShri Abhyankar *nnz = nz; 230185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 231185f6596SHong Zhang col = row + nz; 232185f6596SHong Zhang val = (PetscScalar*)(col + nz); 233185f6596SHong Zhang 234397b6df1SKris Buschelman *r = row; *c = 
col; *v = val; 235397b6df1SKris Buschelman } else { 236397b6df1SKris Buschelman row = *r; col = *c; val = *v; 237397b6df1SKris Buschelman } 238397b6df1SKris Buschelman 239028e57e8SHong Zhang jj = 0; irow = rstart; 240397b6df1SKris Buschelman for ( i=0; i<m; i++ ) { 241397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 242397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 243397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 244397b6df1SKris Buschelman bjj = bj + bi[i]; 24516ebf90aSShri Abhyankar v1 = av + ai[i]; 24616ebf90aSShri Abhyankar v2 = bv + bi[i]; 247397b6df1SKris Buschelman 248397b6df1SKris Buschelman /* A-part */ 249397b6df1SKris Buschelman for (j=0; j<countA; j++){ 250bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 251397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 252397b6df1SKris Buschelman } 25316ebf90aSShri Abhyankar val[jj++] = v1[j]; 254397b6df1SKris Buschelman } 25516ebf90aSShri Abhyankar 25616ebf90aSShri Abhyankar /* B-part */ 25716ebf90aSShri Abhyankar for(j=0; j < countB; j++){ 258bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 259397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 260397b6df1SKris Buschelman } 26116ebf90aSShri Abhyankar val[jj++] = v2[j]; 26216ebf90aSShri Abhyankar } 26316ebf90aSShri Abhyankar irow++; 26416ebf90aSShri Abhyankar } 26516ebf90aSShri Abhyankar PetscFunctionReturn(0); 26616ebf90aSShri Abhyankar } 26716ebf90aSShri Abhyankar 26816ebf90aSShri Abhyankar #undef __FUNCT__ 26916ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 270bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 27116ebf90aSShri Abhyankar { 27216ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 27316ebf90aSShri Abhyankar PetscErrorCode ierr; 27416ebf90aSShri Abhyankar PetscInt 
rstart,nz,i,j,jj,irow,countA,countB; 27516ebf90aSShri Abhyankar PetscInt *row,*col; 27616ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 27716ebf90aSShri Abhyankar PetscScalar *val; 27816ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 27916ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)(mat->A)->data; 28016ebf90aSShri Abhyankar Mat_SeqAIJ *bb=(Mat_SeqAIJ*)(mat->B)->data; 28116ebf90aSShri Abhyankar 28216ebf90aSShri Abhyankar PetscFunctionBegin; 28316ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 28416ebf90aSShri Abhyankar garray = mat->garray; 28516ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 28616ebf90aSShri Abhyankar 287bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 28816ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 28916ebf90aSShri Abhyankar *nnz = nz; 290185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 291185f6596SHong Zhang col = row + nz; 292185f6596SHong Zhang val = (PetscScalar*)(col + nz); 293185f6596SHong Zhang 29416ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 29516ebf90aSShri Abhyankar } else { 29616ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 29716ebf90aSShri Abhyankar } 29816ebf90aSShri Abhyankar 29916ebf90aSShri Abhyankar jj = 0; irow = rstart; 30016ebf90aSShri Abhyankar for ( i=0; i<m; i++ ) { 30116ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 30216ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 30316ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 30416ebf90aSShri Abhyankar bjj = bj + bi[i]; 30516ebf90aSShri Abhyankar v1 = av + ai[i]; 30616ebf90aSShri Abhyankar v2 = bv + bi[i]; 30716ebf90aSShri Abhyankar 30816ebf90aSShri Abhyankar /* A-part */ 30916ebf90aSShri Abhyankar for (j=0; j<countA; j++){ 310bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 31116ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 31216ebf90aSShri Abhyankar } 
31316ebf90aSShri Abhyankar val[jj++] = v1[j]; 31416ebf90aSShri Abhyankar } 31516ebf90aSShri Abhyankar 31616ebf90aSShri Abhyankar /* B-part */ 31716ebf90aSShri Abhyankar for(j=0; j < countB; j++){ 318bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 31916ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 32016ebf90aSShri Abhyankar } 32116ebf90aSShri Abhyankar val[jj++] = v2[j]; 32216ebf90aSShri Abhyankar } 32316ebf90aSShri Abhyankar irow++; 32416ebf90aSShri Abhyankar } 32516ebf90aSShri Abhyankar PetscFunctionReturn(0); 32616ebf90aSShri Abhyankar } 32716ebf90aSShri Abhyankar 32816ebf90aSShri Abhyankar #undef __FUNCT__ 32967877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij" 330bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 33167877ebaSShri Abhyankar { 33267877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 33367877ebaSShri Abhyankar Mat_SeqBAIJ *aa=(Mat_SeqBAIJ*)(mat->A)->data; 33467877ebaSShri Abhyankar Mat_SeqBAIJ *bb=(Mat_SeqBAIJ*)(mat->B)->data; 33567877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 336d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 33767877ebaSShri Abhyankar const PetscInt bs = A->rmap->bs,bs2=mat->bs2; 33867877ebaSShri Abhyankar PetscErrorCode ierr; 33967877ebaSShri Abhyankar PetscInt nz,i,j,k,n,jj,irow,countA,countB,idx; 34067877ebaSShri Abhyankar PetscInt *row,*col; 34167877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 34267877ebaSShri Abhyankar PetscScalar *val; 34367877ebaSShri Abhyankar 34467877ebaSShri Abhyankar PetscFunctionBegin; 34567877ebaSShri Abhyankar 346bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 34767877ebaSShri Abhyankar nz = bs2*(aa->nz + bb->nz); 34867877ebaSShri Abhyankar *nnz = nz; 349185f6596SHong Zhang ierr = 
PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 350185f6596SHong Zhang col = row + nz; 351185f6596SHong Zhang val = (PetscScalar*)(col + nz); 352185f6596SHong Zhang 35367877ebaSShri Abhyankar *r = row; *c = col; *v = val; 35467877ebaSShri Abhyankar } else { 35567877ebaSShri Abhyankar row = *r; col = *c; val = *v; 35667877ebaSShri Abhyankar } 35767877ebaSShri Abhyankar 358d985c460SShri Abhyankar jj = 0; irow = rstart; 35967877ebaSShri Abhyankar for ( i=0; i<mbs; i++ ) { 36067877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 36167877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 36267877ebaSShri Abhyankar ajj = aj + ai[i]; 36367877ebaSShri Abhyankar bjj = bj + bi[i]; 36467877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 36567877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 36667877ebaSShri Abhyankar 36767877ebaSShri Abhyankar idx = 0; 36867877ebaSShri Abhyankar /* A-part */ 36967877ebaSShri Abhyankar for (k=0; k<countA; k++){ 37067877ebaSShri Abhyankar for (j=0; j<bs; j++) { 37167877ebaSShri Abhyankar for (n=0; n<bs; n++) { 372bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 373d985c460SShri Abhyankar row[jj] = irow + n + shift; 374d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 37567877ebaSShri Abhyankar } 37667877ebaSShri Abhyankar val[jj++] = v1[idx++]; 37767877ebaSShri Abhyankar } 37867877ebaSShri Abhyankar } 37967877ebaSShri Abhyankar } 38067877ebaSShri Abhyankar 38167877ebaSShri Abhyankar idx = 0; 38267877ebaSShri Abhyankar /* B-part */ 38367877ebaSShri Abhyankar for(k=0; k<countB; k++){ 38467877ebaSShri Abhyankar for (j=0; j<bs; j++) { 38567877ebaSShri Abhyankar for (n=0; n<bs; n++) { 386bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX){ 387d985c460SShri Abhyankar row[jj] = irow + n + shift; 388d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 38967877ebaSShri Abhyankar } 390d985c460SShri Abhyankar val[jj++] = v2[idx++]; 39167877ebaSShri Abhyankar } 39267877ebaSShri Abhyankar } 39367877ebaSShri 
Abhyankar } 394d985c460SShri Abhyankar irow += bs; 39567877ebaSShri Abhyankar } 39667877ebaSShri Abhyankar PetscFunctionReturn(0); 39767877ebaSShri Abhyankar } 39867877ebaSShri Abhyankar 39967877ebaSShri Abhyankar #undef __FUNCT__ 40016ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 401bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 40216ebf90aSShri Abhyankar { 40316ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 40416ebf90aSShri Abhyankar PetscErrorCode ierr; 40516ebf90aSShri Abhyankar PetscInt rstart,nz,nza,nzb_low,i,j,jj,irow,countA,countB; 40616ebf90aSShri Abhyankar PetscInt *row,*col; 40716ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 40816ebf90aSShri Abhyankar PetscScalar *val; 40916ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 41016ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)(mat->A)->data; 41116ebf90aSShri Abhyankar Mat_SeqAIJ *bb=(Mat_SeqAIJ*)(mat->B)->data; 41216ebf90aSShri Abhyankar 41316ebf90aSShri Abhyankar PetscFunctionBegin; 41416ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 41516ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 41616ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 41716ebf90aSShri Abhyankar rstart = A->rmap->rstart; 41816ebf90aSShri Abhyankar 419bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 42016ebf90aSShri Abhyankar nza = 0;nzb_low = 0; 42116ebf90aSShri Abhyankar for(i=0; i<m; i++){ 42216ebf90aSShri Abhyankar nza = nza + (ai[i+1] - adiag[i]); 42316ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 42416ebf90aSShri Abhyankar bjj = bj + bi[i]; 42516ebf90aSShri Abhyankar 42616ebf90aSShri Abhyankar j = 0; 42716ebf90aSShri Abhyankar while(garray[bjj[j]] < rstart) { 42816ebf90aSShri Abhyankar if(j == countB) break; 42916ebf90aSShri Abhyankar j++;nzb_low++; 43016ebf90aSShri Abhyankar } 
43116ebf90aSShri Abhyankar } 43216ebf90aSShri Abhyankar /* Total nz = nz for the upper triangular A part + nz for the 2nd B part */ 43316ebf90aSShri Abhyankar nz = nza + (bb->nz - nzb_low); 43416ebf90aSShri Abhyankar *nnz = nz; 435185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 436185f6596SHong Zhang col = row + nz; 437185f6596SHong Zhang val = (PetscScalar*)(col + nz); 438185f6596SHong Zhang 43916ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 44016ebf90aSShri Abhyankar } else { 44116ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 44216ebf90aSShri Abhyankar } 44316ebf90aSShri Abhyankar 44416ebf90aSShri Abhyankar jj = 0; irow = rstart; 44516ebf90aSShri Abhyankar for ( i=0; i<m; i++ ) { 44616ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 44716ebf90aSShri Abhyankar v1 = av + adiag[i]; 44816ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 44916ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 45016ebf90aSShri Abhyankar bjj = bj + bi[i]; 45116ebf90aSShri Abhyankar v2 = bv + bi[i]; 45216ebf90aSShri Abhyankar 45316ebf90aSShri Abhyankar /* A-part */ 45416ebf90aSShri Abhyankar for (j=0; j<countA; j++){ 455bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 45616ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 45716ebf90aSShri Abhyankar } 45816ebf90aSShri Abhyankar val[jj++] = v1[j]; 45916ebf90aSShri Abhyankar } 46016ebf90aSShri Abhyankar 46116ebf90aSShri Abhyankar /* B-part */ 46216ebf90aSShri Abhyankar for(j=0; j < countB; j++){ 46316ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 464bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 46516ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 46616ebf90aSShri Abhyankar } 46716ebf90aSShri Abhyankar val[jj++] = v2[j]; 46816ebf90aSShri Abhyankar } 469397b6df1SKris Buschelman } 470397b6df1SKris Buschelman irow++; 471397b6df1SKris 
Buschelman } 472397b6df1SKris Buschelman PetscFunctionReturn(0); 473397b6df1SKris Buschelman } 474397b6df1SKris Buschelman 475397b6df1SKris Buschelman #undef __FUNCT__ 4763924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 477dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A) 478dfbe8321SBarry Smith { 479f0c56d0fSKris Buschelman Mat_MUMPS *lu=(Mat_MUMPS*)A->spptr; 480dfbe8321SBarry Smith PetscErrorCode ierr; 481b24902e0SBarry Smith 482397b6df1SKris Buschelman PetscFunctionBegin; 483bf0cc555SLisandro Dalcin if (lu && lu->CleanUpMUMPS) { 484397b6df1SKris Buschelman /* Terminate instance, deallocate memories */ 4856bf464f9SBarry Smith ierr = PetscFree2(lu->id.sol_loc,lu->id.isol_loc);CHKERRQ(ierr); 4866bf464f9SBarry Smith ierr = VecScatterDestroy(&lu->scat_rhs);CHKERRQ(ierr); 4876bf464f9SBarry Smith ierr = VecDestroy(&lu->b_seq);CHKERRQ(ierr); 488bf0cc555SLisandro Dalcin ierr = VecScatterDestroy(&lu->scat_sol);CHKERRQ(ierr); 489bf0cc555SLisandro Dalcin ierr = VecDestroy(&lu->x_seq);CHKERRQ(ierr); 4906bf464f9SBarry Smith ierr=PetscFree(lu->id.perm_in);CHKERRQ(ierr); 491185f6596SHong Zhang ierr = PetscFree(lu->irn);CHKERRQ(ierr); 492397b6df1SKris Buschelman lu->id.job=JOB_END; 493397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 494397b6df1SKris Buschelman zmumps_c(&lu->id); 495397b6df1SKris Buschelman #else 496397b6df1SKris Buschelman dmumps_c(&lu->id); 497397b6df1SKris Buschelman #endif 498397b6df1SKris Buschelman ierr = MPI_Comm_free(&(lu->comm_mumps));CHKERRQ(ierr); 499397b6df1SKris Buschelman } 500bf0cc555SLisandro Dalcin if (lu && lu->Destroy) { 501bf0cc555SLisandro Dalcin ierr = (lu->Destroy)(A);CHKERRQ(ierr); 502bf0cc555SLisandro Dalcin } 503bf0cc555SLisandro Dalcin ierr = PetscFree(A->spptr);CHKERRQ(ierr); 504bf0cc555SLisandro Dalcin 50597969023SHong Zhang /* clear composed functions */ 50697969023SHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatFactorGetSolverPackage_C","",PETSC_NULL);CHKERRQ(ierr); 
507f250808bSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)A,"MatMumpsSetIcntl_C","",PETSC_NULL);CHKERRQ(ierr); 508397b6df1SKris Buschelman PetscFunctionReturn(0); 509397b6df1SKris Buschelman } 510397b6df1SKris Buschelman 511397b6df1SKris Buschelman #undef __FUNCT__ 512f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 513b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 514b24902e0SBarry Smith { 515f0c56d0fSKris Buschelman Mat_MUMPS *lu=(Mat_MUMPS*)A->spptr; 516d54de34fSKris Buschelman PetscScalar *array; 51767877ebaSShri Abhyankar Vec b_seq; 518329ec9b3SHong Zhang IS is_iden,is_petsc; 519dfbe8321SBarry Smith PetscErrorCode ierr; 520329ec9b3SHong Zhang PetscInt i; 521397b6df1SKris Buschelman 522397b6df1SKris Buschelman PetscFunctionBegin; 523329ec9b3SHong Zhang lu->id.nrhs = 1; 52467877ebaSShri Abhyankar b_seq = lu->b_seq; 525397b6df1SKris Buschelman if (lu->size > 1){ 526329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */ 52767877ebaSShri Abhyankar ierr = VecScatterBegin(lu->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 52867877ebaSShri Abhyankar ierr = VecScatterEnd(lu->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 52967877ebaSShri Abhyankar if (!lu->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 530397b6df1SKris Buschelman } else { /* size == 1 */ 531397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 532397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 533397b6df1SKris Buschelman } 534397b6df1SKris Buschelman if (!lu->myid) { /* define rhs on the host */ 5358278f211SHong Zhang lu->id.nrhs = 1; 536397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 537397b6df1SKris Buschelman lu->id.rhs = (mumps_double_complex*)array; 538397b6df1SKris Buschelman #else 539397b6df1SKris Buschelman lu->id.rhs = array; 540397b6df1SKris Buschelman #endif 541397b6df1SKris Buschelman } 542397b6df1SKris Buschelman 
543397b6df1SKris Buschelman /* solve phase */ 544329ec9b3SHong Zhang /*-------------*/ 5453d472b54SHong Zhang lu->id.job = JOB_SOLVE; 546397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 547397b6df1SKris Buschelman zmumps_c(&lu->id); 548397b6df1SKris Buschelman #else 549397b6df1SKris Buschelman dmumps_c(&lu->id); 550397b6df1SKris Buschelman #endif 55165e19b50SBarry Smith if (lu->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",lu->id.INFOG(1)); 552397b6df1SKris Buschelman 553329ec9b3SHong Zhang if (lu->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 554329ec9b3SHong Zhang if (!lu->nSolve){ /* create scatter scat_sol */ 555329ec9b3SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,lu->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 556329ec9b3SHong Zhang for (i=0; i<lu->id.lsol_loc; i++){ 557329ec9b3SHong Zhang lu->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 558397b6df1SKris Buschelman } 55970b3c8c7SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,lu->id.lsol_loc,lu->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 560329ec9b3SHong Zhang ierr = VecScatterCreate(lu->x_seq,is_iden,x,is_petsc,&lu->scat_sol);CHKERRQ(ierr); 5616bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 5626bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 563397b6df1SKris Buschelman } 564ca9f406cSSatish Balay ierr = VecScatterBegin(lu->scat_sol,lu->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 565ca9f406cSSatish Balay ierr = VecScatterEnd(lu->scat_sol,lu->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 566329ec9b3SHong Zhang } 567329ec9b3SHong Zhang lu->nSolve++; 568397b6df1SKris Buschelman PetscFunctionReturn(0); 569397b6df1SKris Buschelman } 570397b6df1SKris Buschelman 57151d5961aSHong Zhang #undef __FUNCT__ 57251d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 57351d5961aSHong Zhang PetscErrorCode 
MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 57451d5961aSHong Zhang { 57551d5961aSHong Zhang Mat_MUMPS *lu=(Mat_MUMPS*)A->spptr; 57651d5961aSHong Zhang PetscErrorCode ierr; 57751d5961aSHong Zhang 57851d5961aSHong Zhang PetscFunctionBegin; 57951d5961aSHong Zhang lu->id.ICNTL(9) = 0; 5800ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 58151d5961aSHong Zhang lu->id.ICNTL(9) = 1; 58251d5961aSHong Zhang PetscFunctionReturn(0); 58351d5961aSHong Zhang } 58451d5961aSHong Zhang 585e0b74bf9SHong Zhang #undef __FUNCT__ 586e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 587e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 588e0b74bf9SHong Zhang { 589*bda8bf91SBarry Smith PetscErrorCode ierr; 590*bda8bf91SBarry Smith PetscBool flg; 591*bda8bf91SBarry Smith 592e0b74bf9SHong Zhang PetscFunctionBegin; 593*bda8bf91SBarry Smith ierr = PetscTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,PETSC_NULL);CHKERRQ(ierr); 594*bda8bf91SBarry Smith if (!flg) SETERRQ(((PetscObject)A)->comm,PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 595*bda8bf91SBarry Smith ierr = PetscTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,PETSC_NULL);CHKERRQ(ierr); 596*bda8bf91SBarry Smith if (!flg) SETERRQ(((PetscObject)A)->comm,PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MatMatSolve_MUMPS() is not implemented yet"); 597e0b74bf9SHong Zhang PetscFunctionReturn(0); 598e0b74bf9SHong Zhang } 599e0b74bf9SHong Zhang 600ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 601a58c3f20SHong Zhang /* 602a58c3f20SHong Zhang input: 603a58c3f20SHong Zhang F: numeric factor 604a58c3f20SHong Zhang output: 605a58c3f20SHong Zhang nneg: total number of negative pivots 606a58c3f20SHong Zhang nzero: 0 607a58c3f20SHong Zhang npos: (global dimension of F) - nneg 608a58c3f20SHong Zhang */ 609a58c3f20SHong Zhang 610a58c3f20SHong Zhang #undef __FUNCT__ 611a58c3f20SHong Zhang #define __FUNCT__ 
"MatGetInertia_SBAIJMUMPS" 612dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 613a58c3f20SHong Zhang { 614a58c3f20SHong Zhang Mat_MUMPS *lu =(Mat_MUMPS*)F->spptr; 615dfbe8321SBarry Smith PetscErrorCode ierr; 616c1490034SHong Zhang PetscMPIInt size; 617a58c3f20SHong Zhang 618a58c3f20SHong Zhang PetscFunctionBegin; 6197adad957SLisandro Dalcin ierr = MPI_Comm_size(((PetscObject)F)->comm,&size);CHKERRQ(ierr); 620bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 62165e19b50SBarry Smith if (size > 1 && lu->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",lu->id.INFOG(13)); 622a58c3f20SHong Zhang if (nneg){ 623a58c3f20SHong Zhang if (!lu->myid){ 624a58c3f20SHong Zhang *nneg = lu->id.INFOG(12); 625a58c3f20SHong Zhang } 626bcb30aebSHong Zhang ierr = MPI_Bcast(nneg,1,MPI_INT,0,lu->comm_mumps);CHKERRQ(ierr); 627a58c3f20SHong Zhang } 628a58c3f20SHong Zhang if (nzero) *nzero = 0; 629d0f46423SBarry Smith if (npos) *npos = F->rmap->N - (*nneg); 630a58c3f20SHong Zhang PetscFunctionReturn(0); 631a58c3f20SHong Zhang } 632ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 633a58c3f20SHong Zhang 634397b6df1SKris Buschelman #undef __FUNCT__ 635f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 6360481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 637af281ebdSHong Zhang { 638dcd589f8SShri Abhyankar Mat_MUMPS *lu =(Mat_MUMPS*)(F)->spptr; 6396849ba73SBarry Smith PetscErrorCode ierr; 640bccb9932SShri Abhyankar MatReuse reuse; 641e09efc27SHong Zhang Mat F_diag; 642ace3abfcSBarry Smith PetscBool isMPIAIJ; 643397b6df1SKris Buschelman 644397b6df1SKris Buschelman PetscFunctionBegin; 645bccb9932SShri Abhyankar reuse = 
MAT_REUSE_MATRIX; 646bccb9932SShri Abhyankar ierr = (*lu->ConvertToTriples)(A, 1, reuse, &lu->nz, &lu->irn, &lu->jcn, &lu->val);CHKERRQ(ierr); 647397b6df1SKris Buschelman 648397b6df1SKris Buschelman /* numerical factorization phase */ 649329ec9b3SHong Zhang /*-------------------------------*/ 6503d472b54SHong Zhang lu->id.job = JOB_FACTNUMERIC; 651958c9bccSBarry Smith if(!lu->id.ICNTL(18)) { 652a7aca84bSHong Zhang if (!lu->myid) { 653397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 654397b6df1SKris Buschelman lu->id.a = (mumps_double_complex*)lu->val; 655397b6df1SKris Buschelman #else 656397b6df1SKris Buschelman lu->id.a = lu->val; 657397b6df1SKris Buschelman #endif 658397b6df1SKris Buschelman } 659397b6df1SKris Buschelman } else { 660397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 661397b6df1SKris Buschelman lu->id.a_loc = (mumps_double_complex*)lu->val; 662397b6df1SKris Buschelman #else 663397b6df1SKris Buschelman lu->id.a_loc = lu->val; 664397b6df1SKris Buschelman #endif 665397b6df1SKris Buschelman } 666397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 667397b6df1SKris Buschelman zmumps_c(&lu->id); 668397b6df1SKris Buschelman #else 669397b6df1SKris Buschelman dmumps_c(&lu->id); 670397b6df1SKris Buschelman #endif 671397b6df1SKris Buschelman if (lu->id.INFOG(1) < 0) { 67265e19b50SBarry Smith if (lu->id.INFO(1) == -13) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",lu->id.INFO(2)); 67365e19b50SBarry Smith else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",lu->id.INFO(1),lu->id.INFO(2)); 674397b6df1SKris Buschelman } 67565e19b50SBarry Smith if (!lu->myid && lu->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," lu->id.ICNTL(16):=%d\n",lu->id.INFOG(16)); 676397b6df1SKris Buschelman 6778ada1bb4SHong Zhang if (lu->size > 1){ 67816ebf90aSShri Abhyankar ierr = 
PetscTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 679a214ac2aSShri Abhyankar if(isMPIAIJ) { 680dcd589f8SShri Abhyankar F_diag = ((Mat_MPIAIJ *)(F)->data)->A; 681e09efc27SHong Zhang } else { 682dcd589f8SShri Abhyankar F_diag = ((Mat_MPISBAIJ *)(F)->data)->A; 683e09efc27SHong Zhang } 684e09efc27SHong Zhang F_diag->assembled = PETSC_TRUE; 685329ec9b3SHong Zhang if (lu->nSolve){ 6866bf464f9SBarry Smith ierr = VecScatterDestroy(&lu->scat_sol);CHKERRQ(ierr); 6870e83c824SBarry Smith ierr = PetscFree2(lu->id.sol_loc,lu->id.isol_loc);CHKERRQ(ierr); 6886bf464f9SBarry Smith ierr = VecDestroy(&lu->x_seq);CHKERRQ(ierr); 689329ec9b3SHong Zhang } 6908ada1bb4SHong Zhang } 691dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 692397b6df1SKris Buschelman lu->matstruc = SAME_NONZERO_PATTERN; 693ace87b0dSHong Zhang lu->CleanUpMUMPS = PETSC_TRUE; 694329ec9b3SHong Zhang lu->nSolve = 0; 69567877ebaSShri Abhyankar 69667877ebaSShri Abhyankar if (lu->size > 1){ 69767877ebaSShri Abhyankar /* distributed solution */ 69867877ebaSShri Abhyankar lu->id.ICNTL(21) = 1; 69967877ebaSShri Abhyankar if (!lu->nSolve){ 70067877ebaSShri Abhyankar /* Create x_seq=sol_loc for repeated use */ 70167877ebaSShri Abhyankar PetscInt lsol_loc; 70267877ebaSShri Abhyankar PetscScalar *sol_loc; 70367877ebaSShri Abhyankar lsol_loc = lu->id.INFO(23); /* length of sol_loc */ 70467877ebaSShri Abhyankar ierr = PetscMalloc2(lsol_loc,PetscScalar,&sol_loc,lsol_loc,PetscInt,&lu->id.isol_loc);CHKERRQ(ierr); 70567877ebaSShri Abhyankar lu->id.lsol_loc = lsol_loc; 70667877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 70767877ebaSShri Abhyankar lu->id.sol_loc = (mumps_double_complex*)sol_loc; 70867877ebaSShri Abhyankar #else 70967877ebaSShri Abhyankar lu->id.sol_loc = sol_loc; 71067877ebaSShri Abhyankar #endif 71167877ebaSShri Abhyankar ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,lsol_loc,sol_loc,&lu->x_seq);CHKERRQ(ierr); 71267877ebaSShri Abhyankar } 71367877ebaSShri Abhyankar } 714397b6df1SKris 
Buschelman PetscFunctionReturn(0); 715397b6df1SKris Buschelman } 716397b6df1SKris Buschelman 717dcd589f8SShri Abhyankar #undef __FUNCT__ 718dcd589f8SShri Abhyankar #define __FUNCT__ "PetscSetMUMPSOptions" 719dcd589f8SShri Abhyankar PetscErrorCode PetscSetMUMPSOptions(Mat F, Mat A) 720dcd589f8SShri Abhyankar { 721dcd589f8SShri Abhyankar Mat_MUMPS *lu = (Mat_MUMPS*)F->spptr; 722dcd589f8SShri Abhyankar PetscErrorCode ierr; 723dcd589f8SShri Abhyankar PetscInt icntl; 724ace3abfcSBarry Smith PetscBool flg; 725dcd589f8SShri Abhyankar 726dcd589f8SShri Abhyankar PetscFunctionBegin; 727dcd589f8SShri Abhyankar ierr = PetscOptionsBegin(((PetscObject)A)->comm,((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 728dcd589f8SShri Abhyankar if (lu->size == 1){ 729dcd589f8SShri Abhyankar lu->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 730dcd589f8SShri Abhyankar } else { 731dcd589f8SShri Abhyankar lu->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 732dcd589f8SShri Abhyankar } 733dcd589f8SShri Abhyankar 734dcd589f8SShri Abhyankar icntl=-1; 735dcd589f8SShri Abhyankar lu->id.ICNTL(4) = 0; /* level of printing; overwrite mumps default ICNTL(4)=2 */ 736dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",lu->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 737dcd589f8SShri Abhyankar if ((flg && icntl > 0) || PetscLogPrintInfo) { 738dcd589f8SShri Abhyankar lu->id.ICNTL(4)=icntl; /* and use mumps default icntl(i), i=1,2,3 */ 739dcd589f8SShri Abhyankar } else { /* no output */ 740dcd589f8SShri Abhyankar lu->id.ICNTL(1) = 0; /* error message, default= 6 */ 741dcd589f8SShri Abhyankar lu->id.ICNTL(2) = 0; /* output stream for diagnostic printing, statistics, and warning. 
default=0 */ 742dcd589f8SShri Abhyankar lu->id.ICNTL(3) = 0; /* output stream for global information, default=6 */ 743dcd589f8SShri Abhyankar } 744dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): column permutation and/or scaling to get a zero-free diagonal (0 to 7)","None",lu->id.ICNTL(6),&lu->id.ICNTL(6),PETSC_NULL);CHKERRQ(ierr); 745dcd589f8SShri Abhyankar icntl=-1; 746292fb18eSBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): sequential matrix ordering (0 to 7) 3 = Scotch, 5 = Metis","None",lu->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 747dcd589f8SShri Abhyankar if (flg) { 748e0b74bf9SHong Zhang if (icntl== 1 && lu->size > 1){ 749e32f2f54SBarry Smith SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 750dcd589f8SShri Abhyankar } else { 751dcd589f8SShri Abhyankar lu->id.ICNTL(7) = icntl; 752dcd589f8SShri Abhyankar } 753dcd589f8SShri Abhyankar } 754e0b74bf9SHong Zhang 755dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 7 or 77)","None",lu->id.ICNTL(8),&lu->id.ICNTL(8),PETSC_NULL);CHKERRQ(ierr); 756dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",lu->id.ICNTL(10),&lu->id.ICNTL(10),PETSC_NULL);CHKERRQ(ierr); 757dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to the linear system solved (via -ksp_view)","None",lu->id.ICNTL(11),&lu->id.ICNTL(11),PETSC_NULL);CHKERRQ(ierr); 758dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): efficiency control: defines the ordering strategy with scaling constraints (0 to 3","None",lu->id.ICNTL(12),&lu->id.ICNTL(12),PETSC_NULL);CHKERRQ(ierr); 759dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): efficiency control: with or without 
ScaLAPACK","None",lu->id.ICNTL(13),&lu->id.ICNTL(13),PETSC_NULL);CHKERRQ(ierr); 760dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage of estimated workspace increase","None",lu->id.ICNTL(14),&lu->id.ICNTL(14),PETSC_NULL);CHKERRQ(ierr); 761dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): Schur complement","None",lu->id.ICNTL(19),&lu->id.ICNTL(19),PETSC_NULL);CHKERRQ(ierr); 762dcd589f8SShri Abhyankar 763dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core facility (0 or 1)","None",lu->id.ICNTL(22),&lu->id.ICNTL(22),PETSC_NULL);CHKERRQ(ierr); 764dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",lu->id.ICNTL(23),&lu->id.ICNTL(23),PETSC_NULL);CHKERRQ(ierr); 765dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",lu->id.ICNTL(24),&lu->id.ICNTL(24),PETSC_NULL);CHKERRQ(ierr); 766d7ebd59bSHong Zhang if (lu->id.ICNTL(24)){ 767d7ebd59bSHong Zhang lu->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 768d7ebd59bSHong Zhang } 769d7ebd59bSHong Zhang 770dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): computation of a null space basis","None",lu->id.ICNTL(25),&lu->id.ICNTL(25),PETSC_NULL);CHKERRQ(ierr); 771dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): Schur options for right-hand side or solution vector","None",lu->id.ICNTL(26),&lu->id.ICNTL(26),PETSC_NULL);CHKERRQ(ierr); 772dcd589f8SShri Abhyankar ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): experimental parameter","None",lu->id.ICNTL(27),&lu->id.ICNTL(27),PETSC_NULL);CHKERRQ(ierr); 773d7ebd59bSHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, 
or 2 for parallel analysis and ictnl(29) ordering","None",lu->id.ICNTL(28),&lu->id.ICNTL(28),PETSC_NULL);CHKERRQ(ierr); 774292fb18eSBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch 2 = parmetis","None",lu->id.ICNTL(29),&lu->id.ICNTL(29),PETSC_NULL);CHKERRQ(ierr); 775dcd589f8SShri Abhyankar 776dcd589f8SShri Abhyankar ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",lu->id.CNTL(1),&lu->id.CNTL(1),PETSC_NULL);CHKERRQ(ierr); 777dcd589f8SShri Abhyankar ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",lu->id.CNTL(2),&lu->id.CNTL(2),PETSC_NULL);CHKERRQ(ierr); 778dcd589f8SShri Abhyankar ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",lu->id.CNTL(3),&lu->id.CNTL(3),PETSC_NULL);CHKERRQ(ierr); 779dcd589f8SShri Abhyankar ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",lu->id.CNTL(4),&lu->id.CNTL(4),PETSC_NULL);CHKERRQ(ierr); 780dcd589f8SShri Abhyankar ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",lu->id.CNTL(5),&lu->id.CNTL(5),PETSC_NULL);CHKERRQ(ierr); 781dcd589f8SShri Abhyankar PetscOptionsEnd(); 782dcd589f8SShri Abhyankar PetscFunctionReturn(0); 783dcd589f8SShri Abhyankar } 784dcd589f8SShri Abhyankar 785dcd589f8SShri Abhyankar #undef __FUNCT__ 786dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 787f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS* mumps) 788dcd589f8SShri Abhyankar { 789dcd589f8SShri Abhyankar PetscErrorCode ierr; 790dcd589f8SShri Abhyankar 791dcd589f8SShri Abhyankar PetscFunctionBegin; 792f697e70eSHong Zhang ierr = MPI_Comm_rank(((PetscObject)A)->comm, &mumps->myid); 793f697e70eSHong Zhang ierr = MPI_Comm_size(((PetscObject)A)->comm,&mumps->size);CHKERRQ(ierr); 794f697e70eSHong Zhang ierr = MPI_Comm_dup(((PetscObject)A)->comm,&(mumps->comm_mumps));CHKERRQ(ierr); 
795f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 796f697e70eSHong Zhang 797f697e70eSHong Zhang mumps->id.job = JOB_INIT; 798f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 799f697e70eSHong Zhang mumps->id.sym = mumps->sym; 800dcd589f8SShri Abhyankar #if defined(PETSC_USE_COMPLEX) 801f697e70eSHong Zhang zmumps_c(&mumps->id); 802dcd589f8SShri Abhyankar #else 803f697e70eSHong Zhang dmumps_c(&mumps->id); 804dcd589f8SShri Abhyankar #endif 805f697e70eSHong Zhang 806f697e70eSHong Zhang mumps->CleanUpMUMPS = PETSC_FALSE; 807f697e70eSHong Zhang mumps->scat_rhs = PETSC_NULL; 808f697e70eSHong Zhang mumps->scat_sol = PETSC_NULL; 809f697e70eSHong Zhang mumps->nSolve = 0; 810dcd589f8SShri Abhyankar PetscFunctionReturn(0); 811dcd589f8SShri Abhyankar } 812dcd589f8SShri Abhyankar 813397b6df1SKris Buschelman /* Note the Petsc r and c permutations are ignored */ 814397b6df1SKris Buschelman #undef __FUNCT__ 815f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 8160481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 817b24902e0SBarry Smith { 818719d5645SBarry Smith Mat_MUMPS *lu = (Mat_MUMPS*)F->spptr; 819dcd589f8SShri Abhyankar PetscErrorCode ierr; 820bccb9932SShri Abhyankar MatReuse reuse; 82167877ebaSShri Abhyankar Vec b; 82267877ebaSShri Abhyankar IS is_iden; 82367877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 824397b6df1SKris Buschelman 825397b6df1SKris Buschelman PetscFunctionBegin; 826b24902e0SBarry Smith lu->matstruc = DIFFERENT_NONZERO_PATTERN; 827dcd589f8SShri Abhyankar 828dcd589f8SShri Abhyankar /* Set MUMPS options */ 829dcd589f8SShri Abhyankar ierr = PetscSetMUMPSOptions(F,A);CHKERRQ(ierr); 830dcd589f8SShri Abhyankar 831bccb9932SShri Abhyankar reuse = MAT_INITIAL_MATRIX; 832bccb9932SShri Abhyankar ierr = (*lu->ConvertToTriples)(A, 1, reuse, &lu->nz, &lu->irn, &lu->jcn, &lu->val);CHKERRQ(ierr); 833dcd589f8SShri 
Abhyankar 83467877ebaSShri Abhyankar /* analysis phase */ 83567877ebaSShri Abhyankar /*----------------*/ 8363d472b54SHong Zhang lu->id.job = JOB_FACTSYMBOLIC; 83767877ebaSShri Abhyankar lu->id.n = M; 83867877ebaSShri Abhyankar switch (lu->id.ICNTL(18)){ 83967877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 84067877ebaSShri Abhyankar if (!lu->myid) { 84167877ebaSShri Abhyankar lu->id.nz =lu->nz; lu->id.irn=lu->irn; lu->id.jcn=lu->jcn; 84267877ebaSShri Abhyankar if (lu->id.ICNTL(6)>1){ 84367877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 84467877ebaSShri Abhyankar lu->id.a = (mumps_double_complex*)lu->val; 84567877ebaSShri Abhyankar #else 84667877ebaSShri Abhyankar lu->id.a = lu->val; 84767877ebaSShri Abhyankar #endif 84867877ebaSShri Abhyankar } 849e0b74bf9SHong Zhang if (lu->id.ICNTL(7) == 1){ /* use user-provide matrix ordering */ 850e0b74bf9SHong Zhang if (!lu->myid) { 851e0b74bf9SHong Zhang const PetscInt *idx; 852e0b74bf9SHong Zhang PetscInt i,*perm_in; 853e0b74bf9SHong Zhang ierr = PetscMalloc(M*sizeof(PetscInt),&perm_in);CHKERRQ(ierr); 854e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 855e0b74bf9SHong Zhang lu->id.perm_in = perm_in; 856e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! 
*/ 857e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 858e0b74bf9SHong Zhang } 859e0b74bf9SHong Zhang } 86067877ebaSShri Abhyankar } 86167877ebaSShri Abhyankar break; 86267877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 86367877ebaSShri Abhyankar lu->id.nz_loc = lu->nz; 86467877ebaSShri Abhyankar lu->id.irn_loc=lu->irn; lu->id.jcn_loc=lu->jcn; 86567877ebaSShri Abhyankar if (lu->id.ICNTL(6)>1) { 86667877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 86767877ebaSShri Abhyankar lu->id.a_loc = (mumps_double_complex*)lu->val; 86867877ebaSShri Abhyankar #else 86967877ebaSShri Abhyankar lu->id.a_loc = lu->val; 87067877ebaSShri Abhyankar #endif 87167877ebaSShri Abhyankar } 87267877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 87367877ebaSShri Abhyankar if (!lu->myid){ 87467877ebaSShri Abhyankar ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&lu->b_seq);CHKERRQ(ierr); 87567877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 87667877ebaSShri Abhyankar } else { 87767877ebaSShri Abhyankar ierr = VecCreateSeq(PETSC_COMM_SELF,0,&lu->b_seq);CHKERRQ(ierr); 87867877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 87967877ebaSShri Abhyankar } 88067877ebaSShri Abhyankar ierr = VecCreate(((PetscObject)A)->comm,&b);CHKERRQ(ierr); 88167877ebaSShri Abhyankar ierr = VecSetSizes(b,A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr); 88267877ebaSShri Abhyankar ierr = VecSetFromOptions(b);CHKERRQ(ierr); 88367877ebaSShri Abhyankar 88467877ebaSShri Abhyankar ierr = VecScatterCreate(b,is_iden,lu->b_seq,is_iden,&lu->scat_rhs);CHKERRQ(ierr); 8856bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 8866bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 88767877ebaSShri Abhyankar break; 88867877ebaSShri Abhyankar } 88967877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 89067877ebaSShri 
Abhyankar zmumps_c(&lu->id); 89167877ebaSShri Abhyankar #else 89267877ebaSShri Abhyankar dmumps_c(&lu->id); 89367877ebaSShri Abhyankar #endif 89467877ebaSShri Abhyankar if (lu->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",lu->id.INFOG(1)); 89567877ebaSShri Abhyankar 896719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 897dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 89851d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 899e0b74bf9SHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 900b24902e0SBarry Smith PetscFunctionReturn(0); 901b24902e0SBarry Smith } 902b24902e0SBarry Smith 903450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 904450b117fSShri Abhyankar #undef __FUNCT__ 905450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 906450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 907450b117fSShri Abhyankar { 908dcd589f8SShri Abhyankar 909450b117fSShri Abhyankar Mat_MUMPS *lu = (Mat_MUMPS*)F->spptr; 910dcd589f8SShri Abhyankar PetscErrorCode ierr; 911bccb9932SShri Abhyankar MatReuse reuse; 91267877ebaSShri Abhyankar Vec b; 91367877ebaSShri Abhyankar IS is_iden; 91467877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 915450b117fSShri Abhyankar 916450b117fSShri Abhyankar PetscFunctionBegin; 917450b117fSShri Abhyankar lu->matstruc = DIFFERENT_NONZERO_PATTERN; 918dcd589f8SShri Abhyankar 919dcd589f8SShri Abhyankar /* Set MUMPS options */ 920dcd589f8SShri Abhyankar ierr = PetscSetMUMPSOptions(F,A);CHKERRQ(ierr); 921dcd589f8SShri Abhyankar 922bccb9932SShri Abhyankar reuse = MAT_INITIAL_MATRIX; 923bccb9932SShri Abhyankar ierr = (*lu->ConvertToTriples)(A, 1, reuse, &lu->nz, &lu->irn, &lu->jcn, &lu->val);CHKERRQ(ierr); 92467877ebaSShri Abhyankar 92567877ebaSShri Abhyankar /* analysis phase */ 92667877ebaSShri Abhyankar /*----------------*/ 
9273d472b54SHong Zhang lu->id.job = JOB_FACTSYMBOLIC; 92867877ebaSShri Abhyankar lu->id.n = M; 92967877ebaSShri Abhyankar switch (lu->id.ICNTL(18)){ 93067877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 93167877ebaSShri Abhyankar if (!lu->myid) { 93267877ebaSShri Abhyankar lu->id.nz =lu->nz; lu->id.irn=lu->irn; lu->id.jcn=lu->jcn; 93367877ebaSShri Abhyankar if (lu->id.ICNTL(6)>1){ 93467877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 93567877ebaSShri Abhyankar lu->id.a = (mumps_double_complex*)lu->val; 93667877ebaSShri Abhyankar #else 93767877ebaSShri Abhyankar lu->id.a = lu->val; 93867877ebaSShri Abhyankar #endif 93967877ebaSShri Abhyankar } 94067877ebaSShri Abhyankar } 94167877ebaSShri Abhyankar break; 94267877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 94367877ebaSShri Abhyankar lu->id.nz_loc = lu->nz; 94467877ebaSShri Abhyankar lu->id.irn_loc=lu->irn; lu->id.jcn_loc=lu->jcn; 94567877ebaSShri Abhyankar if (lu->id.ICNTL(6)>1) { 94667877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 94767877ebaSShri Abhyankar lu->id.a_loc = (mumps_double_complex*)lu->val; 94867877ebaSShri Abhyankar #else 94967877ebaSShri Abhyankar lu->id.a_loc = lu->val; 95067877ebaSShri Abhyankar #endif 95167877ebaSShri Abhyankar } 95267877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. 
Create scatter scat_rhs for repeated use in MatSolve() */ 95367877ebaSShri Abhyankar if (!lu->myid){ 95467877ebaSShri Abhyankar ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&lu->b_seq);CHKERRQ(ierr); 95567877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 95667877ebaSShri Abhyankar } else { 95767877ebaSShri Abhyankar ierr = VecCreateSeq(PETSC_COMM_SELF,0,&lu->b_seq);CHKERRQ(ierr); 95867877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 95967877ebaSShri Abhyankar } 96067877ebaSShri Abhyankar ierr = VecCreate(((PetscObject)A)->comm,&b);CHKERRQ(ierr); 96167877ebaSShri Abhyankar ierr = VecSetSizes(b,A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr); 96267877ebaSShri Abhyankar ierr = VecSetFromOptions(b);CHKERRQ(ierr); 96367877ebaSShri Abhyankar 96467877ebaSShri Abhyankar ierr = VecScatterCreate(b,is_iden,lu->b_seq,is_iden,&lu->scat_rhs);CHKERRQ(ierr); 9656bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 9666bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 96767877ebaSShri Abhyankar break; 96867877ebaSShri Abhyankar } 96967877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 97067877ebaSShri Abhyankar zmumps_c(&lu->id); 97167877ebaSShri Abhyankar #else 97267877ebaSShri Abhyankar dmumps_c(&lu->id); 97367877ebaSShri Abhyankar #endif 97467877ebaSShri Abhyankar if (lu->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",lu->id.INFOG(1)); 97567877ebaSShri Abhyankar 976450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 977dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 97851d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 979450b117fSShri Abhyankar PetscFunctionReturn(0); 980450b117fSShri Abhyankar } 981b24902e0SBarry Smith 982141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 983397b6df1SKris Buschelman #undef __FUNCT__ 
98467877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 98567877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 986b24902e0SBarry Smith { 9872792810eSHong Zhang Mat_MUMPS *lu = (Mat_MUMPS*)F->spptr; 988dcd589f8SShri Abhyankar PetscErrorCode ierr; 989bccb9932SShri Abhyankar MatReuse reuse; 99067877ebaSShri Abhyankar Vec b; 99167877ebaSShri Abhyankar IS is_iden; 99267877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 993397b6df1SKris Buschelman 994397b6df1SKris Buschelman PetscFunctionBegin; 995b24902e0SBarry Smith lu->matstruc = DIFFERENT_NONZERO_PATTERN; 996dcd589f8SShri Abhyankar 997dcd589f8SShri Abhyankar /* Set MUMPS options */ 998dcd589f8SShri Abhyankar ierr = PetscSetMUMPSOptions(F,A);CHKERRQ(ierr); 999dcd589f8SShri Abhyankar 1000bccb9932SShri Abhyankar reuse = MAT_INITIAL_MATRIX; 1001bccb9932SShri Abhyankar ierr = (*lu->ConvertToTriples)(A, 1 , reuse, &lu->nz, &lu->irn, &lu->jcn, &lu->val);CHKERRQ(ierr); 1002dcd589f8SShri Abhyankar 100367877ebaSShri Abhyankar /* analysis phase */ 100467877ebaSShri Abhyankar /*----------------*/ 10053d472b54SHong Zhang lu->id.job = JOB_FACTSYMBOLIC; 100667877ebaSShri Abhyankar lu->id.n = M; 100767877ebaSShri Abhyankar switch (lu->id.ICNTL(18)){ 100867877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 100967877ebaSShri Abhyankar if (!lu->myid) { 101067877ebaSShri Abhyankar lu->id.nz =lu->nz; lu->id.irn=lu->irn; lu->id.jcn=lu->jcn; 101167877ebaSShri Abhyankar if (lu->id.ICNTL(6)>1){ 101267877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 101367877ebaSShri Abhyankar lu->id.a = (mumps_double_complex*)lu->val; 101467877ebaSShri Abhyankar #else 101567877ebaSShri Abhyankar lu->id.a = lu->val; 101667877ebaSShri Abhyankar #endif 101767877ebaSShri Abhyankar } 101867877ebaSShri Abhyankar } 101967877ebaSShri Abhyankar break; 102067877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 102167877ebaSShri 
Abhyankar lu->id.nz_loc = lu->nz; 102267877ebaSShri Abhyankar lu->id.irn_loc=lu->irn; lu->id.jcn_loc=lu->jcn; 102367877ebaSShri Abhyankar if (lu->id.ICNTL(6)>1) { 102467877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 102567877ebaSShri Abhyankar lu->id.a_loc = (mumps_double_complex*)lu->val; 102667877ebaSShri Abhyankar #else 102767877ebaSShri Abhyankar lu->id.a_loc = lu->val; 102867877ebaSShri Abhyankar #endif 102967877ebaSShri Abhyankar } 103067877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 103167877ebaSShri Abhyankar if (!lu->myid){ 103267877ebaSShri Abhyankar ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&lu->b_seq);CHKERRQ(ierr); 103367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 103467877ebaSShri Abhyankar } else { 103567877ebaSShri Abhyankar ierr = VecCreateSeq(PETSC_COMM_SELF,0,&lu->b_seq);CHKERRQ(ierr); 103667877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 103767877ebaSShri Abhyankar } 103867877ebaSShri Abhyankar ierr = VecCreate(((PetscObject)A)->comm,&b);CHKERRQ(ierr); 103967877ebaSShri Abhyankar ierr = VecSetSizes(b,A->rmap->n,PETSC_DECIDE);CHKERRQ(ierr); 104067877ebaSShri Abhyankar ierr = VecSetFromOptions(b);CHKERRQ(ierr); 104167877ebaSShri Abhyankar 104267877ebaSShri Abhyankar ierr = VecScatterCreate(b,is_iden,lu->b_seq,is_iden,&lu->scat_rhs);CHKERRQ(ierr); 10436bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 10446bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 104567877ebaSShri Abhyankar break; 104667877ebaSShri Abhyankar } 104767877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 104867877ebaSShri Abhyankar zmumps_c(&lu->id); 104967877ebaSShri Abhyankar #else 105067877ebaSShri Abhyankar dmumps_c(&lu->id); 105167877ebaSShri Abhyankar #endif 105267877ebaSShri Abhyankar if (lu->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by 
MUMPS in analysis phase: INFOG(1)=%d\n",lu->id.INFOG(1)); 105367877ebaSShri Abhyankar 10542792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1055dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 105651d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 1057db4efbfdSBarry Smith #if !defined(PETSC_USE_COMPLEX) 1058dcd589f8SShri Abhyankar (F)->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1059db4efbfdSBarry Smith #endif 1060b24902e0SBarry Smith PetscFunctionReturn(0); 1061b24902e0SBarry Smith } 1062b24902e0SBarry Smith 1063397b6df1SKris Buschelman #undef __FUNCT__ 106464e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 106564e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 106674ed9c26SBarry Smith { 1067f6c57405SHong Zhang PetscErrorCode ierr; 106864e6c443SBarry Smith PetscBool iascii; 106964e6c443SBarry Smith PetscViewerFormat format; 107064e6c443SBarry Smith Mat_MUMPS *lu=(Mat_MUMPS*)A->spptr; 1071f6c57405SHong Zhang 1072f6c57405SHong Zhang PetscFunctionBegin; 107364e6c443SBarry Smith /* check if matrix is mumps type */ 107464e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 107564e6c443SBarry Smith 107664e6c443SBarry Smith ierr = PetscTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 107764e6c443SBarry Smith if (iascii) { 107864e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 107964e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO){ 108064e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 108164e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",lu->id.sym);CHKERRQ(ierr); 108264e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",lu->id.par);CHKERRQ(ierr); 1083f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",lu->id.ICNTL(1));CHKERRQ(ierr); 
1084f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",lu->id.ICNTL(2));CHKERRQ(ierr); 1085f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",lu->id.ICNTL(3));CHKERRQ(ierr); 1086f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",lu->id.ICNTL(4));CHKERRQ(ierr); 1087f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",lu->id.ICNTL(5));CHKERRQ(ierr); 1088f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",lu->id.ICNTL(6));CHKERRQ(ierr); 1089d06efebcSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",lu->id.ICNTL(7));CHKERRQ(ierr); 1090f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",lu->id.ICNTL(8));CHKERRQ(ierr); 1091f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",lu->id.ICNTL(10));CHKERRQ(ierr); 1092f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",lu->id.ICNTL(11));CHKERRQ(ierr); 109334ed7027SBarry Smith if (lu->id.ICNTL(11)>0) { 109434ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",lu->id.RINFOG(4));CHKERRQ(ierr); 109534ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",lu->id.RINFOG(5));CHKERRQ(ierr); 109634ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",lu->id.RINFOG(6));CHKERRQ(ierr); 109734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",lu->id.RINFOG(7),lu->id.RINFOG(8));CHKERRQ(ierr); 109834ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",lu->id.RINFOG(9));CHKERRQ(ierr); 109934ed7027SBarry Smith 
ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",lu->id.RINFOG(10),lu->id.RINFOG(11));CHKERRQ(ierr); 1100f6c57405SHong Zhang } 1101f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",lu->id.ICNTL(12));CHKERRQ(ierr); 1102f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): %d \n",lu->id.ICNTL(13));CHKERRQ(ierr); 1103f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",lu->id.ICNTL(14));CHKERRQ(ierr); 1104f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1105f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",lu->id.ICNTL(18));CHKERRQ(ierr); 1106f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",lu->id.ICNTL(19));CHKERRQ(ierr); 1107f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",lu->id.ICNTL(20));CHKERRQ(ierr); 1108f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (solution struct): %d \n",lu->id.ICNTL(21));CHKERRQ(ierr); 1109c0165424SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",lu->id.ICNTL(22));CHKERRQ(ierr); 1110c0165424SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",lu->id.ICNTL(23));CHKERRQ(ierr); 1111c0165424SHong Zhang 1112c0165424SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",lu->id.ICNTL(24));CHKERRQ(ierr); 1113c0165424SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",lu->id.ICNTL(25));CHKERRQ(ierr); 1114c0165424SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",lu->id.ICNTL(26));CHKERRQ(ierr); 1115c0165424SHong Zhang ierr = 
PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",lu->id.ICNTL(27));CHKERRQ(ierr); 1116d06efebcSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (Use parallel or sequential ordering): %d \n",lu->id.ICNTL(28));CHKERRQ(ierr); 1117d06efebcSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (Parallel ordering): %d \n",lu->id.ICNTL(29));CHKERRQ(ierr); 1118f6c57405SHong Zhang 1119f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",lu->id.CNTL(1));CHKERRQ(ierr); 1120f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",lu->id.CNTL(2));CHKERRQ(ierr); 1121f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absolute pivoting threshold): %g \n",lu->id.CNTL(3));CHKERRQ(ierr); 1122f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (value of static pivoting): %g \n",lu->id.CNTL(4));CHKERRQ(ierr); 1123c0165424SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",lu->id.CNTL(5));CHKERRQ(ierr); 1124f6c57405SHong Zhang 1125f6c57405SHong Zhang /* infomation local to each processor */ 112634ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 11277b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 112834ed7027SBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",lu->myid,lu->id.RINFO(1));CHKERRQ(ierr); 112934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 113034ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 113134ed7027SBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",lu->myid,lu->id.RINFO(2));CHKERRQ(ierr); 113234ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 
113334ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 113434ed7027SBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",lu->myid,lu->id.RINFO(3));CHKERRQ(ierr); 113534ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1136f6c57405SHong Zhang 113734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 113834ed7027SBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",lu->myid,lu->id.INFO(15));CHKERRQ(ierr); 113934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1140f6c57405SHong Zhang 114134ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 114234ed7027SBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",lu->myid,lu->id.INFO(16));CHKERRQ(ierr); 114334ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1144f6c57405SHong Zhang 114534ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 114634ed7027SBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",lu->myid,lu->id.INFO(23));CHKERRQ(ierr); 114734ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 11487b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr); 1149f6c57405SHong Zhang 1150f6c57405SHong Zhang if (!lu->myid){ /* information from the host */ 1151f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",lu->id.RINFOG(1));CHKERRQ(ierr); 1152f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g 
\n",lu->id.RINFOG(2));CHKERRQ(ierr); 1153f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",lu->id.RINFOG(3));CHKERRQ(ierr); 1154f6c57405SHong Zhang 1155f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",lu->id.INFOG(3));CHKERRQ(ierr); 1156f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",lu->id.INFOG(4));CHKERRQ(ierr); 1157f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",lu->id.INFOG(5));CHKERRQ(ierr); 1158f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",lu->id.INFOG(6));CHKERRQ(ierr); 11592bd8dccdSBarry Smith ierr = PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",lu->id.INFOG(7));CHKERRQ(ierr); 1160f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",lu->id.INFOG(8));CHKERRQ(ierr); 1161f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",lu->id.INFOG(9));CHKERRQ(ierr); 1162f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",lu->id.INFOG(10));CHKERRQ(ierr); 1163f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",lu->id.INFOG(11));CHKERRQ(ierr); 1164f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",lu->id.INFOG(12));CHKERRQ(ierr); 1165f6c57405SHong Zhang ierr = 
PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",lu->id.INFOG(13));CHKERRQ(ierr); 1166f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",lu->id.INFOG(14));CHKERRQ(ierr); 1167f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",lu->id.INFOG(15));CHKERRQ(ierr); 1168f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",lu->id.INFOG(16));CHKERRQ(ierr); 1169f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",lu->id.INFOG(17));CHKERRQ(ierr); 1170f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",lu->id.INFOG(18));CHKERRQ(ierr); 1171f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",lu->id.INFOG(19));CHKERRQ(ierr); 1172f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",lu->id.INFOG(20));CHKERRQ(ierr); 1173f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",lu->id.INFOG(21));CHKERRQ(ierr); 1174f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",lu->id.INFOG(22));CHKERRQ(ierr); 1175f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," 
INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",lu->id.INFOG(23));CHKERRQ(ierr); 1176f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",lu->id.INFOG(24));CHKERRQ(ierr); 1177f6c57405SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",lu->id.INFOG(25));CHKERRQ(ierr); 1178f6c57405SHong Zhang } 1179f6c57405SHong Zhang } 1180cb828f0fSHong Zhang } 1181f6c57405SHong Zhang PetscFunctionReturn(0); 1182f6c57405SHong Zhang } 1183f6c57405SHong Zhang 118435bd34faSBarry Smith #undef __FUNCT__ 118535bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 118635bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 118735bd34faSBarry Smith { 1188cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 118935bd34faSBarry Smith 119035bd34faSBarry Smith PetscFunctionBegin; 119135bd34faSBarry Smith info->block_size = 1.0; 1192cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1193cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 119435bd34faSBarry Smith info->nz_unneeded = 0.0; 119535bd34faSBarry Smith info->assemblies = 0.0; 119635bd34faSBarry Smith info->mallocs = 0.0; 119735bd34faSBarry Smith info->memory = 0.0; 119835bd34faSBarry Smith info->fill_ratio_given = 0; 119935bd34faSBarry Smith info->fill_ratio_needed = 0; 120035bd34faSBarry Smith info->factor_mallocs = 0; 120135bd34faSBarry Smith PetscFunctionReturn(0); 120235bd34faSBarry Smith } 120335bd34faSBarry Smith 12045ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 12055ccb76cbSHong Zhang #undef __FUNCT__ 12065ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 12075ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 12085ccb76cbSHong Zhang { 12095ccb76cbSHong Zhang 
Mat_MUMPS *lu =(Mat_MUMPS*)F->spptr; 12105ccb76cbSHong Zhang 12115ccb76cbSHong Zhang PetscFunctionBegin; 12125ccb76cbSHong Zhang lu->id.ICNTL(icntl) = ival; 12135ccb76cbSHong Zhang PetscFunctionReturn(0); 12145ccb76cbSHong Zhang } 12155ccb76cbSHong Zhang 12165ccb76cbSHong Zhang #undef __FUNCT__ 12175ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 12185ccb76cbSHong Zhang /*@ 12195ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 12205ccb76cbSHong Zhang 12215ccb76cbSHong Zhang Logically Collective on Mat 12225ccb76cbSHong Zhang 12235ccb76cbSHong Zhang Input Parameters: 12245ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 12255ccb76cbSHong Zhang . icntl - index of MUMPS parameter array ICNTL() 12265ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 12275ccb76cbSHong Zhang 12285ccb76cbSHong Zhang Options Database: 12295ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 12305ccb76cbSHong Zhang 12315ccb76cbSHong Zhang Level: beginner 12325ccb76cbSHong Zhang 12335ccb76cbSHong Zhang References: MUMPS Users' Guide 12345ccb76cbSHong Zhang 12355ccb76cbSHong Zhang .seealso: MatGetFactor() 12365ccb76cbSHong Zhang @*/ 12375ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 12385ccb76cbSHong Zhang { 12395ccb76cbSHong Zhang PetscErrorCode ierr; 12405ccb76cbSHong Zhang 12415ccb76cbSHong Zhang PetscFunctionBegin; 12425ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 12435ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 12445ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 12455ccb76cbSHong Zhang PetscFunctionReturn(0); 12465ccb76cbSHong Zhang } 12475ccb76cbSHong Zhang 124824b6179bSKris Buschelman /*MC 12492692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 125024b6179bSKris Buschelman distributed and sequential matrices 
via the external package MUMPS. 125124b6179bSKris Buschelman 125241c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 125324b6179bSKris Buschelman 125424b6179bSKris Buschelman Options Database Keys: 1255fb8376fbSHong Zhang + -mat_mumps_icntl_4 <0,...,4> - print level 125624b6179bSKris Buschelman . -mat_mumps_icntl_6 <0,...,7> - matrix prescaling options (see MUMPS User's Guide) 125764e6c443SBarry Smith . -mat_mumps_icntl_7 <0,...,7> - matrix orderings (see MUMPS User's Guide) 125824b6179bSKris Buschelman . -mat_mumps_icntl_9 <1,2> - A or A^T x=b to be solved: 1 denotes A, 2 denotes A^T 125924b6179bSKris Buschelman . -mat_mumps_icntl_10 <n> - maximum number of iterative refinements 126094b7f48cSBarry Smith . -mat_mumps_icntl_11 <n> - error analysis, a positive value returns statistics during -ksp_view 126124b6179bSKris Buschelman . -mat_mumps_icntl_12 <n> - efficiency control (see MUMPS User's Guide) 126224b6179bSKris Buschelman . -mat_mumps_icntl_13 <n> - efficiency control (see MUMPS User's Guide) 126324b6179bSKris Buschelman . -mat_mumps_icntl_14 <n> - percentage of estimated workspace increase (see MUMPS User's Guide) 126424b6179bSKris Buschelman . -mat_mumps_icntl_15 <n> - efficiency control (see MUMPS User's Guide) 126524b6179bSKris Buschelman . -mat_mumps_cntl_1 <delta> - relative pivoting threshold 126624b6179bSKris Buschelman .
-mat_mumps_cntl_2 <tol> - stopping criterion for refinement 126724b6179bSKris Buschelman - -mat_mumps_cntl_3 <adelta> - absolute pivoting threshold 126824b6179bSKris Buschelman 126924b6179bSKris Buschelman Level: beginner 127024b6179bSKris Buschelman 127141c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 127241c8de11SBarry Smith 127324b6179bSKris Buschelman M*/ 127424b6179bSKris Buschelman 12752877fffaSHong Zhang EXTERN_C_BEGIN 127635bd34faSBarry Smith #undef __FUNCT__ 127735bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 127835bd34faSBarry Smith PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 127935bd34faSBarry Smith { 128035bd34faSBarry Smith PetscFunctionBegin; 12812692d6eeSBarry Smith *type = MATSOLVERMUMPS; 128235bd34faSBarry Smith PetscFunctionReturn(0); 128335bd34faSBarry Smith } 128435bd34faSBarry Smith EXTERN_C_END 128535bd34faSBarry Smith 128635bd34faSBarry Smith EXTERN_C_BEGIN 1287bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 12882877fffaSHong Zhang #undef __FUNCT__ 1289bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 1290bccb9932SShri Abhyankar PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 12912877fffaSHong Zhang { 12922877fffaSHong Zhang Mat B; 12932877fffaSHong Zhang PetscErrorCode ierr; 12942877fffaSHong Zhang Mat_MUMPS *mumps; 1295ace3abfcSBarry Smith PetscBool isSeqAIJ; 12962877fffaSHong Zhang 12972877fffaSHong Zhang PetscFunctionBegin; 12982877fffaSHong Zhang /* Create the factorization matrix */ 1299bccb9932SShri Abhyankar ierr = PetscTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 13002877fffaSHong Zhang ierr = MatCreate(((PetscObject)A)->comm,&B);CHKERRQ(ierr); 13012877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 13022877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 1303bccb9932SShri 
Abhyankar if (isSeqAIJ) { 13042877fffaSHong Zhang ierr = MatSeqAIJSetPreallocation(B,0,PETSC_NULL);CHKERRQ(ierr); 1305bccb9932SShri Abhyankar } else { 1306bccb9932SShri Abhyankar ierr = MatMPIAIJSetPreallocation(B,0,PETSC_NULL,0,PETSC_NULL);CHKERRQ(ierr); 1307bccb9932SShri Abhyankar } 13082877fffaSHong Zhang 130916ebf90aSShri Abhyankar ierr = PetscNewLog(B,Mat_MUMPS,&mumps);CHKERRQ(ierr); 13102877fffaSHong Zhang B->ops->view = MatView_MUMPS; 131135bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 131235bd34faSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatFactorGetSolverPackage_C","MatFactorGetSolverPackage_mumps",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 13135ccb76cbSHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMumpsSetIcntl_C","MatMumpsSetIcntl_MUMPS",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 1314450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 1315450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 1316d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 1317bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 1318bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 1319746480a1SHong Zhang mumps->sym = 0; 1320dcd589f8SShri Abhyankar } else { 132167877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 1322450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 1323bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 1324bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 13256fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 13266fdc2a6dSBarry Smith else mumps->sym = 2; 1327450b117fSShri Abhyankar } 13282877fffaSHong Zhang 13292877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 1330bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 13312877fffaSHong 
Zhang B->ops->destroy = MatDestroy_MUMPS; 13322877fffaSHong Zhang B->spptr = (void*)mumps; 1333f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1334746480a1SHong Zhang 13352877fffaSHong Zhang *F = B; 13362877fffaSHong Zhang PetscFunctionReturn(0); 13372877fffaSHong Zhang } 13382877fffaSHong Zhang EXTERN_C_END 13392877fffaSHong Zhang 1340bccb9932SShri Abhyankar 13412877fffaSHong Zhang EXTERN_C_BEGIN 1342bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 13432877fffaSHong Zhang #undef __FUNCT__ 1344bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 1345bccb9932SShri Abhyankar PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 13462877fffaSHong Zhang { 13472877fffaSHong Zhang Mat B; 13482877fffaSHong Zhang PetscErrorCode ierr; 13492877fffaSHong Zhang Mat_MUMPS *mumps; 1350ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 13512877fffaSHong Zhang 13522877fffaSHong Zhang PetscFunctionBegin; 1353e7e72b3dSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(((PetscObject)A)->comm,PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 1354bccb9932SShri Abhyankar if(A->rmap->bs > 1) SETERRQ(((PetscObject)A)->comm,PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 1355bccb9932SShri Abhyankar ierr = PetscTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 13562877fffaSHong Zhang /* Create the factorization matrix */ 13572877fffaSHong Zhang ierr = MatCreate(((PetscObject)A)->comm,&B);CHKERRQ(ierr); 13582877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 13592877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 136016ebf90aSShri Abhyankar ierr = PetscNewLog(B,Mat_MUMPS,&mumps);CHKERRQ(ierr); 1361bccb9932SShri Abhyankar if (isSeqSBAIJ) { 1362bccb9932SShri Abhyankar ierr = 
MatSeqSBAIJSetPreallocation(B,1,0,PETSC_NULL);CHKERRQ(ierr); 136316ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 1364dcd589f8SShri Abhyankar } else { 1365bccb9932SShri Abhyankar ierr = MatMPISBAIJSetPreallocation(B,1,0,PETSC_NULL,0,PETSC_NULL);CHKERRQ(ierr); 1366bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 1367bccb9932SShri Abhyankar } 1368bccb9932SShri Abhyankar 136967877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 1370bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 1371bccb9932SShri Abhyankar ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatFactorGetSolverPackage_C","MatFactorGetSolverPackage_mumps",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 1372f250808bSBarry Smith ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMumpsSetIcntl_C","MatMumpsSetIcntl",MatMumpsSetIcntl);CHKERRQ(ierr); 1373f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 13746fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 13756fdc2a6dSBarry Smith else mumps->sym = 2; 1376a214ac2aSShri Abhyankar 1377bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 1378bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 1379f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 13802877fffaSHong Zhang B->spptr = (void*)mumps; 1381f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1382746480a1SHong Zhang 13832877fffaSHong Zhang *F = B; 13842877fffaSHong Zhang PetscFunctionReturn(0); 13852877fffaSHong Zhang } 13862877fffaSHong Zhang EXTERN_C_END 138797969023SHong Zhang 1388450b117fSShri Abhyankar EXTERN_C_BEGIN 1389450b117fSShri Abhyankar #undef __FUNCT__ 1390bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 1391bccb9932SShri Abhyankar PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 139267877ebaSShri Abhyankar { 139367877ebaSShri Abhyankar Mat B; 139467877ebaSShri 
Abhyankar PetscErrorCode ierr; 139567877ebaSShri Abhyankar Mat_MUMPS *mumps; 1396ace3abfcSBarry Smith PetscBool isSeqBAIJ; 139767877ebaSShri Abhyankar 139867877ebaSShri Abhyankar PetscFunctionBegin; 139967877ebaSShri Abhyankar /* Create the factorization matrix */ 1400bccb9932SShri Abhyankar ierr = PetscTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 140167877ebaSShri Abhyankar ierr = MatCreate(((PetscObject)A)->comm,&B);CHKERRQ(ierr); 140267877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 140367877ebaSShri Abhyankar ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 1404bccb9932SShri Abhyankar if (isSeqBAIJ) { 140567877ebaSShri Abhyankar ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,PETSC_NULL);CHKERRQ(ierr); 1406bccb9932SShri Abhyankar } else { 140767877ebaSShri Abhyankar ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,PETSC_NULL,0,PETSC_NULL);CHKERRQ(ierr); 1408bccb9932SShri Abhyankar } 1409450b117fSShri Abhyankar 141067877ebaSShri Abhyankar ierr = PetscNewLog(B,Mat_MUMPS,&mumps);CHKERRQ(ierr); 1411450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 1412450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 1413450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 1414bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 1415bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 1416746480a1SHong Zhang mumps->sym = 0; 1417746480a1SHong Zhang } else { 1418746480a1SHong Zhang SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 1419450b117fSShri Abhyankar } 1420bccb9932SShri Abhyankar 1421450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 1422450b117fSShri Abhyankar ierr = 
PetscObjectComposeFunctionDynamic((PetscObject)B,"MatFactorGetSolverPackage_C","MatFactorGetSolverPackage_mumps",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 14235ccb76cbSHong Zhang ierr = PetscObjectComposeFunctionDynamic((PetscObject)B,"MatMumpsSetIcntl_C","MatMumpsSetIcntl_MUMPS",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 1424450b117fSShri Abhyankar 1425450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 1426bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 1427450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 1428450b117fSShri Abhyankar B->spptr = (void*)mumps; 1429f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1430746480a1SHong Zhang 1431450b117fSShri Abhyankar *F = B; 1432450b117fSShri Abhyankar PetscFunctionReturn(0); 1433450b117fSShri Abhyankar } 1434450b117fSShri Abhyankar EXTERN_C_END 1435a214ac2aSShri Abhyankar 1436