11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8397b6df1SKris Buschelman 9397b6df1SKris Buschelman EXTERN_C_BEGIN 10397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 112907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 122907cef9SHong Zhang #include <cmumps_c.h> 132907cef9SHong Zhang #else 14c6db04a5SJed Brown #include <zmumps_c.h> 152907cef9SHong Zhang #endif 162907cef9SHong Zhang #else 172907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 182907cef9SHong Zhang #include <smumps_c.h> 19397b6df1SKris Buschelman #else 20c6db04a5SJed Brown #include <dmumps_c.h> 21397b6df1SKris Buschelman #endif 222907cef9SHong Zhang #endif 23397b6df1SKris Buschelman EXTERN_C_END 24397b6df1SKris Buschelman #define JOB_INIT -1 253d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 263d472b54SHong Zhang #define JOB_FACTNUMERIC 2 273d472b54SHong Zhang #define JOB_SOLVE 3 28397b6df1SKris Buschelman #define JOB_END -2 293d472b54SHong Zhang 302907cef9SHong Zhang /* calls to MUMPS */ 312907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 322907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 332907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 342907cef9SHong Zhang #else 352907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 362907cef9SHong Zhang #endif 372907cef9SHong Zhang #else 382907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 392907cef9SHong Zhang #define PetscMUMPS_c smumps_c 402907cef9SHong Zhang #else 412907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 422907cef9SHong Zhang #endif 432907cef9SHong Zhang #endif 442907cef9SHong Zhang 453d472b54SHong Zhang 46397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 47397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 48397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 49397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 50a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 51397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 52adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 53397b6df1SKris Buschelman 54397b6df1SKris Buschelman typedef struct { 55397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 562907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 572907cef9SHong Zhang CMUMPS_STRUC_C id; 582907cef9SHong Zhang #else 59397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 602907cef9SHong Zhang #endif 612907cef9SHong Zhang #else 622907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 632907cef9SHong Zhang SMUMPS_STRUC_C id; 64397b6df1SKris Buschelman #else 65397b6df1SKris Buschelman DMUMPS_STRUC_C id; 66397b6df1SKris Buschelman #endif 672907cef9SHong Zhang #endif 682907cef9SHong Zhang 69397b6df1SKris Buschelman MatStructure matstruc; 70c1490034SHong Zhang PetscMPIInt myid,size; 71a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 72397b6df1SKris Buschelman PetscScalar *val; 73397b6df1SKris Buschelman MPI_Comm comm_mumps; 74329ec9b3SHong Zhang VecScatter scat_rhs, scat_sol; 7564e6c443SBarry Smith PetscBool isAIJ,CleanUpMUMPS; 76329ec9b3SHong Zhang Vec b_seq,x_seq; 77a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 782205254eSKarl Rupp 79bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 80bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 81f0c56d0fSKris Buschelman } Mat_MUMPS; 82f0c56d0fSKris Buschelman 8309573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 84b24902e0SBarry Smith 8567877ebaSShri Abhyankar 8667877ebaSShri Abhyankar /* MatConvertToTriples_A_B */ 8767877ebaSShri Abhyankar /*convert Petsc matrix to triples: row[nz], col[nz], val[nz] */ 88397b6df1SKris Buschelman /* 89397b6df1SKris Buschelman input: 9067877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 91397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 92bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 93bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 94397b6df1SKris Buschelman output: 95397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 96397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 97eb9baa12SBarry Smith 98eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 99eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 100eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 101eb9baa12SBarry Smith 102397b6df1SKris Buschelman */ 10316ebf90aSShri Abhyankar 10416ebf90aSShri Abhyankar #undef __FUNCT__ 10516ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 106bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 107b24902e0SBarry Smith { 108185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 10967877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 110dfbe8321SBarry Smith PetscErrorCode ierr; 111c1490034SHong Zhang PetscInt *row,*col; 11216ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 113397b6df1SKris Buschelman 114397b6df1SKris Buschelman PetscFunctionBegin; 11516ebf90aSShri Abhyankar *v=aa->a; 116bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 1172205254eSKarl Rupp nz = aa->nz; 1182205254eSKarl Rupp ai = aa->i; 1192205254eSKarl Rupp aj = aa->j; 12016ebf90aSShri Abhyankar *nnz = nz; 121185f6596SHong Zhang ierr = PetscMalloc(2*nz*sizeof(PetscInt), &row);CHKERRQ(ierr); 122185f6596SHong Zhang col = row + nz; 123185f6596SHong Zhang 12416ebf90aSShri Abhyankar nz = 0; 12516ebf90aSShri Abhyankar for (i=0; i<M; i++) { 12616ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 12767877ebaSShri Abhyankar ajj = aj + ai[i]; 12867877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 12967877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 13016ebf90aSShri Abhyankar } 13116ebf90aSShri Abhyankar } 13216ebf90aSShri Abhyankar *r = row; *c = col; 13316ebf90aSShri Abhyankar } 13416ebf90aSShri Abhyankar PetscFunctionReturn(0); 13516ebf90aSShri Abhyankar } 136397b6df1SKris Buschelman 13716ebf90aSShri Abhyankar #undef __FUNCT__ 13867877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 139bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 14067877ebaSShri Abhyankar { 14167877ebaSShri Abhyankar Mat_SeqBAIJ *aa=(Mat_SeqBAIJ*)A->data; 14267877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,bs=A->rmap->bs,bs2=aa->bs2,M=A->rmap->N/bs; 1430ad0caddSJed Brown PetscInt nz,idx=0,rnz,i,j,k,m; 14467877ebaSShri Abhyankar PetscErrorCode ierr; 14567877ebaSShri Abhyankar PetscInt *row,*col; 14667877ebaSShri Abhyankar 14767877ebaSShri Abhyankar PetscFunctionBegin; 148cf3759fdSShri Abhyankar *v = aa->a; 149bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 150cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 15167877ebaSShri Abhyankar nz = bs2*aa->nz; 15267877ebaSShri Abhyankar *nnz = nz; 153185f6596SHong Zhang ierr = PetscMalloc(2*nz*sizeof(PetscInt), &row);CHKERRQ(ierr); 154185f6596SHong Zhang col = row + nz; 155185f6596SHong Zhang 15667877ebaSShri Abhyankar for (i=0; i<M; i++) { 15767877ebaSShri Abhyankar ajj = aj + ai[i]; 15867877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 15967877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 16067877ebaSShri Abhyankar for (j=0; j<bs; j++) { 16167877ebaSShri Abhyankar for (m=0; m<bs; m++) { 16267877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 163cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 16467877ebaSShri Abhyankar } 16567877ebaSShri Abhyankar } 16667877ebaSShri Abhyankar } 16767877ebaSShri Abhyankar } 168cf3759fdSShri Abhyankar *r = row; *c = col; 16967877ebaSShri Abhyankar } 17067877ebaSShri Abhyankar PetscFunctionReturn(0); 17167877ebaSShri Abhyankar } 17267877ebaSShri Abhyankar 17367877ebaSShri Abhyankar #undef __FUNCT__ 17416ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 175bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 17616ebf90aSShri Abhyankar { 17767877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 17867877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 17916ebf90aSShri Abhyankar PetscErrorCode ierr; 18016ebf90aSShri Abhyankar PetscInt *row,*col; 18116ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 18216ebf90aSShri Abhyankar 18316ebf90aSShri Abhyankar PetscFunctionBegin; 184882afa5aSHong Zhang *v = aa->a; 185bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 1862205254eSKarl Rupp nz = aa->nz; 1872205254eSKarl Rupp ai = aa->i; 1882205254eSKarl Rupp aj = aa->j; 1892205254eSKarl Rupp *v = aa->a; 19016ebf90aSShri Abhyankar *nnz = nz; 191185f6596SHong Zhang ierr = PetscMalloc(2*nz*sizeof(PetscInt), &row);CHKERRQ(ierr); 192185f6596SHong Zhang col = row + nz; 193185f6596SHong Zhang 19416ebf90aSShri Abhyankar nz = 0; 19516ebf90aSShri Abhyankar for (i=0; i<M; i++) { 19616ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 19767877ebaSShri Abhyankar ajj = aj + ai[i]; 19867877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 19967877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 20016ebf90aSShri Abhyankar } 20116ebf90aSShri Abhyankar } 20216ebf90aSShri Abhyankar *r = row; *c = col; 20316ebf90aSShri Abhyankar } 20416ebf90aSShri Abhyankar PetscFunctionReturn(0); 20516ebf90aSShri Abhyankar } 20616ebf90aSShri Abhyankar 20716ebf90aSShri Abhyankar #undef __FUNCT__ 20816ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 209bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 21016ebf90aSShri Abhyankar { 21167877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 21267877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 21367877ebaSShri Abhyankar const PetscScalar *av,*v1; 21416ebf90aSShri Abhyankar PetscScalar *val; 21516ebf90aSShri Abhyankar PetscErrorCode ierr; 21616ebf90aSShri Abhyankar PetscInt *row,*col; 21716ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 21816ebf90aSShri Abhyankar 21916ebf90aSShri Abhyankar PetscFunctionBegin; 22016ebf90aSShri Abhyankar ai =aa->i; aj=aa->j;av=aa->a; 22116ebf90aSShri Abhyankar adiag=aa->diag; 222bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 22316ebf90aSShri Abhyankar nz = M + (aa->nz-M)/2; 22416ebf90aSShri Abhyankar *nnz = nz; 225185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 226185f6596SHong Zhang col = row + nz; 227185f6596SHong Zhang val = (PetscScalar*)(col + nz); 228185f6596SHong Zhang 22916ebf90aSShri Abhyankar nz = 0; 23016ebf90aSShri Abhyankar for (i=0; i<M; i++) { 23116ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 23267877ebaSShri Abhyankar ajj = aj + adiag[i]; 233cf3759fdSShri Abhyankar v1 = av + adiag[i]; 23467877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 23567877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 23616ebf90aSShri Abhyankar } 23716ebf90aSShri Abhyankar } 23816ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 239397b6df1SKris Buschelman } else { 24016ebf90aSShri Abhyankar nz = 0; val = *v; 24116ebf90aSShri Abhyankar for (i=0; i <M; i++) { 24216ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 24367877ebaSShri Abhyankar ajj = aj + adiag[i]; 24467877ebaSShri Abhyankar v1 = av + adiag[i]; 24567877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 24667877ebaSShri Abhyankar val[nz++] = v1[j]; 24716ebf90aSShri Abhyankar } 24816ebf90aSShri Abhyankar } 24916ebf90aSShri Abhyankar } 25016ebf90aSShri Abhyankar PetscFunctionReturn(0); 25116ebf90aSShri Abhyankar } 25216ebf90aSShri Abhyankar 25316ebf90aSShri Abhyankar #undef __FUNCT__ 25416ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 255bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 25616ebf90aSShri Abhyankar { 25716ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 25816ebf90aSShri Abhyankar PetscErrorCode ierr; 25916ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 26016ebf90aSShri Abhyankar PetscInt *row,*col; 26116ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 26216ebf90aSShri Abhyankar PetscScalar *val; 263397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 264397b6df1SKris Buschelman Mat_SeqSBAIJ *aa = (Mat_SeqSBAIJ*)(mat->A)->data; 265397b6df1SKris Buschelman Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 26616ebf90aSShri Abhyankar 26716ebf90aSShri Abhyankar PetscFunctionBegin; 268d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 269397b6df1SKris Buschelman av=aa->a; bv=bb->a; 270397b6df1SKris Buschelman 2712205254eSKarl Rupp garray = mat->garray; 2722205254eSKarl Rupp 273bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 27416ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 27516ebf90aSShri Abhyankar *nnz = nz; 276185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 277185f6596SHong Zhang col = row + nz; 278185f6596SHong Zhang val = (PetscScalar*)(col + nz); 279185f6596SHong Zhang 280397b6df1SKris Buschelman *r = row; *c = col; *v = val; 281397b6df1SKris Buschelman } else { 282397b6df1SKris Buschelman row = *r; col = *c; val = *v; 283397b6df1SKris Buschelman } 284397b6df1SKris Buschelman 285028e57e8SHong Zhang jj = 0; irow = rstart; 286397b6df1SKris Buschelman for (i=0; i<m; i++) { 287397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 288397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 289397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 290397b6df1SKris Buschelman bjj = bj + bi[i]; 29116ebf90aSShri Abhyankar v1 = av + ai[i]; 29216ebf90aSShri Abhyankar v2 = bv + bi[i]; 293397b6df1SKris Buschelman 294397b6df1SKris Buschelman /* A-part */ 295397b6df1SKris Buschelman for (j=0; j<countA; j++) { 296bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 297397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 298397b6df1SKris Buschelman } 29916ebf90aSShri Abhyankar val[jj++] = v1[j]; 300397b6df1SKris Buschelman } 30116ebf90aSShri Abhyankar 30216ebf90aSShri Abhyankar /* B-part */ 30316ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 304bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 305397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 306397b6df1SKris Buschelman } 30716ebf90aSShri Abhyankar val[jj++] = v2[j]; 30816ebf90aSShri Abhyankar } 30916ebf90aSShri Abhyankar irow++; 31016ebf90aSShri Abhyankar } 31116ebf90aSShri Abhyankar PetscFunctionReturn(0); 31216ebf90aSShri Abhyankar } 31316ebf90aSShri Abhyankar 31416ebf90aSShri Abhyankar #undef __FUNCT__ 31516ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 316bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 31716ebf90aSShri Abhyankar { 31816ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 31916ebf90aSShri Abhyankar PetscErrorCode ierr; 32016ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 32116ebf90aSShri Abhyankar PetscInt *row,*col; 32216ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 32316ebf90aSShri Abhyankar PetscScalar *val; 32416ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 32516ebf90aSShri Abhyankar Mat_SeqAIJ *aa = (Mat_SeqAIJ*)(mat->A)->data; 32616ebf90aSShri Abhyankar Mat_SeqAIJ *bb = (Mat_SeqAIJ*)(mat->B)->data; 32716ebf90aSShri Abhyankar 32816ebf90aSShri Abhyankar PetscFunctionBegin; 32916ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 33016ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 33116ebf90aSShri Abhyankar 3322205254eSKarl Rupp garray = mat->garray; 3332205254eSKarl Rupp 334bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 33516ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 33616ebf90aSShri Abhyankar *nnz = nz; 337185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 338185f6596SHong Zhang col = row + nz; 339185f6596SHong Zhang val = (PetscScalar*)(col + nz); 340185f6596SHong Zhang 34116ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 34216ebf90aSShri Abhyankar } else { 34316ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 34416ebf90aSShri Abhyankar } 34516ebf90aSShri Abhyankar 34616ebf90aSShri Abhyankar jj = 0; irow = rstart; 34716ebf90aSShri Abhyankar for (i=0; i<m; i++) { 34816ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 34916ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 35016ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 35116ebf90aSShri Abhyankar bjj = bj + bi[i]; 35216ebf90aSShri Abhyankar v1 = av + ai[i]; 35316ebf90aSShri Abhyankar v2 = bv + bi[i]; 35416ebf90aSShri Abhyankar 35516ebf90aSShri Abhyankar /* A-part */ 35616ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 357bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 35816ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 35916ebf90aSShri Abhyankar } 36016ebf90aSShri Abhyankar val[jj++] = v1[j]; 36116ebf90aSShri Abhyankar } 36216ebf90aSShri Abhyankar 36316ebf90aSShri Abhyankar /* B-part */ 36416ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 365bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 36616ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 36716ebf90aSShri Abhyankar } 36816ebf90aSShri Abhyankar val[jj++] = v2[j]; 36916ebf90aSShri Abhyankar } 37016ebf90aSShri Abhyankar irow++; 37116ebf90aSShri Abhyankar } 37216ebf90aSShri Abhyankar PetscFunctionReturn(0); 37316ebf90aSShri Abhyankar } 37416ebf90aSShri Abhyankar 37516ebf90aSShri Abhyankar #undef __FUNCT__ 37667877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij" 377bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 37867877ebaSShri Abhyankar { 37967877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 38067877ebaSShri Abhyankar Mat_SeqBAIJ *aa = (Mat_SeqBAIJ*)(mat->A)->data; 38167877ebaSShri Abhyankar Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 38267877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 383d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 38467877ebaSShri Abhyankar const PetscInt bs = A->rmap->bs,bs2=mat->bs2; 38567877ebaSShri Abhyankar PetscErrorCode ierr; 38667877ebaSShri Abhyankar PetscInt nz,i,j,k,n,jj,irow,countA,countB,idx; 38767877ebaSShri Abhyankar PetscInt *row,*col; 38867877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 38967877ebaSShri Abhyankar PetscScalar *val; 39067877ebaSShri Abhyankar 39167877ebaSShri Abhyankar PetscFunctionBegin; 392bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 39367877ebaSShri Abhyankar nz = bs2*(aa->nz + bb->nz); 39467877ebaSShri Abhyankar *nnz = nz; 395185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 396185f6596SHong Zhang col = row + nz; 397185f6596SHong Zhang val = (PetscScalar*)(col + nz); 398185f6596SHong Zhang 39967877ebaSShri Abhyankar *r = row; *c = col; *v = val; 40067877ebaSShri Abhyankar } else { 40167877ebaSShri Abhyankar row = *r; col = *c; val = *v; 40267877ebaSShri Abhyankar } 40367877ebaSShri Abhyankar 404d985c460SShri Abhyankar jj = 0; irow = rstart; 40567877ebaSShri Abhyankar for (i=0; i<mbs; i++) { 40667877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 40767877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 40867877ebaSShri Abhyankar ajj = aj + ai[i]; 40967877ebaSShri Abhyankar bjj = bj + bi[i]; 41067877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 41167877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 41267877ebaSShri Abhyankar 41367877ebaSShri Abhyankar idx = 0; 41467877ebaSShri Abhyankar /* A-part */ 41567877ebaSShri Abhyankar for (k=0; k<countA; k++) { 41667877ebaSShri Abhyankar for (j=0; j<bs; j++) { 41767877ebaSShri Abhyankar for (n=0; n<bs; n++) { 418bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 419d985c460SShri Abhyankar row[jj] = irow + n + shift; 420d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 42167877ebaSShri Abhyankar } 42267877ebaSShri Abhyankar val[jj++] = v1[idx++]; 42367877ebaSShri Abhyankar } 42467877ebaSShri Abhyankar } 42567877ebaSShri Abhyankar } 42667877ebaSShri Abhyankar 42767877ebaSShri Abhyankar idx = 0; 42867877ebaSShri Abhyankar /* B-part */ 42967877ebaSShri Abhyankar for (k=0; k<countB; k++) { 43067877ebaSShri Abhyankar for (j=0; j<bs; j++) { 43167877ebaSShri Abhyankar for (n=0; n<bs; n++) { 432bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 433d985c460SShri Abhyankar row[jj] = irow + n + shift; 434d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 43567877ebaSShri Abhyankar } 436d985c460SShri Abhyankar val[jj++] = v2[idx++]; 43767877ebaSShri Abhyankar } 43867877ebaSShri Abhyankar } 43967877ebaSShri Abhyankar } 440d985c460SShri Abhyankar irow += bs; 44167877ebaSShri Abhyankar } 44267877ebaSShri Abhyankar PetscFunctionReturn(0); 44367877ebaSShri Abhyankar } 44467877ebaSShri Abhyankar 44567877ebaSShri Abhyankar #undef __FUNCT__ 44616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 447bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 44816ebf90aSShri Abhyankar { 44916ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 45016ebf90aSShri Abhyankar PetscErrorCode ierr; 451e0bace9bSHong Zhang PetscInt rstart,nz,nza,nzb,i,j,jj,irow,countA,countB; 45216ebf90aSShri Abhyankar PetscInt *row,*col; 45316ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 45416ebf90aSShri Abhyankar PetscScalar *val; 45516ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 45616ebf90aSShri Abhyankar Mat_SeqAIJ *aa =(Mat_SeqAIJ*)(mat->A)->data; 45716ebf90aSShri Abhyankar Mat_SeqAIJ *bb =(Mat_SeqAIJ*)(mat->B)->data; 45816ebf90aSShri Abhyankar 45916ebf90aSShri Abhyankar PetscFunctionBegin; 46016ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 46116ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 46216ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 4632205254eSKarl Rupp 46416ebf90aSShri Abhyankar rstart = A->rmap->rstart; 46516ebf90aSShri Abhyankar 466bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 467e0bace9bSHong Zhang nza = 0; /* num of upper triangular entries in mat->A, including diagonals */ 468e0bace9bSHong Zhang nzb = 0; /* num of upper triangular entries in mat->B */ 46916ebf90aSShri Abhyankar for (i=0; i<m; i++) { 470e0bace9bSHong Zhang nza += (ai[i+1] - adiag[i]); 47116ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 47216ebf90aSShri Abhyankar bjj = bj + bi[i]; 473e0bace9bSHong Zhang for (j=0; j<countB; j++) { 474e0bace9bSHong Zhang if (garray[bjj[j]] > rstart) nzb++; 475e0bace9bSHong Zhang } 476e0bace9bSHong Zhang } 47716ebf90aSShri Abhyankar 478e0bace9bSHong Zhang nz = nza + nzb; /* total nz of upper triangular part of mat */ 47916ebf90aSShri Abhyankar *nnz = nz; 480185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 481185f6596SHong Zhang col = row + nz; 482185f6596SHong Zhang val = (PetscScalar*)(col + nz); 483185f6596SHong Zhang 48416ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 48516ebf90aSShri Abhyankar } else { 48616ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 48716ebf90aSShri Abhyankar } 48816ebf90aSShri Abhyankar 48916ebf90aSShri Abhyankar jj = 0; irow = rstart; 49016ebf90aSShri Abhyankar for (i=0; i<m; i++) { 49116ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 49216ebf90aSShri Abhyankar v1 = av + adiag[i]; 49316ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 49416ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 49516ebf90aSShri Abhyankar bjj = bj + bi[i]; 49616ebf90aSShri Abhyankar v2 = bv + bi[i]; 49716ebf90aSShri Abhyankar 49816ebf90aSShri Abhyankar /* A-part */ 49916ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 500bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 50116ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 50216ebf90aSShri Abhyankar } 50316ebf90aSShri Abhyankar val[jj++] = v1[j]; 50416ebf90aSShri Abhyankar } 50516ebf90aSShri Abhyankar 50616ebf90aSShri Abhyankar /* B-part */ 50716ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 50816ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 509bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 51016ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 51116ebf90aSShri Abhyankar } 51216ebf90aSShri Abhyankar val[jj++] = v2[j]; 51316ebf90aSShri Abhyankar } 514397b6df1SKris Buschelman } 515397b6df1SKris Buschelman irow++; 516397b6df1SKris Buschelman } 517397b6df1SKris Buschelman PetscFunctionReturn(0); 518397b6df1SKris Buschelman } 519397b6df1SKris Buschelman 520397b6df1SKris Buschelman #undef __FUNCT__ 5213924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 522dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A) 523dfbe8321SBarry Smith { 524a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 525dfbe8321SBarry Smith PetscErrorCode ierr; 526b24902e0SBarry Smith 527397b6df1SKris Buschelman PetscFunctionBegin; 528a5e57a09SHong Zhang if (mumps->CleanUpMUMPS) { 529397b6df1SKris Buschelman /* Terminate instance, deallocate memories */ 530a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 531a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr); 532a5e57a09SHong Zhang ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr); 533a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 534a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 535a5e57a09SHong Zhang ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr); 536a5e57a09SHong Zhang ierr = PetscFree(mumps->irn);CHKERRQ(ierr); 5372205254eSKarl Rupp 538a5e57a09SHong Zhang mumps->id.job = JOB_END; 539a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 540a5e57a09SHong Zhang ierr = MPI_Comm_free(&(mumps->comm_mumps));CHKERRQ(ierr); 541397b6df1SKris Buschelman } 542a5e57a09SHong Zhang if (mumps->Destroy) { 543a5e57a09SHong Zhang ierr = (mumps->Destroy)(A);CHKERRQ(ierr); 544bf0cc555SLisandro Dalcin } 545bf0cc555SLisandro Dalcin ierr = PetscFree(A->spptr);CHKERRQ(ierr); 546bf0cc555SLisandro Dalcin 54797969023SHong Zhang /* clear composed functions */ 548bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr); 549bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr); 550bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr); 551397b6df1SKris Buschelman PetscFunctionReturn(0); 552397b6df1SKris Buschelman } 553397b6df1SKris Buschelman 554397b6df1SKris Buschelman #undef __FUNCT__ 555f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 556b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 557b24902e0SBarry Smith { 558a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 559d54de34fSKris Buschelman PetscScalar *array; 56067877ebaSShri Abhyankar Vec b_seq; 561329ec9b3SHong Zhang IS is_iden,is_petsc; 562dfbe8321SBarry Smith PetscErrorCode ierr; 563329ec9b3SHong Zhang PetscInt i; 564883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 565397b6df1SKris Buschelman 566397b6df1SKris Buschelman PetscFunctionBegin; 567883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 568883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 569a5e57a09SHong Zhang mumps->id.nrhs = 1; 570a5e57a09SHong Zhang b_seq = mumps->b_seq; 571a5e57a09SHong Zhang if (mumps->size > 1) { 572329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */ 573a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 574a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 575a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 576397b6df1SKris Buschelman } else { /* size == 1 */ 577397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 578397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 579397b6df1SKris Buschelman } 580a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 581a5e57a09SHong Zhang mumps->id.nrhs = 1; 582397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 5832907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 584a5e57a09SHong Zhang mumps->id.rhs = (mumps_complex*)array; 5852907cef9SHong Zhang #else 586a5e57a09SHong Zhang mumps->id.rhs = (mumps_double_complex*)array; 5872907cef9SHong Zhang #endif 588397b6df1SKris Buschelman #else 589a5e57a09SHong Zhang mumps->id.rhs = array; 590397b6df1SKris Buschelman #endif 591397b6df1SKris Buschelman } 592397b6df1SKris Buschelman 593397b6df1SKris Buschelman /* solve phase */ 594329ec9b3SHong Zhang /*-------------*/ 595a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 596a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 597a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 598397b6df1SKris Buschelman 599a5e57a09SHong Zhang if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 600a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 601a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 602a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 603397b6df1SKris Buschelman } 604a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 605a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 606a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 607a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 608a5e57a09SHong Zhang } 609a5e57a09SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 610a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 6116bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 6126bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 6132205254eSKarl Rupp 614a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 615397b6df1SKris Buschelman } 616a5e57a09SHong Zhang 617a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 618a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 619329ec9b3SHong Zhang } 620397b6df1SKris Buschelman PetscFunctionReturn(0); 621397b6df1SKris Buschelman } 622397b6df1SKris Buschelman 62351d5961aSHong Zhang #undef __FUNCT__ 62451d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 62551d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 62651d5961aSHong Zhang { 627a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 62851d5961aSHong Zhang PetscErrorCode ierr; 62951d5961aSHong Zhang 63051d5961aSHong Zhang PetscFunctionBegin; 631a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 6322205254eSKarl Rupp 6330ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 6342205254eSKarl Rupp 635a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 63651d5961aSHong Zhang PetscFunctionReturn(0); 63751d5961aSHong Zhang } 63851d5961aSHong Zhang 639e0b74bf9SHong Zhang #undef __FUNCT__ 640e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 641e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 642e0b74bf9SHong Zhang { 643bda8bf91SBarry Smith PetscErrorCode ierr; 644bda8bf91SBarry Smith PetscBool flg; 645bda8bf91SBarry Smith 646e0b74bf9SHong Zhang PetscFunctionBegin; 6470298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 648ce94432eSBarry Smith if (!flg) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 6490298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 650ce94432eSBarry Smith if (!flg) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 6512205254eSKarl Rupp SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MatMatSolve_MUMPS() is not implemented yet"); 652e0b74bf9SHong Zhang PetscFunctionReturn(0); 653e0b74bf9SHong Zhang } 654e0b74bf9SHong Zhang 655ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 656a58c3f20SHong Zhang /* 657a58c3f20SHong Zhang input: 658a58c3f20SHong Zhang F: numeric factor 659a58c3f20SHong Zhang output: 660a58c3f20SHong Zhang nneg: total number of negative pivots 661a58c3f20SHong Zhang nzero: 0 662a58c3f20SHong Zhang npos: (global dimension of F) - nneg 663a58c3f20SHong Zhang */ 664a58c3f20SHong Zhang 665a58c3f20SHong Zhang #undef __FUNCT__ 666a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 667dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 668a58c3f20SHong Zhang { 669a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 670dfbe8321SBarry Smith PetscErrorCode ierr; 671c1490034SHong Zhang PetscMPIInt size; 672a58c3f20SHong Zhang 673a58c3f20SHong Zhang PetscFunctionBegin; 674ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 675bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 676a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 677a58c3f20SHong Zhang if (nneg) { 678a5e57a09SHong Zhang if (!mumps->myid) { 679a5e57a09SHong Zhang *nneg = mumps->id.INFOG(12); 680a58c3f20SHong Zhang } 681a5e57a09SHong Zhang ierr = MPI_Bcast(nneg,1,MPI_INT,0,mumps->comm_mumps);CHKERRQ(ierr); 682a58c3f20SHong Zhang } 683a58c3f20SHong Zhang if (nzero) *nzero = 0; 684d0f46423SBarry Smith if (npos) *npos = F->rmap->N - (*nneg); 685a58c3f20SHong Zhang PetscFunctionReturn(0); 686a58c3f20SHong Zhang } 687ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 688a58c3f20SHong Zhang 689397b6df1SKris Buschelman #undef __FUNCT__ 690f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 6910481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 692af281ebdSHong Zhang { 693a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->spptr; 6946849ba73SBarry Smith PetscErrorCode ierr; 695e09efc27SHong Zhang Mat F_diag; 696ace3abfcSBarry Smith PetscBool isMPIAIJ; 697397b6df1SKris Buschelman 698397b6df1SKris Buschelman PetscFunctionBegin; 699a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 700397b6df1SKris Buschelman 701397b6df1SKris Buschelman /* numerical factorization phase */ 702329ec9b3SHong Zhang /*-------------------------------*/ 703a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 704a5e57a09SHong Zhang if (!mumps->id.ICNTL(18)) { 705a5e57a09SHong Zhang if (!mumps->myid) { 706397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 7072907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 708a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 7092907cef9SHong Zhang #else 710a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 7112907cef9SHong Zhang #endif 712397b6df1SKris Buschelman #else 713a5e57a09SHong Zhang mumps->id.a = mumps->val; 714397b6df1SKris Buschelman #endif 715397b6df1SKris Buschelman } 716397b6df1SKris Buschelman } else { 717397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 7182907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 719a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 7202907cef9SHong Zhang #else 721a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 7222907cef9SHong Zhang #endif 723397b6df1SKris Buschelman #else 724a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 725397b6df1SKris Buschelman #endif 726397b6df1SKris Buschelman } 727a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 728a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 729a5e57a09SHong Zhang if (mumps->id.INFO(1) == -13) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",mumps->id.INFO(2)); 730a5e57a09SHong Zhang else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2)); 731397b6df1SKris Buschelman } 732a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 733397b6df1SKris Buschelman 734a5e57a09SHong Zhang if (mumps->size > 1) { 735251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 7362205254eSKarl Rupp if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A; 7372205254eSKarl Rupp else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A; 738e09efc27SHong Zhang F_diag->assembled = PETSC_TRUE; 739a5e57a09SHong Zhang if (mumps->scat_sol) { 740a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 741a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 742a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 743329ec9b3SHong Zhang } 7448ada1bb4SHong Zhang } 745dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 746a5e57a09SHong Zhang mumps->matstruc = SAME_NONZERO_PATTERN; 747a5e57a09SHong Zhang mumps->CleanUpMUMPS = PETSC_TRUE; 74867877ebaSShri Abhyankar 749a5e57a09SHong Zhang if (mumps->size > 1) { 75067877ebaSShri Abhyankar /* distributed solution */ 751a5e57a09SHong Zhang if (!mumps->scat_sol) { 75267877ebaSShri Abhyankar /* Create x_seq=sol_loc for repeated use */ 75367877ebaSShri Abhyankar PetscInt lsol_loc; 75467877ebaSShri Abhyankar PetscScalar *sol_loc; 7552205254eSKarl Rupp 756a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 7572205254eSKarl Rupp 758*dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 7592205254eSKarl Rupp 760a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 76167877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 7622907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 763a5e57a09SHong Zhang mumps->id.sol_loc = (mumps_complex*)sol_loc; 7642907cef9SHong Zhang #else 765a5e57a09SHong Zhang mumps->id.sol_loc = (mumps_double_complex*)sol_loc; 7662907cef9SHong Zhang #endif 76767877ebaSShri Abhyankar #else 768a5e57a09SHong Zhang mumps->id.sol_loc = sol_loc; 76967877ebaSShri Abhyankar #endif 770a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 77167877ebaSShri Abhyankar } 77267877ebaSShri Abhyankar } 773397b6df1SKris Buschelman PetscFunctionReturn(0); 774397b6df1SKris Buschelman } 775397b6df1SKris Buschelman 7769a2535b5SHong Zhang /* Sets MUMPS options from the options database */ 777dcd589f8SShri Abhyankar #undef __FUNCT__ 7789a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 7799a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A) 780dcd589f8SShri Abhyankar { 7819a2535b5SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 782dcd589f8SShri Abhyankar PetscErrorCode ierr; 783dcd589f8SShri Abhyankar PetscInt icntl; 784ace3abfcSBarry Smith PetscBool flg; 785dcd589f8SShri Abhyankar 786dcd589f8SShri Abhyankar PetscFunctionBegin; 787ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 7889a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 7899a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 7909a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 7919a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 7929a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 7939a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 794dcd589f8SShri Abhyankar 7959a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 7969a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 7979a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 7989a2535b5SHong Zhang 7999a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permuting and/or scaling the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 8009a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 8019a2535b5SHong Zhang 8029a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): matrix ordering (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 803dcd589f8SShri Abhyankar if (flg) { 8042205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 8052205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 806dcd589f8SShri Abhyankar } 807e0b74bf9SHong Zhang 8080298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 8090298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 8100298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to the linear system solved (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 8110298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): efficiency control: defines the ordering strategy with scaling constraints (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 8120298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): efficiency control: with or without ScaLAPACK","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 8130298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage of estimated workspace increase","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 8140298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 8159a2535b5SHong Zhang 8160298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core facility (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 8170298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 8180298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 8199a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 8209a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 821d7ebd59bSHong Zhang } 822d7ebd59bSHong Zhang 8230298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): computation of a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 8240298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): Schur options for right-hand side or solution vector","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 8250298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): experimental parameter","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 8260298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 8270298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 8280298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 8290298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): factors can be discarded in the solve phase","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 8300298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 831dcd589f8SShri Abhyankar 8320298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 8330298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 8340298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 8350298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 8360298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 837e5bb22a1SHong Zhang 8380298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 839dcd589f8SShri Abhyankar PetscOptionsEnd(); 840dcd589f8SShri Abhyankar PetscFunctionReturn(0); 841dcd589f8SShri Abhyankar } 842dcd589f8SShri Abhyankar 843dcd589f8SShri Abhyankar #undef __FUNCT__ 844dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 845f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 846dcd589f8SShri Abhyankar { 847dcd589f8SShri Abhyankar PetscErrorCode ierr; 848dcd589f8SShri Abhyankar 849dcd589f8SShri Abhyankar PetscFunctionBegin; 850ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 851ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 852ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 8532205254eSKarl Rupp 854f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 855f697e70eSHong Zhang 856f697e70eSHong Zhang mumps->id.job = JOB_INIT; 857f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 858f697e70eSHong Zhang mumps->id.sym = mumps->sym; 8592907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 860f697e70eSHong Zhang 861f697e70eSHong Zhang mumps->CleanUpMUMPS = PETSC_FALSE; 8620298fd71SBarry Smith mumps->scat_rhs = NULL; 8630298fd71SBarry Smith mumps->scat_sol = NULL; 8649a2535b5SHong Zhang 86570544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 8669a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 8679a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 8689a2535b5SHong Zhang if (mumps->size == 1) { 8699a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 8709a2535b5SHong Zhang } else { 8719a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 87270544d5fSHong Zhang mumps->id.ICNTL(21) = 1; /* distributed solution */ 8739a2535b5SHong Zhang } 874dcd589f8SShri Abhyankar PetscFunctionReturn(0); 875dcd589f8SShri Abhyankar } 876dcd589f8SShri Abhyankar 877a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 878397b6df1SKris Buschelman #undef __FUNCT__ 879f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 8800481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 881b24902e0SBarry Smith { 882a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 883dcd589f8SShri Abhyankar PetscErrorCode ierr; 88467877ebaSShri Abhyankar Vec b; 88567877ebaSShri Abhyankar IS is_iden; 88667877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 887397b6df1SKris Buschelman 888397b6df1SKris Buschelman PetscFunctionBegin; 889a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 890dcd589f8SShri Abhyankar 8919a2535b5SHong Zhang /* Set MUMPS options from the options database */ 8929a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 893dcd589f8SShri Abhyankar 894a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 895dcd589f8SShri Abhyankar 89667877ebaSShri Abhyankar /* analysis phase */ 89767877ebaSShri Abhyankar /*----------------*/ 898a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 899a5e57a09SHong Zhang mumps->id.n = M; 900a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 90167877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 902a5e57a09SHong Zhang if (!mumps->myid) { 903a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 904a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 90567877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 9062907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 907a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 9082907cef9SHong Zhang #else 909a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 9102907cef9SHong Zhang #endif 91167877ebaSShri Abhyankar #else 912a5e57a09SHong Zhang mumps->id.a = mumps->val; 91367877ebaSShri Abhyankar #endif 91467877ebaSShri Abhyankar } 915a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */ 9165248a706SHong Zhang /* 9175248a706SHong Zhang PetscBool flag; 9185248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 9195248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 9205248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 9215248a706SHong Zhang */ 922a5e57a09SHong Zhang if (!mumps->myid) { 923e0b74bf9SHong Zhang const PetscInt *idx; 924e0b74bf9SHong Zhang PetscInt i,*perm_in; 9252205254eSKarl Rupp 926e0b74bf9SHong Zhang ierr = PetscMalloc(M*sizeof(PetscInt),&perm_in);CHKERRQ(ierr); 927e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 9282205254eSKarl Rupp 929a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 930e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! */ 931e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 932e0b74bf9SHong Zhang } 933e0b74bf9SHong Zhang } 93467877ebaSShri Abhyankar } 93567877ebaSShri Abhyankar break; 93667877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 937a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 938a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 939a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 94067877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 9412907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 942a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 9432907cef9SHong Zhang #else 944a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 9452907cef9SHong Zhang #endif 94667877ebaSShri Abhyankar #else 947a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 94867877ebaSShri Abhyankar #endif 94967877ebaSShri Abhyankar } 95067877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 951a5e57a09SHong Zhang if (!mumps->myid) { 952a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 95367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 95467877ebaSShri Abhyankar } else { 955a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 95667877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 95767877ebaSShri Abhyankar } 958c0dedaeaSBarry Smith ierr = MatGetVecs(A,NULL,&b);CHKERRQ(ierr); 959a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 9606bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 9616bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 96267877ebaSShri Abhyankar break; 96367877ebaSShri Abhyankar } 964a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 965a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 96667877ebaSShri Abhyankar 967719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 968dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 96951d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 97017f96c7aSHong Zhang F->ops->matsolve = 0; /* use MatMatSolve_Basic() until mumps supports distributed rhs */ 971b24902e0SBarry Smith PetscFunctionReturn(0); 972b24902e0SBarry Smith } 973b24902e0SBarry Smith 974450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 975450b117fSShri Abhyankar #undef __FUNCT__ 976450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 977450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 978450b117fSShri Abhyankar { 979a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 980dcd589f8SShri Abhyankar PetscErrorCode ierr; 98167877ebaSShri Abhyankar Vec b; 98267877ebaSShri Abhyankar IS is_iden; 98367877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 984450b117fSShri Abhyankar 985450b117fSShri Abhyankar PetscFunctionBegin; 986a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 987dcd589f8SShri Abhyankar 9889a2535b5SHong Zhang /* Set MUMPS options from the options database */ 9899a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 990dcd589f8SShri Abhyankar 991a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 99267877ebaSShri Abhyankar 99367877ebaSShri Abhyankar /* analysis phase */ 99467877ebaSShri Abhyankar /*----------------*/ 995a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 996a5e57a09SHong Zhang mumps->id.n = M; 997a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 99867877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 999a5e57a09SHong Zhang if (!mumps->myid) { 1000a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1001a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 100267877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 10032907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1004a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 10052907cef9SHong Zhang #else 1006a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 10072907cef9SHong Zhang #endif 100867877ebaSShri Abhyankar #else 1009a5e57a09SHong Zhang mumps->id.a = mumps->val; 101067877ebaSShri Abhyankar #endif 101167877ebaSShri Abhyankar } 101267877ebaSShri Abhyankar } 101367877ebaSShri Abhyankar break; 101467877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1015a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1016a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1017a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 101867877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 10192907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1020a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 10212907cef9SHong Zhang #else 1022a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 10232907cef9SHong Zhang #endif 102467877ebaSShri Abhyankar #else 1025a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 102667877ebaSShri Abhyankar #endif 102767877ebaSShri Abhyankar } 102867877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1029a5e57a09SHong Zhang if (!mumps->myid) { 1030a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 103167877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 103267877ebaSShri Abhyankar } else { 1033a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 103467877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 103567877ebaSShri Abhyankar } 1036c0dedaeaSBarry Smith ierr = MatGetVecs(A,NULL,&b);CHKERRQ(ierr); 1037a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 10386bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 10396bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 104067877ebaSShri Abhyankar break; 104167877ebaSShri Abhyankar } 1042a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1043a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 104467877ebaSShri Abhyankar 1045450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1046dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 104751d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1048450b117fSShri Abhyankar PetscFunctionReturn(0); 1049450b117fSShri Abhyankar } 1050b24902e0SBarry Smith 1051141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1052397b6df1SKris Buschelman #undef __FUNCT__ 105367877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 105467877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1055b24902e0SBarry Smith { 1056a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1057dcd589f8SShri Abhyankar PetscErrorCode ierr; 105867877ebaSShri Abhyankar Vec b; 105967877ebaSShri Abhyankar IS is_iden; 106067877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1061397b6df1SKris Buschelman 1062397b6df1SKris Buschelman PetscFunctionBegin; 1063a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1064dcd589f8SShri Abhyankar 10659a2535b5SHong Zhang /* Set MUMPS options from the options database */ 10669a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1067dcd589f8SShri Abhyankar 1068a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1069dcd589f8SShri Abhyankar 107067877ebaSShri Abhyankar /* analysis phase */ 107167877ebaSShri Abhyankar /*----------------*/ 1072a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1073a5e57a09SHong Zhang mumps->id.n = M; 1074a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 107567877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1076a5e57a09SHong Zhang if (!mumps->myid) { 1077a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1078a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 107967877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 10802907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1081a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 10822907cef9SHong Zhang #else 1083a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 10842907cef9SHong Zhang #endif 108567877ebaSShri Abhyankar #else 1086a5e57a09SHong Zhang mumps->id.a = mumps->val; 108767877ebaSShri Abhyankar #endif 108867877ebaSShri Abhyankar } 108967877ebaSShri Abhyankar } 109067877ebaSShri Abhyankar break; 109167877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1092a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1093a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1094a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 109567877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 10962907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1097a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 10982907cef9SHong Zhang #else 1099a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 11002907cef9SHong Zhang #endif 110167877ebaSShri Abhyankar #else 1102a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 110367877ebaSShri Abhyankar #endif 110467877ebaSShri Abhyankar } 110567877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1106a5e57a09SHong Zhang if (!mumps->myid) { 1107a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 110867877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 110967877ebaSShri Abhyankar } else { 1110a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 111167877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 111267877ebaSShri Abhyankar } 1113c0dedaeaSBarry Smith ierr = MatGetVecs(A,NULL,&b);CHKERRQ(ierr); 1114a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 11156bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 11166bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 111767877ebaSShri Abhyankar break; 111867877ebaSShri Abhyankar } 1119a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1120a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 112167877ebaSShri Abhyankar 11222792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1123dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 112451d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 112530c107b7SHong Zhang F->ops->matsolve = 0; /* use MatMatSolve_Basic() until mumps supports distributed rhs */ 1126db4efbfdSBarry Smith #if !defined(PETSC_USE_COMPLEX) 112705aa0992SJose Roman F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 112805aa0992SJose Roman #else 11290298fd71SBarry Smith F->ops->getinertia = NULL; 1130db4efbfdSBarry Smith #endif 1131b24902e0SBarry Smith PetscFunctionReturn(0); 1132b24902e0SBarry Smith } 1133b24902e0SBarry Smith 1134397b6df1SKris Buschelman #undef __FUNCT__ 113564e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 113664e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 113774ed9c26SBarry Smith { 1138f6c57405SHong Zhang PetscErrorCode ierr; 113964e6c443SBarry Smith PetscBool iascii; 114064e6c443SBarry Smith PetscViewerFormat format; 1141a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 1142f6c57405SHong Zhang 1143f6c57405SHong Zhang PetscFunctionBegin; 114464e6c443SBarry Smith /* check if matrix is mumps type */ 114564e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 114664e6c443SBarry Smith 1147251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 114864e6c443SBarry Smith if (iascii) { 114964e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 115064e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 115164e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1152a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1153a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1154a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1155a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1156a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1157a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1158a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 1159a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1160a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1161a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1162a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1163a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1164a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1165a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1166a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1167a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1168a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1169a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1170a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1171f6c57405SHong Zhang } 1172a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1173a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1174a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1175f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1176a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1177a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1178a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1179a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (somumpstion struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1180a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1181a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1182c0165424SHong Zhang 1183a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1184a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1185a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1186a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1187a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1188a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr); 118942179a6aSHong Zhang 1190a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1191a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1192a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1193f6c57405SHong Zhang 1194a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1195a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1196a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absomumpste pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1197a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (vamumpse of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1198a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1199f6c57405SHong Zhang 1200f6c57405SHong Zhang /* infomation local to each processor */ 120134ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 12027b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 1203a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 120434ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 120534ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1206a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 120734ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 120834ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1209a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 121034ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1211f6c57405SHong Zhang 121234ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1213a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 121434ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1215f6c57405SHong Zhang 121634ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1217a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 121834ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1219f6c57405SHong Zhang 122034ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1221a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 122234ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 12237b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr); 1224f6c57405SHong Zhang 1225a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1226a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 1227a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1228a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1229a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1230f6c57405SHong Zhang 1231a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1232a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1233a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1234a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1235a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1236a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1237a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1238a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr); 1239a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1240a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1241a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1242a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1243a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1244a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1245a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 1246a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1247a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr); 1248a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1249a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1250a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1251a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1252a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1253a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 1254f6c57405SHong Zhang } 1255f6c57405SHong Zhang } 1256cb828f0fSHong Zhang } 1257f6c57405SHong Zhang PetscFunctionReturn(0); 1258f6c57405SHong Zhang } 1259f6c57405SHong Zhang 126035bd34faSBarry Smith #undef __FUNCT__ 126135bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 126235bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 126335bd34faSBarry Smith { 1264cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 126535bd34faSBarry Smith 126635bd34faSBarry Smith PetscFunctionBegin; 126735bd34faSBarry Smith info->block_size = 1.0; 1268cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1269cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 127035bd34faSBarry Smith info->nz_unneeded = 0.0; 127135bd34faSBarry Smith info->assemblies = 0.0; 127235bd34faSBarry Smith info->mallocs = 0.0; 127335bd34faSBarry Smith info->memory = 0.0; 127435bd34faSBarry Smith info->fill_ratio_given = 0; 127535bd34faSBarry Smith info->fill_ratio_needed = 0; 127635bd34faSBarry Smith info->factor_mallocs = 0; 127735bd34faSBarry Smith PetscFunctionReturn(0); 127835bd34faSBarry Smith } 127935bd34faSBarry Smith 12805ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 12815ccb76cbSHong Zhang #undef __FUNCT__ 12825ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 12835ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 12845ccb76cbSHong Zhang { 1285a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 12865ccb76cbSHong Zhang 12875ccb76cbSHong Zhang PetscFunctionBegin; 1288a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 12895ccb76cbSHong Zhang PetscFunctionReturn(0); 12905ccb76cbSHong Zhang } 12915ccb76cbSHong Zhang 12925ccb76cbSHong Zhang #undef __FUNCT__ 12935ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 12945ccb76cbSHong Zhang /*@ 12955ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 12965ccb76cbSHong Zhang 12975ccb76cbSHong Zhang Logically Collective on Mat 12985ccb76cbSHong Zhang 12995ccb76cbSHong Zhang Input Parameters: 13005ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 13015ccb76cbSHong Zhang . icntl - index of MUMPS parameter array ICNTL() 13025ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 13035ccb76cbSHong Zhang 13045ccb76cbSHong Zhang Options Database: 13055ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 13065ccb76cbSHong Zhang 13075ccb76cbSHong Zhang Level: beginner 13085ccb76cbSHong Zhang 13095ccb76cbSHong Zhang References: MUMPS Users' Guide 13105ccb76cbSHong Zhang 13115ccb76cbSHong Zhang .seealso: MatGetFactor() 13125ccb76cbSHong Zhang @*/ 13135ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 13145ccb76cbSHong Zhang { 13155ccb76cbSHong Zhang PetscErrorCode ierr; 13165ccb76cbSHong Zhang 13175ccb76cbSHong Zhang PetscFunctionBegin; 13185ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 13195ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 13205ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 13215ccb76cbSHong Zhang PetscFunctionReturn(0); 13225ccb76cbSHong Zhang } 13235ccb76cbSHong Zhang 13248928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 13258928b65cSHong Zhang #undef __FUNCT__ 13268928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 13278928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 13288928b65cSHong Zhang { 13298928b65cSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 13308928b65cSHong Zhang 13318928b65cSHong Zhang PetscFunctionBegin; 13328928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 13338928b65cSHong Zhang PetscFunctionReturn(0); 13348928b65cSHong Zhang } 13358928b65cSHong Zhang 13368928b65cSHong Zhang #undef __FUNCT__ 13378928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 13388928b65cSHong Zhang /*@ 13398928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 13408928b65cSHong Zhang 13418928b65cSHong Zhang Logically Collective on Mat 13428928b65cSHong Zhang 13438928b65cSHong Zhang Input Parameters: 13448928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 13458928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 13468928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 13478928b65cSHong Zhang 13488928b65cSHong Zhang Options Database: 13498928b65cSHong Zhang . -mat_mumps_cntl_<icntl> <val> 13508928b65cSHong Zhang 13518928b65cSHong Zhang Level: beginner 13528928b65cSHong Zhang 13538928b65cSHong Zhang References: MUMPS Users' Guide 13548928b65cSHong Zhang 13558928b65cSHong Zhang .seealso: MatGetFactor() 13568928b65cSHong Zhang @*/ 13578928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 13588928b65cSHong Zhang { 13598928b65cSHong Zhang PetscErrorCode ierr; 13608928b65cSHong Zhang 13618928b65cSHong Zhang PetscFunctionBegin; 13628928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 13638928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,val,3); 13648928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 13658928b65cSHong Zhang PetscFunctionReturn(0); 13668928b65cSHong Zhang } 13678928b65cSHong Zhang 136824b6179bSKris Buschelman /*MC 13692692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 137024b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 137124b6179bSKris Buschelman 137241c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 137324b6179bSKris Buschelman 137424b6179bSKris Buschelman Options Database Keys: 1375fb8376fbSHong Zhang + -mat_mumps_icntl_4 <0,...,4> - print level 137624b6179bSKris Buschelman . -mat_mumps_icntl_6 <0,...,7> - matrix prescaling options (see MUMPS User's Guide) 137764e6c443SBarry Smith . -mat_mumps_icntl_7 <0,...,7> - matrix orderings (see MUMPS User's Guidec) 137824b6179bSKris Buschelman . -mat_mumps_icntl_9 <1,2> - A or A^T x=b to be solved: 1 denotes A, 2 denotes A^T 137924b6179bSKris Buschelman . -mat_mumps_icntl_10 <n> - maximum number of iterative refinements 138094b7f48cSBarry Smith . -mat_mumps_icntl_11 <n> - error analysis, a positive value returns statistics during -ksp_view 138124b6179bSKris Buschelman . -mat_mumps_icntl_12 <n> - efficiency control (see MUMPS User's Guide) 138224b6179bSKris Buschelman . -mat_mumps_icntl_13 <n> - efficiency control (see MUMPS User's Guide) 138324b6179bSKris Buschelman . -mat_mumps_icntl_14 <n> - efficiency control (see MUMPS User's Guide) 138424b6179bSKris Buschelman . -mat_mumps_icntl_15 <n> - efficiency control (see MUMPS User's Guide) 138524b6179bSKris Buschelman . -mat_mumps_cntl_1 <delta> - relative pivoting threshold 138624b6179bSKris Buschelman . -mat_mumps_cntl_2 <tol> - stopping criterion for refinement 138724b6179bSKris Buschelman - -mat_mumps_cntl_3 <adelta> - absolute pivoting threshold 138824b6179bSKris Buschelman 138924b6179bSKris Buschelman Level: beginner 139024b6179bSKris Buschelman 139141c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 139241c8de11SBarry Smith 139324b6179bSKris Buschelman M*/ 139424b6179bSKris Buschelman 139535bd34faSBarry Smith #undef __FUNCT__ 139635bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 1397f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 139835bd34faSBarry Smith { 139935bd34faSBarry Smith PetscFunctionBegin; 14002692d6eeSBarry Smith *type = MATSOLVERMUMPS; 140135bd34faSBarry Smith PetscFunctionReturn(0); 140235bd34faSBarry Smith } 140335bd34faSBarry Smith 1404bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 14052877fffaSHong Zhang #undef __FUNCT__ 1406bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 14078cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 14082877fffaSHong Zhang { 14092877fffaSHong Zhang Mat B; 14102877fffaSHong Zhang PetscErrorCode ierr; 14112877fffaSHong Zhang Mat_MUMPS *mumps; 1412ace3abfcSBarry Smith PetscBool isSeqAIJ; 14132877fffaSHong Zhang 14142877fffaSHong Zhang PetscFunctionBegin; 14152877fffaSHong Zhang /* Create the factorization matrix */ 1416251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 1417ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 14182877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 14192877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 1420bccb9932SShri Abhyankar if (isSeqAIJ) { 14210298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr); 1422bccb9932SShri Abhyankar } else { 14230298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr); 1424bccb9932SShri Abhyankar } 14252877fffaSHong Zhang 142616ebf90aSShri Abhyankar ierr = PetscNewLog(B,Mat_MUMPS,&mumps);CHKERRQ(ierr); 14272205254eSKarl Rupp 14282877fffaSHong Zhang B->ops->view = MatView_MUMPS; 142935bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 14302205254eSKarl Rupp 1431bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 1432bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 1433bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 1434450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 1435450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 1436d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 1437bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 1438bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 1439746480a1SHong Zhang mumps->sym = 0; 1440dcd589f8SShri Abhyankar } else { 144167877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 1442450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 1443bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 1444bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 14456fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 14466fdc2a6dSBarry Smith else mumps->sym = 2; 1447450b117fSShri Abhyankar } 14482877fffaSHong Zhang 14492877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 1450bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 14512877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 14522877fffaSHong Zhang B->spptr = (void*)mumps; 14532205254eSKarl Rupp 1454f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1455746480a1SHong Zhang 14562877fffaSHong Zhang *F = B; 14572877fffaSHong Zhang PetscFunctionReturn(0); 14582877fffaSHong Zhang } 14592877fffaSHong Zhang 1460bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 14612877fffaSHong Zhang #undef __FUNCT__ 1462bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 14638cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 14642877fffaSHong Zhang { 14652877fffaSHong Zhang Mat B; 14662877fffaSHong Zhang PetscErrorCode ierr; 14672877fffaSHong Zhang Mat_MUMPS *mumps; 1468ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 14692877fffaSHong Zhang 14702877fffaSHong Zhang PetscFunctionBegin; 1471ce94432eSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 1472ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 1473251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 14742877fffaSHong Zhang /* Create the factorization matrix */ 1475ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 14762877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 14772877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 147816ebf90aSShri Abhyankar ierr = PetscNewLog(B,Mat_MUMPS,&mumps);CHKERRQ(ierr); 1479bccb9932SShri Abhyankar if (isSeqSBAIJ) { 14800298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr); 14812205254eSKarl Rupp 148216ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 1483dcd589f8SShri Abhyankar } else { 14840298fd71SBarry Smith ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr); 14852205254eSKarl Rupp 1486bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 1487bccb9932SShri Abhyankar } 1488bccb9932SShri Abhyankar 148967877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 1490bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 14912205254eSKarl Rupp 1492bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 1493bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl);CHKERRQ(ierr); 1494bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl);CHKERRQ(ierr); 14952205254eSKarl Rupp 1496f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 14976fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 14986fdc2a6dSBarry Smith else mumps->sym = 2; 1499a214ac2aSShri Abhyankar 1500bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 1501bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 1502f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 15032877fffaSHong Zhang B->spptr = (void*)mumps; 15042205254eSKarl Rupp 1505f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1506746480a1SHong Zhang 15072877fffaSHong Zhang *F = B; 15082877fffaSHong Zhang PetscFunctionReturn(0); 15092877fffaSHong Zhang } 151097969023SHong Zhang 1511450b117fSShri Abhyankar #undef __FUNCT__ 1512bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 15138cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 151467877ebaSShri Abhyankar { 151567877ebaSShri Abhyankar Mat B; 151667877ebaSShri Abhyankar PetscErrorCode ierr; 151767877ebaSShri Abhyankar Mat_MUMPS *mumps; 1518ace3abfcSBarry Smith PetscBool isSeqBAIJ; 151967877ebaSShri Abhyankar 152067877ebaSShri Abhyankar PetscFunctionBegin; 152167877ebaSShri Abhyankar /* Create the factorization matrix */ 1522251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 1523ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 152467877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 152567877ebaSShri Abhyankar ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 1526bccb9932SShri Abhyankar if (isSeqBAIJ) { 15270298fd71SBarry Smith ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr); 1528bccb9932SShri Abhyankar } else { 15290298fd71SBarry Smith ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr); 1530bccb9932SShri Abhyankar } 1531450b117fSShri Abhyankar 153267877ebaSShri Abhyankar ierr = PetscNewLog(B,Mat_MUMPS,&mumps);CHKERRQ(ierr); 1533450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 1534450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 1535450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 1536bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 1537bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 1538746480a1SHong Zhang mumps->sym = 0; 1539f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 1540bccb9932SShri Abhyankar 1541450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 15422205254eSKarl Rupp 1543bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 1544bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 1545bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 1546450b117fSShri Abhyankar 1547450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 1548bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 1549450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 1550450b117fSShri Abhyankar B->spptr = (void*)mumps; 15512205254eSKarl Rupp 1552f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1553746480a1SHong Zhang 1554450b117fSShri Abhyankar *F = B; 1555450b117fSShri Abhyankar PetscFunctionReturn(0); 1556450b117fSShri Abhyankar } 1557a214ac2aSShri Abhyankar 1558