11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8397b6df1SKris Buschelman 9397b6df1SKris Buschelman EXTERN_C_BEGIN 10397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 112907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 122907cef9SHong Zhang #include <cmumps_c.h> 132907cef9SHong Zhang #else 14c6db04a5SJed Brown #include <zmumps_c.h> 152907cef9SHong Zhang #endif 162907cef9SHong Zhang #else 172907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 182907cef9SHong Zhang #include <smumps_c.h> 19397b6df1SKris Buschelman #else 20c6db04a5SJed Brown #include <dmumps_c.h> 21397b6df1SKris Buschelman #endif 222907cef9SHong Zhang #endif 23397b6df1SKris Buschelman EXTERN_C_END 24397b6df1SKris Buschelman #define JOB_INIT -1 253d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 263d472b54SHong Zhang #define JOB_FACTNUMERIC 2 273d472b54SHong Zhang #define JOB_SOLVE 3 28397b6df1SKris Buschelman #define JOB_END -2 293d472b54SHong Zhang 302907cef9SHong Zhang /* calls to MUMPS */ 312907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 322907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 332907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 342907cef9SHong Zhang #else 352907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 362907cef9SHong Zhang #endif 372907cef9SHong Zhang #else 382907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 392907cef9SHong Zhang #define PetscMUMPS_c smumps_c 402907cef9SHong Zhang #else 412907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 422907cef9SHong Zhang #endif 432907cef9SHong Zhang #endif 442907cef9SHong Zhang 453d472b54SHong Zhang 46397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 47397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 48397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 49397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 50a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 51397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 52adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 53397b6df1SKris Buschelman 54397b6df1SKris Buschelman typedef struct { 55397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 562907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 572907cef9SHong Zhang CMUMPS_STRUC_C id; 582907cef9SHong Zhang #else 59397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 602907cef9SHong Zhang #endif 612907cef9SHong Zhang #else 622907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 632907cef9SHong Zhang SMUMPS_STRUC_C id; 64397b6df1SKris Buschelman #else 65397b6df1SKris Buschelman DMUMPS_STRUC_C id; 66397b6df1SKris Buschelman #endif 672907cef9SHong Zhang #endif 682907cef9SHong Zhang 69397b6df1SKris Buschelman MatStructure matstruc; 70c1490034SHong Zhang PetscMPIInt myid,size; 71a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 72397b6df1SKris Buschelman PetscScalar *val; 73397b6df1SKris Buschelman MPI_Comm comm_mumps; 7464e6c443SBarry Smith PetscBool isAIJ,CleanUpMUMPS; 75a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 76*801fbe65SHong Zhang VecScatter scat_rhs, scat_sol; /* used by MatSolve() */ 77*801fbe65SHong Zhang Vec b_seq,x_seq; 78*801fbe65SHong Zhang VecScatter scat_rhss, scat_sols; /* used by MatMatSolve() */ 79*801fbe65SHong Zhang Vec bb_mpi,bb_seq,xx_mpi; 802205254eSKarl Rupp 81bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 82bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 83f0c56d0fSKris Buschelman } Mat_MUMPS; 84f0c56d0fSKris Buschelman 8509573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 86b24902e0SBarry Smith 87397b6df1SKris Buschelman /* 88d341cd04SHong Zhang MatConvertToTriples_A_B - convert Petsc matrix to triples: row[nz], col[nz], val[nz] 89d341cd04SHong Zhang 90397b6df1SKris Buschelman input: 9167877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 92397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 93bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 94bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 95397b6df1SKris Buschelman output: 96397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 97397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 98eb9baa12SBarry Smith 99eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 100eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 101eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 102eb9baa12SBarry Smith 103397b6df1SKris Buschelman */ 10416ebf90aSShri Abhyankar 10516ebf90aSShri Abhyankar #undef __FUNCT__ 10616ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 107bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 108b24902e0SBarry Smith { 109185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 11067877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 111dfbe8321SBarry Smith PetscErrorCode ierr; 112c1490034SHong Zhang PetscInt *row,*col; 11316ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 114397b6df1SKris Buschelman 115397b6df1SKris Buschelman PetscFunctionBegin; 11616ebf90aSShri Abhyankar *v=aa->a; 117bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 1182205254eSKarl Rupp nz = aa->nz; 1192205254eSKarl Rupp ai = aa->i; 1202205254eSKarl Rupp aj = aa->j; 12116ebf90aSShri Abhyankar *nnz = nz; 122785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 123185f6596SHong Zhang col = row + nz; 124185f6596SHong Zhang 12516ebf90aSShri Abhyankar nz = 0; 12616ebf90aSShri Abhyankar for (i=0; i<M; i++) { 12716ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 12867877ebaSShri Abhyankar ajj = aj + ai[i]; 12967877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 13067877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 13116ebf90aSShri Abhyankar } 13216ebf90aSShri Abhyankar } 13316ebf90aSShri Abhyankar *r = row; *c = col; 13416ebf90aSShri Abhyankar } 13516ebf90aSShri Abhyankar PetscFunctionReturn(0); 13616ebf90aSShri Abhyankar } 137397b6df1SKris Buschelman 13816ebf90aSShri Abhyankar #undef __FUNCT__ 13967877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 140bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 14167877ebaSShri Abhyankar { 14267877ebaSShri Abhyankar Mat_SeqBAIJ *aa=(Mat_SeqBAIJ*)A->data; 14333d57670SJed Brown const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2; 14433d57670SJed Brown PetscInt bs,M,nz,idx=0,rnz,i,j,k,m; 14567877ebaSShri Abhyankar PetscErrorCode ierr; 14667877ebaSShri Abhyankar PetscInt *row,*col; 14767877ebaSShri Abhyankar 14867877ebaSShri Abhyankar PetscFunctionBegin; 14933d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 15033d57670SJed Brown M = A->rmap->N/bs; 151cf3759fdSShri Abhyankar *v = aa->a; 152bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 153cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 15467877ebaSShri Abhyankar nz = bs2*aa->nz; 15567877ebaSShri Abhyankar *nnz = nz; 156785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 157185f6596SHong Zhang col = row + nz; 158185f6596SHong Zhang 15967877ebaSShri Abhyankar for (i=0; i<M; i++) { 16067877ebaSShri Abhyankar ajj = aj + ai[i]; 16167877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 16267877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 16367877ebaSShri Abhyankar for (j=0; j<bs; j++) { 16467877ebaSShri Abhyankar for (m=0; m<bs; m++) { 16567877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 166cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 16767877ebaSShri Abhyankar } 16867877ebaSShri Abhyankar } 16967877ebaSShri Abhyankar } 17067877ebaSShri Abhyankar } 171cf3759fdSShri Abhyankar *r = row; *c = col; 17267877ebaSShri Abhyankar } 17367877ebaSShri Abhyankar PetscFunctionReturn(0); 17467877ebaSShri Abhyankar } 17567877ebaSShri Abhyankar 17667877ebaSShri Abhyankar #undef __FUNCT__ 17716ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 178bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 17916ebf90aSShri Abhyankar { 18067877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 18167877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 18216ebf90aSShri Abhyankar PetscErrorCode ierr; 18316ebf90aSShri Abhyankar PetscInt *row,*col; 18416ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 18516ebf90aSShri Abhyankar 18616ebf90aSShri Abhyankar PetscFunctionBegin; 187882afa5aSHong Zhang *v = aa->a; 188bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 1892205254eSKarl Rupp nz = aa->nz; 1902205254eSKarl Rupp ai = aa->i; 1912205254eSKarl Rupp aj = aa->j; 1922205254eSKarl Rupp *v = aa->a; 19316ebf90aSShri Abhyankar *nnz = nz; 194785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 195185f6596SHong Zhang col = row + nz; 196185f6596SHong Zhang 19716ebf90aSShri Abhyankar nz = 0; 19816ebf90aSShri Abhyankar for (i=0; i<M; i++) { 19916ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 20067877ebaSShri Abhyankar ajj = aj + ai[i]; 20167877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 20267877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 20316ebf90aSShri Abhyankar } 20416ebf90aSShri Abhyankar } 20516ebf90aSShri Abhyankar *r = row; *c = col; 20616ebf90aSShri Abhyankar } 20716ebf90aSShri Abhyankar PetscFunctionReturn(0); 20816ebf90aSShri Abhyankar } 20916ebf90aSShri Abhyankar 21016ebf90aSShri Abhyankar #undef __FUNCT__ 21116ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 212bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 21316ebf90aSShri Abhyankar { 21467877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 21567877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 21667877ebaSShri Abhyankar const PetscScalar *av,*v1; 21716ebf90aSShri Abhyankar PetscScalar *val; 21816ebf90aSShri Abhyankar PetscErrorCode ierr; 21916ebf90aSShri Abhyankar PetscInt *row,*col; 220829b1710SHong Zhang Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 22116ebf90aSShri Abhyankar 22216ebf90aSShri Abhyankar PetscFunctionBegin; 22316ebf90aSShri Abhyankar ai =aa->i; aj=aa->j;av=aa->a; 22416ebf90aSShri Abhyankar adiag=aa->diag; 225bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 226829b1710SHong Zhang /* count nz in the uppper triangular part of A */ 227829b1710SHong Zhang nz = 0; 228829b1710SHong Zhang for (i=0; i<M; i++) nz += ai[i+1] - adiag[i]; 22916ebf90aSShri Abhyankar *nnz = nz; 230829b1710SHong Zhang 231185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 232185f6596SHong Zhang col = row + nz; 233185f6596SHong Zhang val = (PetscScalar*)(col + nz); 234185f6596SHong Zhang 23516ebf90aSShri Abhyankar nz = 0; 23616ebf90aSShri Abhyankar for (i=0; i<M; i++) { 23716ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 23867877ebaSShri Abhyankar ajj = aj + adiag[i]; 239cf3759fdSShri Abhyankar v1 = av + adiag[i]; 24067877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 24167877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 24216ebf90aSShri Abhyankar } 24316ebf90aSShri Abhyankar } 24416ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 245397b6df1SKris Buschelman } else { 24616ebf90aSShri Abhyankar nz = 0; val = *v; 24716ebf90aSShri Abhyankar for (i=0; i <M; i++) { 24816ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 24967877ebaSShri Abhyankar ajj = aj + adiag[i]; 25067877ebaSShri Abhyankar v1 = av + adiag[i]; 25167877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 25267877ebaSShri Abhyankar val[nz++] = v1[j]; 25316ebf90aSShri Abhyankar } 25416ebf90aSShri Abhyankar } 25516ebf90aSShri Abhyankar } 25616ebf90aSShri Abhyankar PetscFunctionReturn(0); 25716ebf90aSShri Abhyankar } 25816ebf90aSShri Abhyankar 25916ebf90aSShri Abhyankar #undef __FUNCT__ 26016ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 261bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 26216ebf90aSShri Abhyankar { 26316ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 26416ebf90aSShri Abhyankar PetscErrorCode ierr; 26516ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 26616ebf90aSShri Abhyankar PetscInt *row,*col; 26716ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 26816ebf90aSShri Abhyankar PetscScalar *val; 269397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 270397b6df1SKris Buschelman Mat_SeqSBAIJ *aa = (Mat_SeqSBAIJ*)(mat->A)->data; 271397b6df1SKris Buschelman Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 27216ebf90aSShri Abhyankar 27316ebf90aSShri Abhyankar PetscFunctionBegin; 274d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 275397b6df1SKris Buschelman av=aa->a; bv=bb->a; 276397b6df1SKris Buschelman 2772205254eSKarl Rupp garray = mat->garray; 2782205254eSKarl Rupp 279bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 28016ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 28116ebf90aSShri Abhyankar *nnz = nz; 282185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 283185f6596SHong Zhang col = row + nz; 284185f6596SHong Zhang val = (PetscScalar*)(col + nz); 285185f6596SHong Zhang 286397b6df1SKris Buschelman *r = row; *c = col; *v = val; 287397b6df1SKris Buschelman } else { 288397b6df1SKris Buschelman row = *r; col = *c; val = *v; 289397b6df1SKris Buschelman } 290397b6df1SKris Buschelman 291028e57e8SHong Zhang jj = 0; irow = rstart; 292397b6df1SKris Buschelman for (i=0; i<m; i++) { 293397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 294397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 295397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 296397b6df1SKris Buschelman bjj = bj + bi[i]; 29716ebf90aSShri Abhyankar v1 = av + ai[i]; 29816ebf90aSShri Abhyankar v2 = bv + bi[i]; 299397b6df1SKris Buschelman 300397b6df1SKris Buschelman /* A-part */ 301397b6df1SKris Buschelman for (j=0; j<countA; j++) { 302bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 303397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 304397b6df1SKris Buschelman } 30516ebf90aSShri Abhyankar val[jj++] = v1[j]; 306397b6df1SKris Buschelman } 30716ebf90aSShri Abhyankar 30816ebf90aSShri Abhyankar /* B-part */ 30916ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 310bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 311397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 312397b6df1SKris Buschelman } 31316ebf90aSShri Abhyankar val[jj++] = v2[j]; 31416ebf90aSShri Abhyankar } 31516ebf90aSShri Abhyankar irow++; 31616ebf90aSShri Abhyankar } 31716ebf90aSShri Abhyankar PetscFunctionReturn(0); 31816ebf90aSShri Abhyankar } 31916ebf90aSShri Abhyankar 32016ebf90aSShri Abhyankar #undef __FUNCT__ 32116ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 322bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 32316ebf90aSShri Abhyankar { 32416ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 32516ebf90aSShri Abhyankar PetscErrorCode ierr; 32616ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 32716ebf90aSShri Abhyankar PetscInt *row,*col; 32816ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 32916ebf90aSShri Abhyankar PetscScalar *val; 33016ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 33116ebf90aSShri Abhyankar Mat_SeqAIJ *aa = (Mat_SeqAIJ*)(mat->A)->data; 33216ebf90aSShri Abhyankar Mat_SeqAIJ *bb = (Mat_SeqAIJ*)(mat->B)->data; 33316ebf90aSShri Abhyankar 33416ebf90aSShri Abhyankar PetscFunctionBegin; 33516ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 33616ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 33716ebf90aSShri Abhyankar 3382205254eSKarl Rupp garray = mat->garray; 3392205254eSKarl Rupp 340bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 34116ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 34216ebf90aSShri Abhyankar *nnz = nz; 343185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 344185f6596SHong Zhang col = row + nz; 345185f6596SHong Zhang val = (PetscScalar*)(col + nz); 346185f6596SHong Zhang 34716ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 34816ebf90aSShri Abhyankar } else { 34916ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 35016ebf90aSShri Abhyankar } 35116ebf90aSShri Abhyankar 35216ebf90aSShri Abhyankar jj = 0; irow = rstart; 35316ebf90aSShri Abhyankar for (i=0; i<m; i++) { 35416ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 35516ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 35616ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 35716ebf90aSShri Abhyankar bjj = bj + bi[i]; 35816ebf90aSShri Abhyankar v1 = av + ai[i]; 35916ebf90aSShri Abhyankar v2 = bv + bi[i]; 36016ebf90aSShri Abhyankar 36116ebf90aSShri Abhyankar /* A-part */ 36216ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 363bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 36416ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 36516ebf90aSShri Abhyankar } 36616ebf90aSShri Abhyankar val[jj++] = v1[j]; 36716ebf90aSShri Abhyankar } 36816ebf90aSShri Abhyankar 36916ebf90aSShri Abhyankar /* B-part */ 37016ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 371bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 37216ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 37316ebf90aSShri Abhyankar } 37416ebf90aSShri Abhyankar val[jj++] = v2[j]; 37516ebf90aSShri Abhyankar } 37616ebf90aSShri Abhyankar irow++; 37716ebf90aSShri Abhyankar } 37816ebf90aSShri Abhyankar PetscFunctionReturn(0); 37916ebf90aSShri Abhyankar } 38016ebf90aSShri Abhyankar 38116ebf90aSShri Abhyankar #undef __FUNCT__ 38267877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij" 383bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 38467877ebaSShri Abhyankar { 38567877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 38667877ebaSShri Abhyankar Mat_SeqBAIJ *aa = (Mat_SeqBAIJ*)(mat->A)->data; 38767877ebaSShri Abhyankar Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 38867877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 389d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 39033d57670SJed Brown const PetscInt bs2=mat->bs2; 39167877ebaSShri Abhyankar PetscErrorCode ierr; 39233d57670SJed Brown PetscInt bs,nz,i,j,k,n,jj,irow,countA,countB,idx; 39367877ebaSShri Abhyankar PetscInt *row,*col; 39467877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 39567877ebaSShri Abhyankar PetscScalar *val; 39667877ebaSShri Abhyankar 39767877ebaSShri Abhyankar PetscFunctionBegin; 39833d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 399bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 40067877ebaSShri Abhyankar nz = bs2*(aa->nz + bb->nz); 40167877ebaSShri Abhyankar *nnz = nz; 402185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 403185f6596SHong Zhang col = row + nz; 404185f6596SHong Zhang val = (PetscScalar*)(col + nz); 405185f6596SHong Zhang 40667877ebaSShri Abhyankar *r = row; *c = col; *v = val; 40767877ebaSShri Abhyankar } else { 40867877ebaSShri Abhyankar row = *r; col = *c; val = *v; 40967877ebaSShri Abhyankar } 41067877ebaSShri Abhyankar 411d985c460SShri Abhyankar jj = 0; irow = rstart; 41267877ebaSShri Abhyankar for (i=0; i<mbs; i++) { 41367877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 41467877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 41567877ebaSShri Abhyankar ajj = aj + ai[i]; 41667877ebaSShri Abhyankar bjj = bj + bi[i]; 41767877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 41867877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 41967877ebaSShri Abhyankar 42067877ebaSShri Abhyankar idx = 0; 42167877ebaSShri Abhyankar /* A-part */ 42267877ebaSShri Abhyankar for (k=0; k<countA; k++) { 42367877ebaSShri Abhyankar for (j=0; j<bs; j++) { 42467877ebaSShri Abhyankar for (n=0; n<bs; n++) { 425bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 426d985c460SShri Abhyankar row[jj] = irow + n + shift; 427d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 42867877ebaSShri Abhyankar } 42967877ebaSShri Abhyankar val[jj++] = v1[idx++]; 43067877ebaSShri Abhyankar } 43167877ebaSShri Abhyankar } 43267877ebaSShri Abhyankar } 43367877ebaSShri Abhyankar 43467877ebaSShri Abhyankar idx = 0; 43567877ebaSShri Abhyankar /* B-part */ 43667877ebaSShri Abhyankar for (k=0; k<countB; k++) { 43767877ebaSShri Abhyankar for (j=0; j<bs; j++) { 43867877ebaSShri Abhyankar for (n=0; n<bs; n++) { 439bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 440d985c460SShri Abhyankar row[jj] = irow + n + shift; 441d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 44267877ebaSShri Abhyankar } 443d985c460SShri Abhyankar val[jj++] = v2[idx++]; 44467877ebaSShri Abhyankar } 44567877ebaSShri Abhyankar } 44667877ebaSShri Abhyankar } 447d985c460SShri Abhyankar irow += bs; 44867877ebaSShri Abhyankar } 44967877ebaSShri Abhyankar PetscFunctionReturn(0); 45067877ebaSShri Abhyankar } 45167877ebaSShri Abhyankar 45267877ebaSShri Abhyankar #undef __FUNCT__ 45316ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 454bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 45516ebf90aSShri Abhyankar { 45616ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 45716ebf90aSShri Abhyankar PetscErrorCode ierr; 458e0bace9bSHong Zhang PetscInt rstart,nz,nza,nzb,i,j,jj,irow,countA,countB; 45916ebf90aSShri Abhyankar PetscInt *row,*col; 46016ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 46116ebf90aSShri Abhyankar PetscScalar *val; 46216ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 46316ebf90aSShri Abhyankar Mat_SeqAIJ *aa =(Mat_SeqAIJ*)(mat->A)->data; 46416ebf90aSShri Abhyankar Mat_SeqAIJ *bb =(Mat_SeqAIJ*)(mat->B)->data; 46516ebf90aSShri Abhyankar 46616ebf90aSShri Abhyankar PetscFunctionBegin; 46716ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 46816ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 46916ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 4702205254eSKarl Rupp 47116ebf90aSShri Abhyankar rstart = A->rmap->rstart; 47216ebf90aSShri Abhyankar 473bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 474e0bace9bSHong Zhang nza = 0; /* num of upper triangular entries in mat->A, including diagonals */ 475e0bace9bSHong Zhang nzb = 0; /* num of upper triangular entries in mat->B */ 47616ebf90aSShri Abhyankar for (i=0; i<m; i++) { 477e0bace9bSHong Zhang nza += (ai[i+1] - adiag[i]); 47816ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 47916ebf90aSShri Abhyankar bjj = bj + bi[i]; 480e0bace9bSHong Zhang for (j=0; j<countB; j++) { 481e0bace9bSHong Zhang if (garray[bjj[j]] > rstart) nzb++; 482e0bace9bSHong Zhang } 483e0bace9bSHong Zhang } 48416ebf90aSShri Abhyankar 485e0bace9bSHong Zhang nz = nza + nzb; /* total nz of upper triangular part of mat */ 48616ebf90aSShri Abhyankar *nnz = nz; 487185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 488185f6596SHong Zhang col = row + nz; 489185f6596SHong Zhang val = (PetscScalar*)(col + nz); 490185f6596SHong Zhang 49116ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 49216ebf90aSShri Abhyankar } else { 49316ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 49416ebf90aSShri Abhyankar } 49516ebf90aSShri Abhyankar 49616ebf90aSShri Abhyankar jj = 0; irow = rstart; 49716ebf90aSShri Abhyankar for (i=0; i<m; i++) { 49816ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 49916ebf90aSShri Abhyankar v1 = av + adiag[i]; 50016ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 50116ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 50216ebf90aSShri Abhyankar bjj = bj + bi[i]; 50316ebf90aSShri Abhyankar v2 = bv + bi[i]; 50416ebf90aSShri Abhyankar 50516ebf90aSShri Abhyankar /* A-part */ 50616ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 507bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 50816ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 50916ebf90aSShri Abhyankar } 51016ebf90aSShri Abhyankar val[jj++] = v1[j]; 51116ebf90aSShri Abhyankar } 51216ebf90aSShri Abhyankar 51316ebf90aSShri Abhyankar /* B-part */ 51416ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 51516ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 516bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 51716ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 51816ebf90aSShri Abhyankar } 51916ebf90aSShri Abhyankar val[jj++] = v2[j]; 52016ebf90aSShri Abhyankar } 521397b6df1SKris Buschelman } 522397b6df1SKris Buschelman irow++; 523397b6df1SKris Buschelman } 524397b6df1SKris Buschelman PetscFunctionReturn(0); 525397b6df1SKris Buschelman } 526397b6df1SKris Buschelman 527397b6df1SKris Buschelman #undef __FUNCT__ 52820be8e61SHong Zhang #define __FUNCT__ "MatGetDiagonal_MUMPS" 52920be8e61SHong Zhang PetscErrorCode MatGetDiagonal_MUMPS(Mat A,Vec v) 53020be8e61SHong Zhang { 53120be8e61SHong Zhang PetscFunctionBegin; 53220be8e61SHong Zhang SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Mat type: MUMPS factor"); 53320be8e61SHong Zhang PetscFunctionReturn(0); 53420be8e61SHong Zhang } 53520be8e61SHong Zhang 53620be8e61SHong Zhang #undef __FUNCT__ 5373924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 538dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A) 539dfbe8321SBarry Smith { 540a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 541dfbe8321SBarry Smith PetscErrorCode ierr; 542b24902e0SBarry Smith 543397b6df1SKris Buschelman PetscFunctionBegin; 544a5e57a09SHong Zhang if (mumps->CleanUpMUMPS) { 545397b6df1SKris Buschelman /* Terminate instance, deallocate memories */ 546a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 547a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr); 548a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 549*801fbe65SHong Zhang ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr); 550a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 551a5e57a09SHong Zhang ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr); 552a5e57a09SHong Zhang ierr = PetscFree(mumps->irn);CHKERRQ(ierr); 5532205254eSKarl Rupp 554*801fbe65SHong Zhang /* created in MatMatSolve_MUMPS() */ 555*801fbe65SHong Zhang if (mumps->scat_rhss) { 556*801fbe65SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhss);CHKERRQ(ierr); 557*801fbe65SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sols);CHKERRQ(ierr); 558*801fbe65SHong Zhang ierr = VecDestroy(&mumps->bb_seq);CHKERRQ(ierr); 559*801fbe65SHong Zhang ierr = VecDestroy(&mumps->bb_mpi);CHKERRQ(ierr); 560*801fbe65SHong Zhang ierr = VecDestroy(&mumps->xx_mpi);CHKERRQ(ierr); 561*801fbe65SHong Zhang } 562*801fbe65SHong Zhang 563a5e57a09SHong Zhang mumps->id.job = JOB_END; 564a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 565a5e57a09SHong Zhang ierr = MPI_Comm_free(&(mumps->comm_mumps));CHKERRQ(ierr); 566397b6df1SKris Buschelman } 567a5e57a09SHong Zhang if (mumps->Destroy) { 568a5e57a09SHong Zhang ierr = (mumps->Destroy)(A);CHKERRQ(ierr); 569bf0cc555SLisandro Dalcin } 570bf0cc555SLisandro Dalcin ierr = PetscFree(A->spptr);CHKERRQ(ierr); 571bf0cc555SLisandro Dalcin 57297969023SHong Zhang /* clear composed functions */ 573bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr); 574bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr); 575bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetIcntl_C",NULL);CHKERRQ(ierr); 576bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr); 577bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetCntl_C",NULL);CHKERRQ(ierr); 578bc6112feSHong Zhang 579ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfo_C",NULL);CHKERRQ(ierr); 580ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfog_C",NULL);CHKERRQ(ierr); 581ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfo_C",NULL);CHKERRQ(ierr); 582ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfog_C",NULL);CHKERRQ(ierr); 583397b6df1SKris Buschelman PetscFunctionReturn(0); 584397b6df1SKris Buschelman } 585397b6df1SKris Buschelman 586397b6df1SKris Buschelman #undef __FUNCT__ 587f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 588b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 589b24902e0SBarry Smith { 590a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 591d54de34fSKris Buschelman PetscScalar *array; 59267877ebaSShri Abhyankar Vec b_seq; 593329ec9b3SHong Zhang IS is_iden,is_petsc; 594dfbe8321SBarry Smith PetscErrorCode ierr; 595329ec9b3SHong Zhang PetscInt i; 596883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 597397b6df1SKris Buschelman 598397b6df1SKris Buschelman PetscFunctionBegin; 599883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 600883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 601a5e57a09SHong Zhang mumps->id.nrhs = 1; 602a5e57a09SHong Zhang b_seq = mumps->b_seq; 603a5e57a09SHong Zhang if (mumps->size > 1) { 604329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */ 605a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 606a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 607a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 608397b6df1SKris Buschelman } else { /* size == 1 */ 609397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 610397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 611397b6df1SKris Buschelman } 612a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 613a5e57a09SHong Zhang mumps->id.nrhs = 1; 614397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 6152907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 616a5e57a09SHong Zhang mumps->id.rhs = (mumps_complex*)array; 6172907cef9SHong Zhang #else 618a5e57a09SHong Zhang mumps->id.rhs = (mumps_double_complex*)array; 6192907cef9SHong Zhang #endif 620397b6df1SKris Buschelman #else 621a5e57a09SHong Zhang mumps->id.rhs = array; 622397b6df1SKris Buschelman #endif 623397b6df1SKris Buschelman } 624397b6df1SKris Buschelman 625397b6df1SKris Buschelman /* solve phase */ 626329ec9b3SHong Zhang /*-------------*/ 627a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 628a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 629a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 630397b6df1SKris Buschelman 631a5e57a09SHong Zhang if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 632a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 633a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 634a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 635397b6df1SKris Buschelman } 636a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 637a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 638a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 639a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 640a5e57a09SHong Zhang } 641a5e57a09SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 642a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 6436bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 6446bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 6452205254eSKarl Rupp 646a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 647397b6df1SKris Buschelman } 648a5e57a09SHong Zhang 649a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 650a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 651329ec9b3SHong Zhang } 652397b6df1SKris Buschelman PetscFunctionReturn(0); 653397b6df1SKris Buschelman } 654397b6df1SKris Buschelman 65551d5961aSHong Zhang #undef __FUNCT__ 65651d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 65751d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 65851d5961aSHong Zhang { 659a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 66051d5961aSHong Zhang PetscErrorCode ierr; 66151d5961aSHong Zhang 66251d5961aSHong Zhang PetscFunctionBegin; 663a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 6640ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 665a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 66651d5961aSHong Zhang PetscFunctionReturn(0); 66751d5961aSHong Zhang } 66851d5961aSHong Zhang 669e0b74bf9SHong Zhang #undef __FUNCT__ 670e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 671e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 672e0b74bf9SHong Zhang { 673bda8bf91SBarry Smith PetscErrorCode ierr; 674bda8bf91SBarry Smith PetscBool flg; 6754e34a73bSHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 676*801fbe65SHong Zhang PetscInt i,nrhs,m,M,mx; 6772cd7d884SHong Zhang PetscScalar *array,*bray; 678bda8bf91SBarry Smith 679e0b74bf9SHong Zhang PetscFunctionBegin; 6800298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 681*801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 6820298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 683*801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)X),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 684*801fbe65SHong Zhang if (B->rmap->n != X->rmap->n) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B and X must have same row distribution"); 6854e34a73bSHong Zhang 6862cd7d884SHong Zhang ierr = MatGetLocalSize(B,&m,NULL);CHKERRQ(ierr); 6872cd7d884SHong Zhang ierr = MatGetSize(B,&M,&nrhs);CHKERRQ(ierr); 6884e34a73bSHong Zhang 6892cd7d884SHong Zhang if (mumps->size == 1) { 6902cd7d884SHong Zhang /* copy B to X */ 6912cd7d884SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 6922cd7d884SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 6932cd7d884SHong Zhang for (i=0; i<M*nrhs; i++) array[i] = bray[i]; 6942cd7d884SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 6952cd7d884SHong Zhang 6962cd7d884SHong Zhang mumps->id.nrhs = nrhs; 6972cd7d884SHong Zhang mumps->id.lrhs = M; 6982cd7d884SHong Zhang #if defined(PETSC_USE_COMPLEX) 6992cd7d884SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 7002cd7d884SHong Zhang mumps->id.rhs = (mumps_complex*)array; 7012cd7d884SHong Zhang #else 7022cd7d884SHong Zhang mumps->id.rhs = (mumps_double_complex*)array; 7032cd7d884SHong Zhang #endif 7042cd7d884SHong Zhang #else 7052cd7d884SHong Zhang mumps->id.rhs = array; 7062cd7d884SHong Zhang #endif 707*801fbe65SHong Zhang 7082cd7d884SHong Zhang /* solve phase */ 7092cd7d884SHong Zhang /*-------------*/ 7102cd7d884SHong Zhang mumps->id.job = JOB_SOLVE; 7112cd7d884SHong Zhang PetscMUMPS_c(&mumps->id); 7122cd7d884SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 7132cd7d884SHong Zhang 7142cd7d884SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 715*801fbe65SHong Zhang } else { /************** parallel case ***************/ 716*801fbe65SHong Zhang PetscInt lsol_loc,*isol_loc,*isol_loc_save,*idx,*iidx,*idxx; 717*801fbe65SHong Zhang PetscScalar *sol_loc,*sol_loc_save; 718*801fbe65SHong Zhang IS is_to,is_from; 719*801fbe65SHong Zhang PetscInt k,proc,j; 720*801fbe65SHong Zhang const PetscInt *rstart; 721*801fbe65SHong Zhang 722*801fbe65SHong Zhang /* create x_seq to hold local solution */ 723*801fbe65SHong Zhang lsol_loc = nrhs*mumps->id.INFO(23); /* length of sol_loc */ 724*801fbe65SHong Zhang 725*801fbe65SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); //save it for MatSovle()!!! 726*801fbe65SHong Zhang sol_loc_save = mumps->id.sol_loc; /* these arrays were allocated for MatSolve_MUMPS() */ 727*801fbe65SHong Zhang isol_loc_save = mumps->id.isol_loc; 728*801fbe65SHong Zhang 729*801fbe65SHong Zhang ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&isol_loc);CHKERRQ(ierr); 730*801fbe65SHong Zhang #if defined(PETSC_USE_COMPLEX) 731*801fbe65SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 732*801fbe65SHong Zhang mumps->id.sol_loc = (mumps_complex*)sol_loc; 733*801fbe65SHong Zhang #else 734*801fbe65SHong Zhang mumps->id.sol_loc = (mumps_double_complex*)sol_loc; 735*801fbe65SHong Zhang #endif 736*801fbe65SHong Zhang #else 737*801fbe65SHong Zhang mumps->id.sol_loc = sol_loc; 738*801fbe65SHong Zhang #endif 739*801fbe65SHong Zhang mumps->id.isol_loc = isol_loc; 740*801fbe65SHong Zhang 741*801fbe65SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 742*801fbe65SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 7432cd7d884SHong Zhang 7442cd7d884SHong Zhang /* copy rhs matrix B into vector bb_mpi */ 7452cd7d884SHong Zhang if (mumps->bb_mpi) { 7462cd7d884SHong Zhang ierr = VecDestroy(&mumps->bb_mpi);CHKERRQ(ierr); 7472cd7d884SHong Zhang ierr = VecDestroy(&mumps->bb_seq);CHKERRQ(ierr); 748*801fbe65SHong Zhang ierr = VecDestroy(&mumps->xx_mpi);CHKERRQ(ierr); 749*801fbe65SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhss);CHKERRQ(ierr); 750*801fbe65SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sols);CHKERRQ(ierr); 7512cd7d884SHong Zhang } 752*801fbe65SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 753*801fbe65SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)B),1,nrhs*m,nrhs*M,(const PetscScalar*)bray,&mumps->bb_mpi);CHKERRQ(ierr); 754*801fbe65SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 755*801fbe65SHong Zhang 756*801fbe65SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 757*801fbe65SHong Zhang ierr = MatGetLocalSize(B,&mx,NULL);CHKERRQ(ierr); 758*801fbe65SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)X),1,nrhs*mx,nrhs*M,(const PetscScalar*)array,&mumps->xx_mpi);CHKERRQ(ierr); 7592cd7d884SHong Zhang 7602cd7d884SHong Zhang /* scatter bb_mpi to bb_seq because MUMPS only supports centralized rhs */ 761*801fbe65SHong Zhang /* idx: maps from k-th index of bb_mpi to (i,j)-th global entry of B; 762*801fbe65SHong Zhang iidx: inverse of idx, will be used by scattering xx_seq -> X */ 763*801fbe65SHong Zhang ierr = PetscMalloc2(nrhs*M,&idx,nrhs*M,&iidx);CHKERRQ(ierr); 764*801fbe65SHong Zhang ierr = MatGetOwnershipRanges(B,&rstart);CHKERRQ(ierr); 765*801fbe65SHong Zhang k = 0; 766*801fbe65SHong Zhang for (proc=0; proc<mumps->size; proc++){ 767*801fbe65SHong Zhang for (j=0; j<nrhs; j++){ 768*801fbe65SHong Zhang for (i=rstart[proc]; i<rstart[proc+1]; i++){ 769*801fbe65SHong Zhang iidx[j*M + i] = k; 770*801fbe65SHong Zhang idx[k++] = j*M + i; 771*801fbe65SHong Zhang } 772*801fbe65SHong Zhang } 7732cd7d884SHong Zhang } 7742cd7d884SHong Zhang 775*801fbe65SHong Zhang if (!mumps->myid) { 776*801fbe65SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,nrhs*M,&mumps->bb_seq);CHKERRQ(ierr); 777*801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*M,idx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 778*801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*M,0,1,&is_from);CHKERRQ(ierr); 779*801fbe65SHong Zhang } else { 780*801fbe65SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->bb_seq);CHKERRQ(ierr); 781*801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_to);CHKERRQ(ierr); 782*801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_from);CHKERRQ(ierr); 783*801fbe65SHong Zhang } 784*801fbe65SHong Zhang ierr = VecScatterCreate(mumps->bb_mpi,is_from,mumps->bb_seq,is_to,&mumps->scat_rhss);CHKERRQ(ierr); 785*801fbe65SHong Zhang ierr = VecScatterBegin(mumps->scat_rhss,mumps->bb_mpi,mumps->bb_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 786*801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 787*801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 788*801fbe65SHong Zhang ierr = VecScatterEnd(mumps->scat_rhss,mumps->bb_mpi,mumps->bb_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 789*801fbe65SHong Zhang 790*801fbe65SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 791*801fbe65SHong Zhang ierr = VecGetArray(mumps->bb_seq,&bray);CHKERRQ(ierr); 792*801fbe65SHong Zhang mumps->id.nrhs = nrhs; 793*801fbe65SHong Zhang mumps->id.lrhs = M; 794*801fbe65SHong Zhang #if defined(PETSC_USE_COMPLEX) 795*801fbe65SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 796*801fbe65SHong Zhang mumps->id.rhs = (mumps_complex*)bray; 797*801fbe65SHong Zhang #else 798*801fbe65SHong Zhang mumps->id.rhs = (mumps_double_complex*)bray; 799*801fbe65SHong Zhang #endif 800*801fbe65SHong Zhang #else 801*801fbe65SHong Zhang mumps->id.rhs = bray; 802*801fbe65SHong Zhang #endif 803*801fbe65SHong Zhang ierr = VecRestoreArray(mumps->bb_seq,&bray);CHKERRQ(ierr); 804*801fbe65SHong Zhang } 805*801fbe65SHong Zhang 806*801fbe65SHong Zhang /* solve phase */ 807*801fbe65SHong Zhang /*-------------*/ 808*801fbe65SHong Zhang mumps->id.job = JOB_SOLVE; 809*801fbe65SHong Zhang PetscMUMPS_c(&mumps->id); 810*801fbe65SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 811*801fbe65SHong Zhang 812*801fbe65SHong Zhang /* put mumps distributed solution to petsc vector xx_mpi, which shares local arrays with solution matrix X */ 813*801fbe65SHong Zhang 814*801fbe65SHong Zhang /* create scatter scat_sols */ 815*801fbe65SHong Zhang ierr = PetscMalloc1(nrhs*mumps->id.lsol_loc,&idxx);CHKERRQ(ierr); 816*801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*mumps->id.lsol_loc,0,1,&is_from);CHKERRQ(ierr); 817*801fbe65SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 818*801fbe65SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 819*801fbe65SHong Zhang idxx[i] = iidx[mumps->id.isol_loc[i]]; 820*801fbe65SHong Zhang for (j=1; j<nrhs; j++){ 821*801fbe65SHong Zhang idxx[j*mumps->id.lsol_loc+i] = iidx[mumps->id.isol_loc[i]+j*M]; 822*801fbe65SHong Zhang } 823*801fbe65SHong Zhang } 824*801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*mumps->id.lsol_loc,idxx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 825*801fbe65SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_from,mumps->xx_mpi,is_to,&mumps->scat_sols);CHKERRQ(ierr); 826*801fbe65SHong Zhang ierr = VecScatterBegin(mumps->scat_sols,mumps->x_seq,mumps->xx_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 827*801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 828*801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 829*801fbe65SHong Zhang ierr = VecScatterEnd(mumps->scat_sols,mumps->x_seq,mumps->xx_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 830*801fbe65SHong Zhang 831*801fbe65SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 832*801fbe65SHong Zhang //ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 833*801fbe65SHong Zhang //mumps->id.sol_loc = sol_loc_save; 834*801fbe65SHong Zhang //mumps->id.isol_loc = isol_loc_save; 835*801fbe65SHong Zhang //ierr = PetscFree2(sol_loc,isol_loc);CHKERRQ(ierr); 836*801fbe65SHong Zhang ierr = PetscFree2(idx,iidx);CHKERRQ(ierr); 837*801fbe65SHong Zhang ierr = PetscFree(idxx);CHKERRQ(ierr); 838*801fbe65SHong Zhang } 839e0b74bf9SHong Zhang PetscFunctionReturn(0); 840e0b74bf9SHong Zhang } 841e0b74bf9SHong Zhang 842ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 843a58c3f20SHong Zhang /* 844a58c3f20SHong Zhang input: 845a58c3f20SHong Zhang F: numeric factor 846a58c3f20SHong Zhang output: 847a58c3f20SHong Zhang nneg: total number of negative pivots 848a58c3f20SHong Zhang nzero: 0 849a58c3f20SHong Zhang npos: (global dimension of F) - nneg 850a58c3f20SHong Zhang */ 851a58c3f20SHong Zhang 852a58c3f20SHong Zhang #undef __FUNCT__ 853a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 854dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 855a58c3f20SHong Zhang { 856a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 857dfbe8321SBarry Smith PetscErrorCode ierr; 858c1490034SHong Zhang PetscMPIInt size; 859a58c3f20SHong Zhang 860a58c3f20SHong Zhang PetscFunctionBegin; 861ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 862bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 863a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 864ed85ac9fSHong Zhang 865710ac8efSHong Zhang if (nneg) *nneg = mumps->id.INFOG(12); 866ed85ac9fSHong Zhang if (nzero || npos) { 867ed85ac9fSHong Zhang if (mumps->id.ICNTL(24) != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"-mat_mumps_icntl_24 must be set as 1 for null pivot row detection"); 868710ac8efSHong Zhang if (nzero) *nzero = mumps->id.INFOG(28); 869710ac8efSHong Zhang if (npos) *npos = F->rmap->N - (mumps->id.INFOG(12) + mumps->id.INFOG(28)); 870a58c3f20SHong Zhang } 871a58c3f20SHong Zhang PetscFunctionReturn(0); 872a58c3f20SHong Zhang } 873ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 874a58c3f20SHong Zhang 875397b6df1SKris Buschelman #undef __FUNCT__ 876f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 8770481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 878af281ebdSHong Zhang { 879a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->spptr; 8806849ba73SBarry Smith PetscErrorCode ierr; 881e09efc27SHong Zhang Mat F_diag; 882ace3abfcSBarry Smith PetscBool isMPIAIJ; 883397b6df1SKris Buschelman 884397b6df1SKris Buschelman PetscFunctionBegin; 885a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 886397b6df1SKris Buschelman 887397b6df1SKris Buschelman /* numerical factorization phase */ 888329ec9b3SHong Zhang /*-------------------------------*/ 889a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 8904e34a73bSHong Zhang if (!mumps->id.ICNTL(18)) { /* A is centralized */ 891a5e57a09SHong Zhang if (!mumps->myid) { 892397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 8932907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 894a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 8952907cef9SHong Zhang #else 896a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 8972907cef9SHong Zhang #endif 898397b6df1SKris Buschelman #else 899a5e57a09SHong Zhang mumps->id.a = mumps->val; 900397b6df1SKris Buschelman #endif 901397b6df1SKris Buschelman } 902397b6df1SKris Buschelman } else { 903397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 9042907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 905a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 9062907cef9SHong Zhang #else 907a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 9082907cef9SHong Zhang #endif 909397b6df1SKris Buschelman #else 910a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 911397b6df1SKris Buschelman #endif 912397b6df1SKris Buschelman } 913a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 914a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 915151787a6SHong Zhang if (mumps->id.INFO(1) == -13) { 916151787a6SHong Zhang if (mumps->id.INFO(2) < 0) { 917151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",-mumps->id.INFO(2)); 918151787a6SHong Zhang } else { 919151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d bytes\n",mumps->id.INFO(2)); 920151787a6SHong Zhang } 921151787a6SHong Zhang } else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2)); 922397b6df1SKris Buschelman } 923a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 924397b6df1SKris Buschelman 925dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 926a5e57a09SHong Zhang mumps->matstruc = SAME_NONZERO_PATTERN; 927a5e57a09SHong Zhang mumps->CleanUpMUMPS = PETSC_TRUE; 92867877ebaSShri Abhyankar 929a5e57a09SHong Zhang if (mumps->size > 1) { 93067877ebaSShri Abhyankar PetscInt lsol_loc; 93167877ebaSShri Abhyankar PetscScalar *sol_loc; 9322205254eSKarl Rupp 933c2093ab7SHong Zhang ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 934c2093ab7SHong Zhang if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A; 935c2093ab7SHong Zhang else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A; 936c2093ab7SHong Zhang F_diag->assembled = PETSC_TRUE; 937c2093ab7SHong Zhang 938c2093ab7SHong Zhang /* distributed solution; Create x_seq=sol_loc for repeated use */ 939c2093ab7SHong Zhang if (mumps->x_seq) { 940c2093ab7SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 941c2093ab7SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 942c2093ab7SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 943c2093ab7SHong Zhang } 944a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 945dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 946a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 94767877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 9482907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 949a5e57a09SHong Zhang mumps->id.sol_loc = (mumps_complex*)sol_loc; 9502907cef9SHong Zhang #else 951a5e57a09SHong Zhang mumps->id.sol_loc = (mumps_double_complex*)sol_loc; 9522907cef9SHong Zhang #endif 95367877ebaSShri Abhyankar #else 954a5e57a09SHong Zhang mumps->id.sol_loc = sol_loc; 95567877ebaSShri Abhyankar #endif 956a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 95767877ebaSShri Abhyankar } 958397b6df1SKris Buschelman PetscFunctionReturn(0); 959397b6df1SKris Buschelman } 960397b6df1SKris Buschelman 9619a2535b5SHong Zhang /* Sets MUMPS options from the options database */ 962dcd589f8SShri Abhyankar #undef __FUNCT__ 9639a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 9649a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A) 965dcd589f8SShri Abhyankar { 9669a2535b5SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 967dcd589f8SShri Abhyankar PetscErrorCode ierr; 968dcd589f8SShri Abhyankar PetscInt icntl; 969ace3abfcSBarry Smith PetscBool flg; 970dcd589f8SShri Abhyankar 971dcd589f8SShri Abhyankar PetscFunctionBegin; 972ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 9739a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 9749a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 9759a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 9769a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 9779a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 9789a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 979dcd589f8SShri Abhyankar 9809a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 9819a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 9829a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 9839a2535b5SHong Zhang 984d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 9859a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 9869a2535b5SHong Zhang 987d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 988dcd589f8SShri Abhyankar if (flg) { 9892205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 9902205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 991dcd589f8SShri Abhyankar } 992e0b74bf9SHong Zhang 9930298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 994d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_9","ICNTL(9): computes the solution using A or A^T","None",mumps->id.ICNTL(9),&mumps->id.ICNTL(9),NULL);CHKERRQ(ierr); handled by MatSolveTranspose_MUMPS() */ 9950298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 996d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to an error analysis (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 997d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): an ordering strategy for symmetric matrices (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 998d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 999d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage increase in the estimated working space","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 1000d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): computes the Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 10014e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_20","ICNTL(20): the format (dense or sparse) of the right-hand sides","None",mumps->id.ICNTL(20),&mumps->id.ICNTL(20),NULL);CHKERRQ(ierr); -- sparse rhs is not supported in PETSc API */ 1002d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_21","ICNTL(21): the distribution (centralized or distributed) of the solution vectors","None",mumps->id.ICNTL(21),&mumps->id.ICNTL(21),NULL);CHKERRQ(ierr); we only use distributed solution vector */ 10039a2535b5SHong Zhang 1004d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core factorization and solve (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 10050298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 10060298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 10079a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 10089a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 1009d7ebd59bSHong Zhang } 1010d7ebd59bSHong Zhang 1011d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): compute a solution of a deficient matrix and a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 1012d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): drives the solution phase if a Schur complement matrix","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 10132cd7d884SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): the blocking size for multiple right-hand sides","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 10140298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 1015d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 10160298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 1017d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): indicates which factors may be discarded during factorization","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 10184e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_32","ICNTL(32): performs the forward elemination of the right-hand sides during factorization","None",mumps->id.ICNTL(32),&mumps->id.ICNTL(32),NULL);CHKERRQ(ierr); -- not supported by PETSc API */ 10190298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 1020dcd589f8SShri Abhyankar 10210298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 10220298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 10230298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 10240298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 10250298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 1026e5bb22a1SHong Zhang 10270298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 1028dcd589f8SShri Abhyankar PetscOptionsEnd(); 1029dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1030dcd589f8SShri Abhyankar } 1031dcd589f8SShri Abhyankar 1032dcd589f8SShri Abhyankar #undef __FUNCT__ 1033dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 1034f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 1035dcd589f8SShri Abhyankar { 1036dcd589f8SShri Abhyankar PetscErrorCode ierr; 1037dcd589f8SShri Abhyankar 1038dcd589f8SShri Abhyankar PetscFunctionBegin; 1039ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 1040ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 1041ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 10422205254eSKarl Rupp 1043f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 1044f697e70eSHong Zhang 1045f697e70eSHong Zhang mumps->id.job = JOB_INIT; 1046f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 1047f697e70eSHong Zhang mumps->id.sym = mumps->sym; 10482907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 1049f697e70eSHong Zhang 1050f697e70eSHong Zhang mumps->CleanUpMUMPS = PETSC_FALSE; 10510298fd71SBarry Smith mumps->scat_rhs = NULL; 10520298fd71SBarry Smith mumps->scat_sol = NULL; 10539a2535b5SHong Zhang 105470544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 10559a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 10569a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 10579a2535b5SHong Zhang if (mumps->size == 1) { 10589a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 10599a2535b5SHong Zhang } else { 10609a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 10614e34a73bSHong Zhang mumps->id.ICNTL(20) = 0; /* rhs is in dense format */ 106270544d5fSHong Zhang mumps->id.ICNTL(21) = 1; /* distributed solution */ 10639a2535b5SHong Zhang } 1064dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1065dcd589f8SShri Abhyankar } 1066dcd589f8SShri Abhyankar 1067a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 1068397b6df1SKris Buschelman #undef __FUNCT__ 1069f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 10700481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1071b24902e0SBarry Smith { 1072a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1073dcd589f8SShri Abhyankar PetscErrorCode ierr; 107467877ebaSShri Abhyankar Vec b; 107567877ebaSShri Abhyankar IS is_iden; 107667877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1077397b6df1SKris Buschelman 1078397b6df1SKris Buschelman PetscFunctionBegin; 1079a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1080dcd589f8SShri Abhyankar 10819a2535b5SHong Zhang /* Set MUMPS options from the options database */ 10829a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1083dcd589f8SShri Abhyankar 1084a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1085dcd589f8SShri Abhyankar 108667877ebaSShri Abhyankar /* analysis phase */ 108767877ebaSShri Abhyankar /*----------------*/ 1088a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1089a5e57a09SHong Zhang mumps->id.n = M; 1090a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 109167877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1092a5e57a09SHong Zhang if (!mumps->myid) { 1093a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1094a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 109567877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 10962907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1097a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 10982907cef9SHong Zhang #else 1099a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 11002907cef9SHong Zhang #endif 110167877ebaSShri Abhyankar #else 1102a5e57a09SHong Zhang mumps->id.a = mumps->val; 110367877ebaSShri Abhyankar #endif 110467877ebaSShri Abhyankar } 1105a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */ 11065248a706SHong Zhang /* 11075248a706SHong Zhang PetscBool flag; 11085248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 11095248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 11105248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 11115248a706SHong Zhang */ 1112a5e57a09SHong Zhang if (!mumps->myid) { 1113e0b74bf9SHong Zhang const PetscInt *idx; 1114e0b74bf9SHong Zhang PetscInt i,*perm_in; 11152205254eSKarl Rupp 1116785e854fSJed Brown ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr); 1117e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 11182205254eSKarl Rupp 1119a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 1120e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! */ 1121e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 1122e0b74bf9SHong Zhang } 1123e0b74bf9SHong Zhang } 112467877ebaSShri Abhyankar } 112567877ebaSShri Abhyankar break; 112667877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1127a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1128a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1129a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 113067877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 11312907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1132a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 11332907cef9SHong Zhang #else 1134a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 11352907cef9SHong Zhang #endif 113667877ebaSShri Abhyankar #else 1137a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 113867877ebaSShri Abhyankar #endif 113967877ebaSShri Abhyankar } 114067877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1141a5e57a09SHong Zhang if (!mumps->myid) { 11422cd7d884SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->rmap->N,&mumps->b_seq);CHKERRQ(ierr); 11432cd7d884SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,A->rmap->N,0,1,&is_iden);CHKERRQ(ierr); 114467877ebaSShri Abhyankar } else { 1145a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 114667877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 114767877ebaSShri Abhyankar } 11482a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1149a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 11506bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 11516bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 115267877ebaSShri Abhyankar break; 115367877ebaSShri Abhyankar } 1154a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1155a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 115667877ebaSShri Abhyankar 1157719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1158dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 115951d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 11604e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 1161b24902e0SBarry Smith PetscFunctionReturn(0); 1162b24902e0SBarry Smith } 1163b24902e0SBarry Smith 1164450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 1165450b117fSShri Abhyankar #undef __FUNCT__ 1166450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 1167450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1168450b117fSShri Abhyankar { 1169a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1170dcd589f8SShri Abhyankar PetscErrorCode ierr; 117167877ebaSShri Abhyankar Vec b; 117267877ebaSShri Abhyankar IS is_iden; 117367877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1174450b117fSShri Abhyankar 1175450b117fSShri Abhyankar PetscFunctionBegin; 1176a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1177dcd589f8SShri Abhyankar 11789a2535b5SHong Zhang /* Set MUMPS options from the options database */ 11799a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1180dcd589f8SShri Abhyankar 1181a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 118267877ebaSShri Abhyankar 118367877ebaSShri Abhyankar /* analysis phase */ 118467877ebaSShri Abhyankar /*----------------*/ 1185a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1186a5e57a09SHong Zhang mumps->id.n = M; 1187a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 118867877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1189a5e57a09SHong Zhang if (!mumps->myid) { 1190a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1191a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 119267877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 11932907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1194a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 11952907cef9SHong Zhang #else 1196a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 11972907cef9SHong Zhang #endif 119867877ebaSShri Abhyankar #else 1199a5e57a09SHong Zhang mumps->id.a = mumps->val; 120067877ebaSShri Abhyankar #endif 120167877ebaSShri Abhyankar } 120267877ebaSShri Abhyankar } 120367877ebaSShri Abhyankar break; 120467877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1205a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1206a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1207a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 120867877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 12092907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1210a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 12112907cef9SHong Zhang #else 1212a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 12132907cef9SHong Zhang #endif 121467877ebaSShri Abhyankar #else 1215a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 121667877ebaSShri Abhyankar #endif 121767877ebaSShri Abhyankar } 121867877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1219a5e57a09SHong Zhang if (!mumps->myid) { 1220a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 122167877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 122267877ebaSShri Abhyankar } else { 1223a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 122467877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 122567877ebaSShri Abhyankar } 12262a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1227a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 12286bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 12296bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 123067877ebaSShri Abhyankar break; 123167877ebaSShri Abhyankar } 1232a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1233a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 123467877ebaSShri Abhyankar 1235450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1236dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 123751d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1238450b117fSShri Abhyankar PetscFunctionReturn(0); 1239450b117fSShri Abhyankar } 1240b24902e0SBarry Smith 1241141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1242397b6df1SKris Buschelman #undef __FUNCT__ 124367877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 124467877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1245b24902e0SBarry Smith { 1246a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1247dcd589f8SShri Abhyankar PetscErrorCode ierr; 124867877ebaSShri Abhyankar Vec b; 124967877ebaSShri Abhyankar IS is_iden; 125067877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1251397b6df1SKris Buschelman 1252397b6df1SKris Buschelman PetscFunctionBegin; 1253a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1254dcd589f8SShri Abhyankar 12559a2535b5SHong Zhang /* Set MUMPS options from the options database */ 12569a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1257dcd589f8SShri Abhyankar 1258a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1259dcd589f8SShri Abhyankar 126067877ebaSShri Abhyankar /* analysis phase */ 126167877ebaSShri Abhyankar /*----------------*/ 1262a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1263a5e57a09SHong Zhang mumps->id.n = M; 1264a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 126567877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1266a5e57a09SHong Zhang if (!mumps->myid) { 1267a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1268a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 126967877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 12702907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1271a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 12722907cef9SHong Zhang #else 1273a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 12742907cef9SHong Zhang #endif 127567877ebaSShri Abhyankar #else 1276a5e57a09SHong Zhang mumps->id.a = mumps->val; 127767877ebaSShri Abhyankar #endif 127867877ebaSShri Abhyankar } 127967877ebaSShri Abhyankar } 128067877ebaSShri Abhyankar break; 128167877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1282a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1283a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1284a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 128567877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 12862907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1287a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 12882907cef9SHong Zhang #else 1289a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 12902907cef9SHong Zhang #endif 129167877ebaSShri Abhyankar #else 1292a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 129367877ebaSShri Abhyankar #endif 129467877ebaSShri Abhyankar } 129567877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1296a5e57a09SHong Zhang if (!mumps->myid) { 1297a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 129867877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 129967877ebaSShri Abhyankar } else { 1300a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 130167877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 130267877ebaSShri Abhyankar } 13032a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1304a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 13056bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 13066bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 130767877ebaSShri Abhyankar break; 130867877ebaSShri Abhyankar } 1309a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1310a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 131167877ebaSShri Abhyankar 13122792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1313dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 131451d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 13154e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 13164e34a73bSHong Zhang #if defined(PETSC_USE_COMPLEX) 13170298fd71SBarry Smith F->ops->getinertia = NULL; 13184e34a73bSHong Zhang #else 13194e34a73bSHong Zhang F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1320db4efbfdSBarry Smith #endif 1321b24902e0SBarry Smith PetscFunctionReturn(0); 1322b24902e0SBarry Smith } 1323b24902e0SBarry Smith 13244e34a73bSHong Zhang //update!!! 1325397b6df1SKris Buschelman #undef __FUNCT__ 132664e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 132764e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 132874ed9c26SBarry Smith { 1329f6c57405SHong Zhang PetscErrorCode ierr; 133064e6c443SBarry Smith PetscBool iascii; 133164e6c443SBarry Smith PetscViewerFormat format; 1332a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 1333f6c57405SHong Zhang 1334f6c57405SHong Zhang PetscFunctionBegin; 133564e6c443SBarry Smith /* check if matrix is mumps type */ 133664e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 133764e6c443SBarry Smith 1338251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 133964e6c443SBarry Smith if (iascii) { 134064e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 134164e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 134264e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1343a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1344a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1345a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1346a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1347a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1348a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1349a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 1350a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1351a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1352a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1353a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1354a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1355a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1356a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1357a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1358a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1359a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1360a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1361a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1362f6c57405SHong Zhang } 1363a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1364a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1365a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1366f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1367a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1368a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1369a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1370a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (somumpstion struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1371a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1372a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1373c0165424SHong Zhang 1374a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1375a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1376a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1377a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1378a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1379a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr); 138042179a6aSHong Zhang 1381a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1382a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1383a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1384f6c57405SHong Zhang 1385a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1386a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1387a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absomumpste pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1388a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (vamumpse of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1389a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1390f6c57405SHong Zhang 1391f6c57405SHong Zhang /* infomation local to each processor */ 139234ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 13937b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 1394a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 139534ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 139634ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1397a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 139834ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 139934ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1400a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 140134ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1402f6c57405SHong Zhang 140334ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1404a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 140534ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1406f6c57405SHong Zhang 140734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1408a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 140934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1410f6c57405SHong Zhang 141134ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1412a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 141334ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 14147b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr); 1415f6c57405SHong Zhang 1416a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1417a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 1418a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1419a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1420a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1421f6c57405SHong Zhang 1422a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1423a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1424a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1425a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1426a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1427a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1428a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1429a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr); 1430a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1431a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1432a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1433a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1434a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1435a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1436a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 1437a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1438a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr); 1439a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1440a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1441a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1442a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1443a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1444a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 144540d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(28) (after factorization: number of null pivots encountered): %d\n",mumps->id.INFOG(28));CHKERRQ(ierr); 144640d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(29) (after factorization: effective number of entries in the factors (sum over all processors)): %d\n",mumps->id.INFOG(29));CHKERRQ(ierr); 144740d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(30, 31) (after solution: size in Mbytes of memory used during solution phase): %d, %d\n",mumps->id.INFOG(30),mumps->id.INFOG(31));CHKERRQ(ierr); 144840d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(32) (after analysis: type of analysis done): %d\n",mumps->id.INFOG(32));CHKERRQ(ierr); 144940d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(33) (value used for ICNTL(8)): %d\n",mumps->id.INFOG(33));CHKERRQ(ierr); 145040d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(34) (exponent of the determinant if determinant is requested): %d\n",mumps->id.INFOG(34));CHKERRQ(ierr); 1451f6c57405SHong Zhang } 1452f6c57405SHong Zhang } 1453cb828f0fSHong Zhang } 1454f6c57405SHong Zhang PetscFunctionReturn(0); 1455f6c57405SHong Zhang } 1456f6c57405SHong Zhang 145735bd34faSBarry Smith #undef __FUNCT__ 145835bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 145935bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 146035bd34faSBarry Smith { 1461cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 146235bd34faSBarry Smith 146335bd34faSBarry Smith PetscFunctionBegin; 146435bd34faSBarry Smith info->block_size = 1.0; 1465cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1466cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 146735bd34faSBarry Smith info->nz_unneeded = 0.0; 146835bd34faSBarry Smith info->assemblies = 0.0; 146935bd34faSBarry Smith info->mallocs = 0.0; 147035bd34faSBarry Smith info->memory = 0.0; 147135bd34faSBarry Smith info->fill_ratio_given = 0; 147235bd34faSBarry Smith info->fill_ratio_needed = 0; 147335bd34faSBarry Smith info->factor_mallocs = 0; 147435bd34faSBarry Smith PetscFunctionReturn(0); 147535bd34faSBarry Smith } 147635bd34faSBarry Smith 14775ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 14785ccb76cbSHong Zhang #undef __FUNCT__ 14795ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 14805ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 14815ccb76cbSHong Zhang { 1482a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 14835ccb76cbSHong Zhang 14845ccb76cbSHong Zhang PetscFunctionBegin; 1485a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 14865ccb76cbSHong Zhang PetscFunctionReturn(0); 14875ccb76cbSHong Zhang } 14885ccb76cbSHong Zhang 14895ccb76cbSHong Zhang #undef __FUNCT__ 1490bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl_MUMPS" 1491bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt *ival) 1492bc6112feSHong Zhang { 1493bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1494bc6112feSHong Zhang 1495bc6112feSHong Zhang PetscFunctionBegin; 1496bc6112feSHong Zhang *ival = mumps->id.ICNTL(icntl); 1497bc6112feSHong Zhang PetscFunctionReturn(0); 1498bc6112feSHong Zhang } 1499bc6112feSHong Zhang 1500bc6112feSHong Zhang #undef __FUNCT__ 15015ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 15025ccb76cbSHong Zhang /*@ 15035ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 15045ccb76cbSHong Zhang 15055ccb76cbSHong Zhang Logically Collective on Mat 15065ccb76cbSHong Zhang 15075ccb76cbSHong Zhang Input Parameters: 15085ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 15095ccb76cbSHong Zhang . icntl - index of MUMPS parameter array ICNTL() 15105ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 15115ccb76cbSHong Zhang 15125ccb76cbSHong Zhang Options Database: 15135ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 15145ccb76cbSHong Zhang 15155ccb76cbSHong Zhang Level: beginner 15165ccb76cbSHong Zhang 15175ccb76cbSHong Zhang References: MUMPS Users' Guide 15185ccb76cbSHong Zhang 15195ccb76cbSHong Zhang .seealso: MatGetFactor() 15205ccb76cbSHong Zhang @*/ 15215ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 15225ccb76cbSHong Zhang { 15235ccb76cbSHong Zhang PetscErrorCode ierr; 15245ccb76cbSHong Zhang 15255ccb76cbSHong Zhang PetscFunctionBegin; 15265ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 15275ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 15285ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 15295ccb76cbSHong Zhang PetscFunctionReturn(0); 15305ccb76cbSHong Zhang } 15315ccb76cbSHong Zhang 1532bc6112feSHong Zhang #undef __FUNCT__ 1533bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl" 1534a21f80fcSHong Zhang /*@ 1535a21f80fcSHong Zhang MatMumpsGetIcntl - Get MUMPS parameter ICNTL() 1536a21f80fcSHong Zhang 1537a21f80fcSHong Zhang Logically Collective on Mat 1538a21f80fcSHong Zhang 1539a21f80fcSHong Zhang Input Parameters: 1540a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1541a21f80fcSHong Zhang - icntl - index of MUMPS parameter array ICNTL() 1542a21f80fcSHong Zhang 1543a21f80fcSHong Zhang Output Parameter: 1544a21f80fcSHong Zhang . ival - value of MUMPS ICNTL(icntl) 1545a21f80fcSHong Zhang 1546a21f80fcSHong Zhang Level: beginner 1547a21f80fcSHong Zhang 1548a21f80fcSHong Zhang References: MUMPS Users' Guide 1549a21f80fcSHong Zhang 1550a21f80fcSHong Zhang .seealso: MatGetFactor() 1551a21f80fcSHong Zhang @*/ 1552bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl(Mat F,PetscInt icntl,PetscInt *ival) 1553bc6112feSHong Zhang { 1554bc6112feSHong Zhang PetscErrorCode ierr; 1555bc6112feSHong Zhang 1556bc6112feSHong Zhang PetscFunctionBegin; 1557bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 1558bc6112feSHong Zhang PetscValidIntPointer(ival,3); 1559bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetIcntl_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 1560bc6112feSHong Zhang PetscFunctionReturn(0); 1561bc6112feSHong Zhang } 1562bc6112feSHong Zhang 15638928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 15648928b65cSHong Zhang #undef __FUNCT__ 15658928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 15668928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 15678928b65cSHong Zhang { 15688928b65cSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 15698928b65cSHong Zhang 15708928b65cSHong Zhang PetscFunctionBegin; 15718928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 15728928b65cSHong Zhang PetscFunctionReturn(0); 15738928b65cSHong Zhang } 15748928b65cSHong Zhang 15758928b65cSHong Zhang #undef __FUNCT__ 1576bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl_MUMPS" 1577bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal *val) 1578bc6112feSHong Zhang { 1579bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1580bc6112feSHong Zhang 1581bc6112feSHong Zhang PetscFunctionBegin; 1582bc6112feSHong Zhang *val = mumps->id.CNTL(icntl); 1583bc6112feSHong Zhang PetscFunctionReturn(0); 1584bc6112feSHong Zhang } 1585bc6112feSHong Zhang 1586bc6112feSHong Zhang #undef __FUNCT__ 15878928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 15888928b65cSHong Zhang /*@ 15898928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 15908928b65cSHong Zhang 15918928b65cSHong Zhang Logically Collective on Mat 15928928b65cSHong Zhang 15938928b65cSHong Zhang Input Parameters: 15948928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 15958928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 15968928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 15978928b65cSHong Zhang 15988928b65cSHong Zhang Options Database: 15998928b65cSHong Zhang . -mat_mumps_cntl_<icntl> <val> 16008928b65cSHong Zhang 16018928b65cSHong Zhang Level: beginner 16028928b65cSHong Zhang 16038928b65cSHong Zhang References: MUMPS Users' Guide 16048928b65cSHong Zhang 16058928b65cSHong Zhang .seealso: MatGetFactor() 16068928b65cSHong Zhang @*/ 16078928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 16088928b65cSHong Zhang { 16098928b65cSHong Zhang PetscErrorCode ierr; 16108928b65cSHong Zhang 16118928b65cSHong Zhang PetscFunctionBegin; 16128928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 1613bc6112feSHong Zhang PetscValidLogicalCollectiveReal(F,val,3); 16148928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 16158928b65cSHong Zhang PetscFunctionReturn(0); 16168928b65cSHong Zhang } 16178928b65cSHong Zhang 1618bc6112feSHong Zhang #undef __FUNCT__ 1619bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl" 1620a21f80fcSHong Zhang /*@ 1621a21f80fcSHong Zhang MatMumpsGetCntl - Get MUMPS parameter CNTL() 1622a21f80fcSHong Zhang 1623a21f80fcSHong Zhang Logically Collective on Mat 1624a21f80fcSHong Zhang 1625a21f80fcSHong Zhang Input Parameters: 1626a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1627a21f80fcSHong Zhang - icntl - index of MUMPS parameter array CNTL() 1628a21f80fcSHong Zhang 1629a21f80fcSHong Zhang Output Parameter: 1630a21f80fcSHong Zhang . val - value of MUMPS CNTL(icntl) 1631a21f80fcSHong Zhang 1632a21f80fcSHong Zhang Level: beginner 1633a21f80fcSHong Zhang 1634a21f80fcSHong Zhang References: MUMPS Users' Guide 1635a21f80fcSHong Zhang 1636a21f80fcSHong Zhang .seealso: MatGetFactor() 1637a21f80fcSHong Zhang @*/ 1638bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl(Mat F,PetscInt icntl,PetscReal *val) 1639bc6112feSHong Zhang { 1640bc6112feSHong Zhang PetscErrorCode ierr; 1641bc6112feSHong Zhang 1642bc6112feSHong Zhang PetscFunctionBegin; 1643bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 1644bc6112feSHong Zhang PetscValidRealPointer(val,3); 1645bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetCntl_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 1646bc6112feSHong Zhang PetscFunctionReturn(0); 1647bc6112feSHong Zhang } 1648bc6112feSHong Zhang 1649bc6112feSHong Zhang #undef __FUNCT__ 1650ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo_MUMPS" 1651ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo_MUMPS(Mat F,PetscInt icntl,PetscInt *info) 1652bc6112feSHong Zhang { 1653bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1654bc6112feSHong Zhang 1655bc6112feSHong Zhang PetscFunctionBegin; 1656bc6112feSHong Zhang *info = mumps->id.INFO(icntl); 1657bc6112feSHong Zhang PetscFunctionReturn(0); 1658bc6112feSHong Zhang } 1659bc6112feSHong Zhang 1660bc6112feSHong Zhang #undef __FUNCT__ 1661ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog_MUMPS" 1662ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog_MUMPS(Mat F,PetscInt icntl,PetscInt *infog) 1663bc6112feSHong Zhang { 1664bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1665bc6112feSHong Zhang 1666bc6112feSHong Zhang PetscFunctionBegin; 1667bc6112feSHong Zhang *infog = mumps->id.INFOG(icntl); 1668bc6112feSHong Zhang PetscFunctionReturn(0); 1669bc6112feSHong Zhang } 1670bc6112feSHong Zhang 1671bc6112feSHong Zhang #undef __FUNCT__ 1672ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo_MUMPS" 1673ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfo) 1674bc6112feSHong Zhang { 1675bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1676bc6112feSHong Zhang 1677bc6112feSHong Zhang PetscFunctionBegin; 1678bc6112feSHong Zhang *rinfo = mumps->id.RINFO(icntl); 1679bc6112feSHong Zhang PetscFunctionReturn(0); 1680bc6112feSHong Zhang } 1681bc6112feSHong Zhang 1682bc6112feSHong Zhang #undef __FUNCT__ 1683ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog_MUMPS" 1684ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfog) 1685bc6112feSHong Zhang { 1686bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1687bc6112feSHong Zhang 1688bc6112feSHong Zhang PetscFunctionBegin; 1689bc6112feSHong Zhang *rinfog = mumps->id.RINFOG(icntl); 1690bc6112feSHong Zhang PetscFunctionReturn(0); 1691bc6112feSHong Zhang } 1692bc6112feSHong Zhang 1693bc6112feSHong Zhang #undef __FUNCT__ 1694ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo" 1695a21f80fcSHong Zhang /*@ 1696a21f80fcSHong Zhang MatMumpsGetInfo - Get MUMPS parameter INFO() 1697a21f80fcSHong Zhang 1698a21f80fcSHong Zhang Logically Collective on Mat 1699a21f80fcSHong Zhang 1700a21f80fcSHong Zhang Input Parameters: 1701a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1702a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFO() 1703a21f80fcSHong Zhang 1704a21f80fcSHong Zhang Output Parameter: 1705a21f80fcSHong Zhang . ival - value of MUMPS INFO(icntl) 1706a21f80fcSHong Zhang 1707a21f80fcSHong Zhang Level: beginner 1708a21f80fcSHong Zhang 1709a21f80fcSHong Zhang References: MUMPS Users' Guide 1710a21f80fcSHong Zhang 1711a21f80fcSHong Zhang .seealso: MatGetFactor() 1712a21f80fcSHong Zhang @*/ 1713ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo(Mat F,PetscInt icntl,PetscInt *ival) 1714bc6112feSHong Zhang { 1715bc6112feSHong Zhang PetscErrorCode ierr; 1716bc6112feSHong Zhang 1717bc6112feSHong Zhang PetscFunctionBegin; 1718ca810319SHong Zhang PetscValidIntPointer(ival,3); 1719ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfo_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 1720bc6112feSHong Zhang PetscFunctionReturn(0); 1721bc6112feSHong Zhang } 1722bc6112feSHong Zhang 1723bc6112feSHong Zhang #undef __FUNCT__ 1724ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog" 1725a21f80fcSHong Zhang /*@ 1726a21f80fcSHong Zhang MatMumpsGetInfog - Get MUMPS parameter INFOG() 1727a21f80fcSHong Zhang 1728a21f80fcSHong Zhang Logically Collective on Mat 1729a21f80fcSHong Zhang 1730a21f80fcSHong Zhang Input Parameters: 1731a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1732a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFOG() 1733a21f80fcSHong Zhang 1734a21f80fcSHong Zhang Output Parameter: 1735a21f80fcSHong Zhang . ival - value of MUMPS INFOG(icntl) 1736a21f80fcSHong Zhang 1737a21f80fcSHong Zhang Level: beginner 1738a21f80fcSHong Zhang 1739a21f80fcSHong Zhang References: MUMPS Users' Guide 1740a21f80fcSHong Zhang 1741a21f80fcSHong Zhang .seealso: MatGetFactor() 1742a21f80fcSHong Zhang @*/ 1743ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog(Mat F,PetscInt icntl,PetscInt *ival) 1744bc6112feSHong Zhang { 1745bc6112feSHong Zhang PetscErrorCode ierr; 1746bc6112feSHong Zhang 1747bc6112feSHong Zhang PetscFunctionBegin; 1748ca810319SHong Zhang PetscValidIntPointer(ival,3); 1749ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfog_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 1750bc6112feSHong Zhang PetscFunctionReturn(0); 1751bc6112feSHong Zhang } 1752bc6112feSHong Zhang 1753bc6112feSHong Zhang #undef __FUNCT__ 1754ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo" 1755a21f80fcSHong Zhang /*@ 1756a21f80fcSHong Zhang MatMumpsGetRinfo - Get MUMPS parameter RINFO() 1757a21f80fcSHong Zhang 1758a21f80fcSHong Zhang Logically Collective on Mat 1759a21f80fcSHong Zhang 1760a21f80fcSHong Zhang Input Parameters: 1761a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1762a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFO() 1763a21f80fcSHong Zhang 1764a21f80fcSHong Zhang Output Parameter: 1765a21f80fcSHong Zhang . val - value of MUMPS RINFO(icntl) 1766a21f80fcSHong Zhang 1767a21f80fcSHong Zhang Level: beginner 1768a21f80fcSHong Zhang 1769a21f80fcSHong Zhang References: MUMPS Users' Guide 1770a21f80fcSHong Zhang 1771a21f80fcSHong Zhang .seealso: MatGetFactor() 1772a21f80fcSHong Zhang @*/ 1773ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo(Mat F,PetscInt icntl,PetscReal *val) 1774bc6112feSHong Zhang { 1775bc6112feSHong Zhang PetscErrorCode ierr; 1776bc6112feSHong Zhang 1777bc6112feSHong Zhang PetscFunctionBegin; 1778bc6112feSHong Zhang PetscValidRealPointer(val,3); 1779ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfo_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 1780bc6112feSHong Zhang PetscFunctionReturn(0); 1781bc6112feSHong Zhang } 1782bc6112feSHong Zhang 1783bc6112feSHong Zhang #undef __FUNCT__ 1784ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog" 1785a21f80fcSHong Zhang /*@ 1786a21f80fcSHong Zhang MatMumpsGetRinfog - Get MUMPS parameter RINFOG() 1787a21f80fcSHong Zhang 1788a21f80fcSHong Zhang Logically Collective on Mat 1789a21f80fcSHong Zhang 1790a21f80fcSHong Zhang Input Parameters: 1791a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1792a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFOG() 1793a21f80fcSHong Zhang 1794a21f80fcSHong Zhang Output Parameter: 1795a21f80fcSHong Zhang . val - value of MUMPS RINFOG(icntl) 1796a21f80fcSHong Zhang 1797a21f80fcSHong Zhang Level: beginner 1798a21f80fcSHong Zhang 1799a21f80fcSHong Zhang References: MUMPS Users' Guide 1800a21f80fcSHong Zhang 1801a21f80fcSHong Zhang .seealso: MatGetFactor() 1802a21f80fcSHong Zhang @*/ 1803ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog(Mat F,PetscInt icntl,PetscReal *val) 1804bc6112feSHong Zhang { 1805bc6112feSHong Zhang PetscErrorCode ierr; 1806bc6112feSHong Zhang 1807bc6112feSHong Zhang PetscFunctionBegin; 1808bc6112feSHong Zhang PetscValidRealPointer(val,3); 1809ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfog_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 1810bc6112feSHong Zhang PetscFunctionReturn(0); 1811bc6112feSHong Zhang } 1812bc6112feSHong Zhang 181324b6179bSKris Buschelman /*MC 18142692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 181524b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 181624b6179bSKris Buschelman 181741c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 181824b6179bSKris Buschelman 181924b6179bSKris Buschelman Options Database Keys: 18204e34a73bSHong Zhang + -mat_mumps_icntl_1 <6>: ICNTL(1): output stream for error messages (None) 18214e34a73bSHong Zhang . -mat_mumps_icntl_2 <0>: ICNTL(2): output stream for diagnostic printing, statistics, and warning (None) 18224e34a73bSHong Zhang . -mat_mumps_icntl_3 <0>: ICNTL(3): output stream for global information, collected on the host (None) 18234e34a73bSHong Zhang . -mat_mumps_icntl_4 <0>: ICNTL(4): level of printing (0 to 4) (None) 18244e34a73bSHong Zhang . -mat_mumps_icntl_6 <7>: ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7) (None) 18254e34a73bSHong Zhang . -mat_mumps_icntl_7 <7>: ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis (None) 18264e34a73bSHong Zhang . -mat_mumps_icntl_8 <77>: ICNTL(8): scaling strategy (-2 to 8 or 77) (None) 18274e34a73bSHong Zhang . -mat_mumps_icntl_10 <0>: ICNTL(10): max num of refinements (None) 18284e34a73bSHong Zhang . -mat_mumps_icntl_11 <0>: ICNTL(11): statistics related to an error analysis (via -ksp_view) (None) 18294e34a73bSHong Zhang . -mat_mumps_icntl_12 <1>: ICNTL(12): an ordering strategy for symmetric matrices (0 to 3) (None) 18304e34a73bSHong Zhang . -mat_mumps_icntl_13 <0>: ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting (None) 18314e34a73bSHong Zhang . -mat_mumps_icntl_14 <20>: ICNTL(14): percentage increase in the estimated working space (None) 18324e34a73bSHong Zhang . -mat_mumps_icntl_19 <0>: ICNTL(19): computes the Schur complement (None) 18334e34a73bSHong Zhang . -mat_mumps_icntl_22 <0>: ICNTL(22): in-core/out-of-core factorization and solve (0 or 1) (None) 18344e34a73bSHong Zhang . -mat_mumps_icntl_23 <0>: ICNTL(23): max size of the working memory (MB) that can allocate per processor (None) 18354e34a73bSHong Zhang . -mat_mumps_icntl_24 <0>: ICNTL(24): detection of null pivot rows (0 or 1) (None) 18364e34a73bSHong Zhang . -mat_mumps_icntl_25 <0>: ICNTL(25): compute a solution of a deficient matrix and a null space basis (None) 18374e34a73bSHong Zhang . -mat_mumps_icntl_26 <0>: ICNTL(26): drives the solution phase if a Schur complement matrix (None) 18384e34a73bSHong Zhang . -mat_mumps_icntl_28 <1>: ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering (None) 18394e34a73bSHong Zhang . -mat_mumps_icntl_29 <0>: ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis (None) 18404e34a73bSHong Zhang . -mat_mumps_icntl_30 <0>: ICNTL(30): compute user-specified set of entries in inv(A) (None) 18414e34a73bSHong Zhang . -mat_mumps_icntl_31 <0>: ICNTL(31): indicates which factors may be discarded during factorization (None) 18424e34a73bSHong Zhang . -mat_mumps_icntl_33 <0>: ICNTL(33): compute determinant (None) 18434e34a73bSHong Zhang . -mat_mumps_cntl_1 <0.01>: CNTL(1): relative pivoting threshold (None) 18444e34a73bSHong Zhang . -mat_mumps_cntl_2 <1.49012e-08>: CNTL(2): stopping criterion of refinement (None) 18454e34a73bSHong Zhang . -mat_mumps_cntl_3 <0>: CNTL(3): absolute pivoting threshold (None) 18464e34a73bSHong Zhang . -mat_mumps_cntl_4 <-1>: CNTL(4): value for static pivoting (None) 18474e34a73bSHong Zhang - -mat_mumps_cntl_5 <0>: CNTL(5): fixation for null pivots (None) 184824b6179bSKris Buschelman 184924b6179bSKris Buschelman Level: beginner 185024b6179bSKris Buschelman 185141c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 185241c8de11SBarry Smith 185324b6179bSKris Buschelman M*/ 185424b6179bSKris Buschelman 185535bd34faSBarry Smith #undef __FUNCT__ 185635bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 1857f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 185835bd34faSBarry Smith { 185935bd34faSBarry Smith PetscFunctionBegin; 18602692d6eeSBarry Smith *type = MATSOLVERMUMPS; 186135bd34faSBarry Smith PetscFunctionReturn(0); 186235bd34faSBarry Smith } 186335bd34faSBarry Smith 1864bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 18652877fffaSHong Zhang #undef __FUNCT__ 1866bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 18678cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 18682877fffaSHong Zhang { 18692877fffaSHong Zhang Mat B; 18702877fffaSHong Zhang PetscErrorCode ierr; 18712877fffaSHong Zhang Mat_MUMPS *mumps; 1872ace3abfcSBarry Smith PetscBool isSeqAIJ; 18732877fffaSHong Zhang 18742877fffaSHong Zhang PetscFunctionBegin; 18752877fffaSHong Zhang /* Create the factorization matrix */ 1876251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 1877ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 18782877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 18792877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 1880bccb9932SShri Abhyankar if (isSeqAIJ) { 18810298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr); 1882bccb9932SShri Abhyankar } else { 18830298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr); 1884bccb9932SShri Abhyankar } 18852877fffaSHong Zhang 1886b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 18872205254eSKarl Rupp 18882877fffaSHong Zhang B->ops->view = MatView_MUMPS; 188935bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 189020be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 18912205254eSKarl Rupp 1892bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 1893bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 1894bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 1895bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 1896bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 1897bc6112feSHong Zhang 1898ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 1899ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 1900ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 1901ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 1902450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 1903450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 1904d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 1905bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 1906bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 1907746480a1SHong Zhang mumps->sym = 0; 1908dcd589f8SShri Abhyankar } else { 190967877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 1910450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 1911bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 1912bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 19136fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 19146fdc2a6dSBarry Smith else mumps->sym = 2; 1915450b117fSShri Abhyankar } 19162877fffaSHong Zhang 19172877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 1918bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 19192877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 19202877fffaSHong Zhang B->spptr = (void*)mumps; 19212205254eSKarl Rupp 1922f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1923746480a1SHong Zhang 19242877fffaSHong Zhang *F = B; 19252877fffaSHong Zhang PetscFunctionReturn(0); 19262877fffaSHong Zhang } 19272877fffaSHong Zhang 1928bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 19292877fffaSHong Zhang #undef __FUNCT__ 1930bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 19318cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 19322877fffaSHong Zhang { 19332877fffaSHong Zhang Mat B; 19342877fffaSHong Zhang PetscErrorCode ierr; 19352877fffaSHong Zhang Mat_MUMPS *mumps; 1936ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 19372877fffaSHong Zhang 19382877fffaSHong Zhang PetscFunctionBegin; 1939ce94432eSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 1940ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 1941251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 19422877fffaSHong Zhang /* Create the factorization matrix */ 1943ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 19442877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 19452877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 1946b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 1947bccb9932SShri Abhyankar if (isSeqSBAIJ) { 19480298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr); 19492205254eSKarl Rupp 195016ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 1951dcd589f8SShri Abhyankar } else { 19520298fd71SBarry Smith ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr); 19532205254eSKarl Rupp 1954bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 1955bccb9932SShri Abhyankar } 1956bccb9932SShri Abhyankar 195767877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 1958bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 195920be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 19602205254eSKarl Rupp 1961bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 1962b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 1963b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 1964b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 1965b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 1966bc6112feSHong Zhang 1967ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 1968ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 1969ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 1970ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 19712205254eSKarl Rupp 1972f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 19736fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 19746fdc2a6dSBarry Smith else mumps->sym = 2; 1975a214ac2aSShri Abhyankar 1976bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 1977bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 1978f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 19792877fffaSHong Zhang B->spptr = (void*)mumps; 19802205254eSKarl Rupp 1981f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1982746480a1SHong Zhang 19832877fffaSHong Zhang *F = B; 19842877fffaSHong Zhang PetscFunctionReturn(0); 19852877fffaSHong Zhang } 198697969023SHong Zhang 1987450b117fSShri Abhyankar #undef __FUNCT__ 1988bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 19898cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 199067877ebaSShri Abhyankar { 199167877ebaSShri Abhyankar Mat B; 199267877ebaSShri Abhyankar PetscErrorCode ierr; 199367877ebaSShri Abhyankar Mat_MUMPS *mumps; 1994ace3abfcSBarry Smith PetscBool isSeqBAIJ; 199567877ebaSShri Abhyankar 199667877ebaSShri Abhyankar PetscFunctionBegin; 199767877ebaSShri Abhyankar /* Create the factorization matrix */ 1998251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 1999ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 200067877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 200167877ebaSShri Abhyankar ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2002bccb9932SShri Abhyankar if (isSeqBAIJ) { 20030298fd71SBarry Smith ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr); 2004bccb9932SShri Abhyankar } else { 20050298fd71SBarry Smith ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr); 2006bccb9932SShri Abhyankar } 2007450b117fSShri Abhyankar 2008b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2009450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2010450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 2011450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 2012bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 2013bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 2014746480a1SHong Zhang mumps->sym = 0; 2015f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 2016bccb9932SShri Abhyankar 2017450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 201820be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 20192205254eSKarl Rupp 2020bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2021bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2022bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2023bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2024bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2025bc6112feSHong Zhang 2026ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2027ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2028ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2029ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 2030450b117fSShri Abhyankar 2031450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 2032bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2033450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 2034450b117fSShri Abhyankar B->spptr = (void*)mumps; 20352205254eSKarl Rupp 2036f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2037746480a1SHong Zhang 2038450b117fSShri Abhyankar *F = B; 2039450b117fSShri Abhyankar PetscFunctionReturn(0); 2040450b117fSShri Abhyankar } 204142c9c57cSBarry Smith 204242c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 204342c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat,MatFactorType,Mat*); 204442c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat,MatFactorType,Mat*); 204542c9c57cSBarry Smith 204642c9c57cSBarry Smith #undef __FUNCT__ 204742c9c57cSBarry Smith #define __FUNCT__ "MatSolverPackageRegister_MUMPS" 204829b38603SBarry Smith PETSC_EXTERN PetscErrorCode MatSolverPackageRegister_MUMPS(void) 204942c9c57cSBarry Smith { 205042c9c57cSBarry Smith PetscErrorCode ierr; 205142c9c57cSBarry Smith 205242c9c57cSBarry Smith PetscFunctionBegin; 205342c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ, MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 205442c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 205542c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ, MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 205642c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 205742c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPISBAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 205842c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ, MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 205942c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 206042c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ, MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 206142c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 206242c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQSBAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 206342c9c57cSBarry Smith PetscFunctionReturn(0); 206442c9c57cSBarry Smith } 206542c9c57cSBarry Smith 2066