11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8397b6df1SKris Buschelman 9397b6df1SKris Buschelman EXTERN_C_BEGIN 10397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 112907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 122907cef9SHong Zhang #include <cmumps_c.h> 132907cef9SHong Zhang #else 14c6db04a5SJed Brown #include <zmumps_c.h> 152907cef9SHong Zhang #endif 162907cef9SHong Zhang #else 172907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 182907cef9SHong Zhang #include <smumps_c.h> 19397b6df1SKris Buschelman #else 20c6db04a5SJed Brown #include <dmumps_c.h> 21397b6df1SKris Buschelman #endif 222907cef9SHong Zhang #endif 23397b6df1SKris Buschelman EXTERN_C_END 24397b6df1SKris Buschelman #define JOB_INIT -1 253d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 263d472b54SHong Zhang #define JOB_FACTNUMERIC 2 273d472b54SHong Zhang #define JOB_SOLVE 3 28397b6df1SKris Buschelman #define JOB_END -2 293d472b54SHong Zhang 302907cef9SHong Zhang /* calls to MUMPS */ 312907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 322907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 332907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 342907cef9SHong Zhang #else 352907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 362907cef9SHong Zhang #endif 372907cef9SHong Zhang #else 382907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 392907cef9SHong Zhang #define PetscMUMPS_c smumps_c 402907cef9SHong Zhang #else 412907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 422907cef9SHong Zhang #endif 432907cef9SHong Zhang #endif 442907cef9SHong Zhang 453d472b54SHong Zhang 46397b6df1SKris Buschelman /* macros s.t. 
indices match MUMPS documentation */ 47397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 48397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 49397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 50a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 51397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 52adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 53397b6df1SKris Buschelman 54397b6df1SKris Buschelman typedef struct { 55397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 562907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 572907cef9SHong Zhang CMUMPS_STRUC_C id; 582907cef9SHong Zhang #else 59397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 602907cef9SHong Zhang #endif 612907cef9SHong Zhang #else 622907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 632907cef9SHong Zhang SMUMPS_STRUC_C id; 64397b6df1SKris Buschelman #else 65397b6df1SKris Buschelman DMUMPS_STRUC_C id; 66397b6df1SKris Buschelman #endif 672907cef9SHong Zhang #endif 682907cef9SHong Zhang 69397b6df1SKris Buschelman MatStructure matstruc; 70c1490034SHong Zhang PetscMPIInt myid,size; 71a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 72397b6df1SKris Buschelman PetscScalar *val; 73397b6df1SKris Buschelman MPI_Comm comm_mumps; 7464e6c443SBarry Smith PetscBool isAIJ,CleanUpMUMPS; 75a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 76801fbe65SHong Zhang VecScatter scat_rhs, scat_sol; /* used by MatSolve() */ 77801fbe65SHong Zhang Vec b_seq,x_seq; 782205254eSKarl Rupp 79bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 80bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 81f0c56d0fSKris Buschelman } Mat_MUMPS; 82f0c56d0fSKris Buschelman 8309573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 84b24902e0SBarry Smith 85397b6df1SKris Buschelman /* 86d341cd04SHong Zhang MatConvertToTriples_A_B - convert Petsc matrix to triples: row[nz], 
col[nz], val[nz] 87d341cd04SHong Zhang 88397b6df1SKris Buschelman input: 8967877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 90397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 91bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 92bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 93397b6df1SKris Buschelman output: 94397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 95397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 96eb9baa12SBarry Smith 97eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 98eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 99eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 
100eb9baa12SBarry Smith 101397b6df1SKris Buschelman */ 10216ebf90aSShri Abhyankar 10316ebf90aSShri Abhyankar #undef __FUNCT__ 10416ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 105bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 106b24902e0SBarry Smith { 107185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 10867877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 109dfbe8321SBarry Smith PetscErrorCode ierr; 110c1490034SHong Zhang PetscInt *row,*col; 11116ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 112397b6df1SKris Buschelman 113397b6df1SKris Buschelman PetscFunctionBegin; 11416ebf90aSShri Abhyankar *v=aa->a; 115bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 1162205254eSKarl Rupp nz = aa->nz; 1172205254eSKarl Rupp ai = aa->i; 1182205254eSKarl Rupp aj = aa->j; 11916ebf90aSShri Abhyankar *nnz = nz; 120785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 121185f6596SHong Zhang col = row + nz; 122185f6596SHong Zhang 12316ebf90aSShri Abhyankar nz = 0; 12416ebf90aSShri Abhyankar for (i=0; i<M; i++) { 12516ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 12667877ebaSShri Abhyankar ajj = aj + ai[i]; 12767877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 12867877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 12916ebf90aSShri Abhyankar } 13016ebf90aSShri Abhyankar } 13116ebf90aSShri Abhyankar *r = row; *c = col; 13216ebf90aSShri Abhyankar } 13316ebf90aSShri Abhyankar PetscFunctionReturn(0); 13416ebf90aSShri Abhyankar } 135397b6df1SKris Buschelman 13616ebf90aSShri Abhyankar #undef __FUNCT__ 13767877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 138bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 13967877ebaSShri Abhyankar { 14067877ebaSShri Abhyankar Mat_SeqBAIJ 
*aa=(Mat_SeqBAIJ*)A->data; 14133d57670SJed Brown const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2; 14233d57670SJed Brown PetscInt bs,M,nz,idx=0,rnz,i,j,k,m; 14367877ebaSShri Abhyankar PetscErrorCode ierr; 14467877ebaSShri Abhyankar PetscInt *row,*col; 14567877ebaSShri Abhyankar 14667877ebaSShri Abhyankar PetscFunctionBegin; 14733d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 14833d57670SJed Brown M = A->rmap->N/bs; 149cf3759fdSShri Abhyankar *v = aa->a; 150bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 151cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 15267877ebaSShri Abhyankar nz = bs2*aa->nz; 15367877ebaSShri Abhyankar *nnz = nz; 154785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 155185f6596SHong Zhang col = row + nz; 156185f6596SHong Zhang 15767877ebaSShri Abhyankar for (i=0; i<M; i++) { 15867877ebaSShri Abhyankar ajj = aj + ai[i]; 15967877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 16067877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 16167877ebaSShri Abhyankar for (j=0; j<bs; j++) { 16267877ebaSShri Abhyankar for (m=0; m<bs; m++) { 16367877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 164cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 16567877ebaSShri Abhyankar } 16667877ebaSShri Abhyankar } 16767877ebaSShri Abhyankar } 16867877ebaSShri Abhyankar } 169cf3759fdSShri Abhyankar *r = row; *c = col; 17067877ebaSShri Abhyankar } 17167877ebaSShri Abhyankar PetscFunctionReturn(0); 17267877ebaSShri Abhyankar } 17367877ebaSShri Abhyankar 17467877ebaSShri Abhyankar #undef __FUNCT__ 17516ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 176bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 17716ebf90aSShri Abhyankar { 17867877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 17967877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 18016ebf90aSShri Abhyankar PetscErrorCode ierr; 
18116ebf90aSShri Abhyankar PetscInt *row,*col; 18216ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 18316ebf90aSShri Abhyankar 18416ebf90aSShri Abhyankar PetscFunctionBegin; 185882afa5aSHong Zhang *v = aa->a; 186bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 1872205254eSKarl Rupp nz = aa->nz; 1882205254eSKarl Rupp ai = aa->i; 1892205254eSKarl Rupp aj = aa->j; 1902205254eSKarl Rupp *v = aa->a; 19116ebf90aSShri Abhyankar *nnz = nz; 192785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 193185f6596SHong Zhang col = row + nz; 194185f6596SHong Zhang 19516ebf90aSShri Abhyankar nz = 0; 19616ebf90aSShri Abhyankar for (i=0; i<M; i++) { 19716ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 19867877ebaSShri Abhyankar ajj = aj + ai[i]; 19967877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 20067877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 20116ebf90aSShri Abhyankar } 20216ebf90aSShri Abhyankar } 20316ebf90aSShri Abhyankar *r = row; *c = col; 20416ebf90aSShri Abhyankar } 20516ebf90aSShri Abhyankar PetscFunctionReturn(0); 20616ebf90aSShri Abhyankar } 20716ebf90aSShri Abhyankar 20816ebf90aSShri Abhyankar #undef __FUNCT__ 20916ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 210bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 21116ebf90aSShri Abhyankar { 21267877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 21367877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 21467877ebaSShri Abhyankar const PetscScalar *av,*v1; 21516ebf90aSShri Abhyankar PetscScalar *val; 21616ebf90aSShri Abhyankar PetscErrorCode ierr; 21716ebf90aSShri Abhyankar PetscInt *row,*col; 218829b1710SHong Zhang Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 21916ebf90aSShri Abhyankar 22016ebf90aSShri Abhyankar PetscFunctionBegin; 22116ebf90aSShri Abhyankar ai =aa->i; aj=aa->j;av=aa->a; 22216ebf90aSShri Abhyankar adiag=aa->diag; 
223bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 224829b1710SHong Zhang /* count nz in the uppper triangular part of A */ 225829b1710SHong Zhang nz = 0; 226829b1710SHong Zhang for (i=0; i<M; i++) nz += ai[i+1] - adiag[i]; 22716ebf90aSShri Abhyankar *nnz = nz; 228829b1710SHong Zhang 229185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 230185f6596SHong Zhang col = row + nz; 231185f6596SHong Zhang val = (PetscScalar*)(col + nz); 232185f6596SHong Zhang 23316ebf90aSShri Abhyankar nz = 0; 23416ebf90aSShri Abhyankar for (i=0; i<M; i++) { 23516ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 23667877ebaSShri Abhyankar ajj = aj + adiag[i]; 237cf3759fdSShri Abhyankar v1 = av + adiag[i]; 23867877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 23967877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 24016ebf90aSShri Abhyankar } 24116ebf90aSShri Abhyankar } 24216ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 243397b6df1SKris Buschelman } else { 24416ebf90aSShri Abhyankar nz = 0; val = *v; 24516ebf90aSShri Abhyankar for (i=0; i <M; i++) { 24616ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 24767877ebaSShri Abhyankar ajj = aj + adiag[i]; 24867877ebaSShri Abhyankar v1 = av + adiag[i]; 24967877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 25067877ebaSShri Abhyankar val[nz++] = v1[j]; 25116ebf90aSShri Abhyankar } 25216ebf90aSShri Abhyankar } 25316ebf90aSShri Abhyankar } 25416ebf90aSShri Abhyankar PetscFunctionReturn(0); 25516ebf90aSShri Abhyankar } 25616ebf90aSShri Abhyankar 25716ebf90aSShri Abhyankar #undef __FUNCT__ 25816ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 259bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 26016ebf90aSShri Abhyankar { 26116ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 
26216ebf90aSShri Abhyankar PetscErrorCode ierr; 26316ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 26416ebf90aSShri Abhyankar PetscInt *row,*col; 26516ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 26616ebf90aSShri Abhyankar PetscScalar *val; 267397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 268397b6df1SKris Buschelman Mat_SeqSBAIJ *aa = (Mat_SeqSBAIJ*)(mat->A)->data; 269397b6df1SKris Buschelman Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 27016ebf90aSShri Abhyankar 27116ebf90aSShri Abhyankar PetscFunctionBegin; 272d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 273397b6df1SKris Buschelman av=aa->a; bv=bb->a; 274397b6df1SKris Buschelman 2752205254eSKarl Rupp garray = mat->garray; 2762205254eSKarl Rupp 277bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 27816ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 27916ebf90aSShri Abhyankar *nnz = nz; 280185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 281185f6596SHong Zhang col = row + nz; 282185f6596SHong Zhang val = (PetscScalar*)(col + nz); 283185f6596SHong Zhang 284397b6df1SKris Buschelman *r = row; *c = col; *v = val; 285397b6df1SKris Buschelman } else { 286397b6df1SKris Buschelman row = *r; col = *c; val = *v; 287397b6df1SKris Buschelman } 288397b6df1SKris Buschelman 289028e57e8SHong Zhang jj = 0; irow = rstart; 290397b6df1SKris Buschelman for (i=0; i<m; i++) { 291397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 292397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 293397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 294397b6df1SKris Buschelman bjj = bj + bi[i]; 29516ebf90aSShri Abhyankar v1 = av + ai[i]; 29616ebf90aSShri Abhyankar v2 = bv + bi[i]; 297397b6df1SKris Buschelman 298397b6df1SKris Buschelman /* A-part */ 299397b6df1SKris Buschelman for (j=0; j<countA; j++) { 300bccb9932SShri Abhyankar if (reuse == 
MAT_INITIAL_MATRIX) { 301397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 302397b6df1SKris Buschelman } 30316ebf90aSShri Abhyankar val[jj++] = v1[j]; 304397b6df1SKris Buschelman } 30516ebf90aSShri Abhyankar 30616ebf90aSShri Abhyankar /* B-part */ 30716ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 308bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 309397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 310397b6df1SKris Buschelman } 31116ebf90aSShri Abhyankar val[jj++] = v2[j]; 31216ebf90aSShri Abhyankar } 31316ebf90aSShri Abhyankar irow++; 31416ebf90aSShri Abhyankar } 31516ebf90aSShri Abhyankar PetscFunctionReturn(0); 31616ebf90aSShri Abhyankar } 31716ebf90aSShri Abhyankar 31816ebf90aSShri Abhyankar #undef __FUNCT__ 31916ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 320bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 32116ebf90aSShri Abhyankar { 32216ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 32316ebf90aSShri Abhyankar PetscErrorCode ierr; 32416ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 32516ebf90aSShri Abhyankar PetscInt *row,*col; 32616ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 32716ebf90aSShri Abhyankar PetscScalar *val; 32816ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 32916ebf90aSShri Abhyankar Mat_SeqAIJ *aa = (Mat_SeqAIJ*)(mat->A)->data; 33016ebf90aSShri Abhyankar Mat_SeqAIJ *bb = (Mat_SeqAIJ*)(mat->B)->data; 33116ebf90aSShri Abhyankar 33216ebf90aSShri Abhyankar PetscFunctionBegin; 33316ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 33416ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 33516ebf90aSShri Abhyankar 3362205254eSKarl Rupp garray = mat->garray; 3372205254eSKarl Rupp 338bccb9932SShri Abhyankar if (reuse == 
MAT_INITIAL_MATRIX) { 33916ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 34016ebf90aSShri Abhyankar *nnz = nz; 341185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 342185f6596SHong Zhang col = row + nz; 343185f6596SHong Zhang val = (PetscScalar*)(col + nz); 344185f6596SHong Zhang 34516ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 34616ebf90aSShri Abhyankar } else { 34716ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 34816ebf90aSShri Abhyankar } 34916ebf90aSShri Abhyankar 35016ebf90aSShri Abhyankar jj = 0; irow = rstart; 35116ebf90aSShri Abhyankar for (i=0; i<m; i++) { 35216ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 35316ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 35416ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 35516ebf90aSShri Abhyankar bjj = bj + bi[i]; 35616ebf90aSShri Abhyankar v1 = av + ai[i]; 35716ebf90aSShri Abhyankar v2 = bv + bi[i]; 35816ebf90aSShri Abhyankar 35916ebf90aSShri Abhyankar /* A-part */ 36016ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 361bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 36216ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 36316ebf90aSShri Abhyankar } 36416ebf90aSShri Abhyankar val[jj++] = v1[j]; 36516ebf90aSShri Abhyankar } 36616ebf90aSShri Abhyankar 36716ebf90aSShri Abhyankar /* B-part */ 36816ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 369bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 37016ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 37116ebf90aSShri Abhyankar } 37216ebf90aSShri Abhyankar val[jj++] = v2[j]; 37316ebf90aSShri Abhyankar } 37416ebf90aSShri Abhyankar irow++; 37516ebf90aSShri Abhyankar } 37616ebf90aSShri Abhyankar PetscFunctionReturn(0); 37716ebf90aSShri Abhyankar } 37816ebf90aSShri Abhyankar 37916ebf90aSShri Abhyankar #undef __FUNCT__ 38067877ebaSShri Abhyankar #define __FUNCT__ 
"MatConvertToTriples_mpibaij_mpiaij" 381bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 38267877ebaSShri Abhyankar { 38367877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 38467877ebaSShri Abhyankar Mat_SeqBAIJ *aa = (Mat_SeqBAIJ*)(mat->A)->data; 38567877ebaSShri Abhyankar Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 38667877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 387d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 38833d57670SJed Brown const PetscInt bs2=mat->bs2; 38967877ebaSShri Abhyankar PetscErrorCode ierr; 39033d57670SJed Brown PetscInt bs,nz,i,j,k,n,jj,irow,countA,countB,idx; 39167877ebaSShri Abhyankar PetscInt *row,*col; 39267877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 39367877ebaSShri Abhyankar PetscScalar *val; 39467877ebaSShri Abhyankar 39567877ebaSShri Abhyankar PetscFunctionBegin; 39633d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 397bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 39867877ebaSShri Abhyankar nz = bs2*(aa->nz + bb->nz); 39967877ebaSShri Abhyankar *nnz = nz; 400185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 401185f6596SHong Zhang col = row + nz; 402185f6596SHong Zhang val = (PetscScalar*)(col + nz); 403185f6596SHong Zhang 40467877ebaSShri Abhyankar *r = row; *c = col; *v = val; 40567877ebaSShri Abhyankar } else { 40667877ebaSShri Abhyankar row = *r; col = *c; val = *v; 40767877ebaSShri Abhyankar } 40867877ebaSShri Abhyankar 409d985c460SShri Abhyankar jj = 0; irow = rstart; 41067877ebaSShri Abhyankar for (i=0; i<mbs; i++) { 41167877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 41267877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 41367877ebaSShri Abhyankar ajj = aj + ai[i]; 41467877ebaSShri Abhyankar bjj = bj 
+ bi[i]; 41567877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 41667877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 41767877ebaSShri Abhyankar 41867877ebaSShri Abhyankar idx = 0; 41967877ebaSShri Abhyankar /* A-part */ 42067877ebaSShri Abhyankar for (k=0; k<countA; k++) { 42167877ebaSShri Abhyankar for (j=0; j<bs; j++) { 42267877ebaSShri Abhyankar for (n=0; n<bs; n++) { 423bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 424d985c460SShri Abhyankar row[jj] = irow + n + shift; 425d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 42667877ebaSShri Abhyankar } 42767877ebaSShri Abhyankar val[jj++] = v1[idx++]; 42867877ebaSShri Abhyankar } 42967877ebaSShri Abhyankar } 43067877ebaSShri Abhyankar } 43167877ebaSShri Abhyankar 43267877ebaSShri Abhyankar idx = 0; 43367877ebaSShri Abhyankar /* B-part */ 43467877ebaSShri Abhyankar for (k=0; k<countB; k++) { 43567877ebaSShri Abhyankar for (j=0; j<bs; j++) { 43667877ebaSShri Abhyankar for (n=0; n<bs; n++) { 437bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 438d985c460SShri Abhyankar row[jj] = irow + n + shift; 439d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 44067877ebaSShri Abhyankar } 441d985c460SShri Abhyankar val[jj++] = v2[idx++]; 44267877ebaSShri Abhyankar } 44367877ebaSShri Abhyankar } 44467877ebaSShri Abhyankar } 445d985c460SShri Abhyankar irow += bs; 44667877ebaSShri Abhyankar } 44767877ebaSShri Abhyankar PetscFunctionReturn(0); 44867877ebaSShri Abhyankar } 44967877ebaSShri Abhyankar 45067877ebaSShri Abhyankar #undef __FUNCT__ 45116ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 452bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 45316ebf90aSShri Abhyankar { 45416ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 45516ebf90aSShri Abhyankar PetscErrorCode ierr; 456e0bace9bSHong Zhang PetscInt 
rstart,nz,nza,nzb,i,j,jj,irow,countA,countB; 45716ebf90aSShri Abhyankar PetscInt *row,*col; 45816ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 45916ebf90aSShri Abhyankar PetscScalar *val; 46016ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 46116ebf90aSShri Abhyankar Mat_SeqAIJ *aa =(Mat_SeqAIJ*)(mat->A)->data; 46216ebf90aSShri Abhyankar Mat_SeqAIJ *bb =(Mat_SeqAIJ*)(mat->B)->data; 46316ebf90aSShri Abhyankar 46416ebf90aSShri Abhyankar PetscFunctionBegin; 46516ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 46616ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 46716ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 4682205254eSKarl Rupp 46916ebf90aSShri Abhyankar rstart = A->rmap->rstart; 47016ebf90aSShri Abhyankar 471bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 472e0bace9bSHong Zhang nza = 0; /* num of upper triangular entries in mat->A, including diagonals */ 473e0bace9bSHong Zhang nzb = 0; /* num of upper triangular entries in mat->B */ 47416ebf90aSShri Abhyankar for (i=0; i<m; i++) { 475e0bace9bSHong Zhang nza += (ai[i+1] - adiag[i]); 47616ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 47716ebf90aSShri Abhyankar bjj = bj + bi[i]; 478e0bace9bSHong Zhang for (j=0; j<countB; j++) { 479e0bace9bSHong Zhang if (garray[bjj[j]] > rstart) nzb++; 480e0bace9bSHong Zhang } 481e0bace9bSHong Zhang } 48216ebf90aSShri Abhyankar 483e0bace9bSHong Zhang nz = nza + nzb; /* total nz of upper triangular part of mat */ 48416ebf90aSShri Abhyankar *nnz = nz; 485185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 486185f6596SHong Zhang col = row + nz; 487185f6596SHong Zhang val = (PetscScalar*)(col + nz); 488185f6596SHong Zhang 48916ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 49016ebf90aSShri Abhyankar } else { 49116ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 49216ebf90aSShri Abhyankar } 49316ebf90aSShri Abhyankar 49416ebf90aSShri Abhyankar jj = 0; irow = 
rstart; 49516ebf90aSShri Abhyankar for (i=0; i<m; i++) { 49616ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 49716ebf90aSShri Abhyankar v1 = av + adiag[i]; 49816ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 49916ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 50016ebf90aSShri Abhyankar bjj = bj + bi[i]; 50116ebf90aSShri Abhyankar v2 = bv + bi[i]; 50216ebf90aSShri Abhyankar 50316ebf90aSShri Abhyankar /* A-part */ 50416ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 505bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 50616ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 50716ebf90aSShri Abhyankar } 50816ebf90aSShri Abhyankar val[jj++] = v1[j]; 50916ebf90aSShri Abhyankar } 51016ebf90aSShri Abhyankar 51116ebf90aSShri Abhyankar /* B-part */ 51216ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 51316ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 514bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 51516ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 51616ebf90aSShri Abhyankar } 51716ebf90aSShri Abhyankar val[jj++] = v2[j]; 51816ebf90aSShri Abhyankar } 519397b6df1SKris Buschelman } 520397b6df1SKris Buschelman irow++; 521397b6df1SKris Buschelman } 522397b6df1SKris Buschelman PetscFunctionReturn(0); 523397b6df1SKris Buschelman } 524397b6df1SKris Buschelman 525397b6df1SKris Buschelman #undef __FUNCT__ 52620be8e61SHong Zhang #define __FUNCT__ "MatGetDiagonal_MUMPS" 52720be8e61SHong Zhang PetscErrorCode MatGetDiagonal_MUMPS(Mat A,Vec v) 52820be8e61SHong Zhang { 52920be8e61SHong Zhang PetscFunctionBegin; 53020be8e61SHong Zhang SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Mat type: MUMPS factor"); 53120be8e61SHong Zhang PetscFunctionReturn(0); 53220be8e61SHong Zhang } 53320be8e61SHong Zhang 53420be8e61SHong Zhang #undef __FUNCT__ 5353924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 536dfbe8321SBarry Smith 
PetscErrorCode MatDestroy_MUMPS(Mat A) 537dfbe8321SBarry Smith { 538a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 539dfbe8321SBarry Smith PetscErrorCode ierr; 540b24902e0SBarry Smith 541397b6df1SKris Buschelman PetscFunctionBegin; 542a5e57a09SHong Zhang if (mumps->CleanUpMUMPS) { 543397b6df1SKris Buschelman /* Terminate instance, deallocate memories */ 544a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 545a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr); 546a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 547801fbe65SHong Zhang ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr); 548a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 549a5e57a09SHong Zhang ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr); 550a5e57a09SHong Zhang ierr = PetscFree(mumps->irn);CHKERRQ(ierr); 5512205254eSKarl Rupp 552a5e57a09SHong Zhang mumps->id.job = JOB_END; 553a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 554a5e57a09SHong Zhang ierr = MPI_Comm_free(&(mumps->comm_mumps));CHKERRQ(ierr); 555397b6df1SKris Buschelman } 556a5e57a09SHong Zhang if (mumps->Destroy) { 557a5e57a09SHong Zhang ierr = (mumps->Destroy)(A);CHKERRQ(ierr); 558bf0cc555SLisandro Dalcin } 559bf0cc555SLisandro Dalcin ierr = PetscFree(A->spptr);CHKERRQ(ierr); 560bf0cc555SLisandro Dalcin 56197969023SHong Zhang /* clear composed functions */ 562bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr); 563bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr); 564bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetIcntl_C",NULL);CHKERRQ(ierr); 565bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr); 566bc6112feSHong Zhang ierr = 
PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetCntl_C",NULL);CHKERRQ(ierr); 567bc6112feSHong Zhang 568ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfo_C",NULL);CHKERRQ(ierr); 569ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfog_C",NULL);CHKERRQ(ierr); 570ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfo_C",NULL);CHKERRQ(ierr); 571ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfog_C",NULL);CHKERRQ(ierr); 572397b6df1SKris Buschelman PetscFunctionReturn(0); 573397b6df1SKris Buschelman } 574397b6df1SKris Buschelman 575397b6df1SKris Buschelman #undef __FUNCT__ 576f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 577b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 578b24902e0SBarry Smith { 579a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 580d54de34fSKris Buschelman PetscScalar *array; 58167877ebaSShri Abhyankar Vec b_seq; 582329ec9b3SHong Zhang IS is_iden,is_petsc; 583dfbe8321SBarry Smith PetscErrorCode ierr; 584329ec9b3SHong Zhang PetscInt i; 585883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 586397b6df1SKris Buschelman 587397b6df1SKris Buschelman PetscFunctionBegin; 588883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 589883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. 
Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 590a5e57a09SHong Zhang mumps->id.nrhs = 1; 591a5e57a09SHong Zhang b_seq = mumps->b_seq; 592a5e57a09SHong Zhang if (mumps->size > 1) { 593329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */ 594a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 595a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 596a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 597397b6df1SKris Buschelman } else { /* size == 1 */ 598397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 599397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 600397b6df1SKris Buschelman } 601a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 602a5e57a09SHong Zhang mumps->id.nrhs = 1; 603397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 6042907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 605a5e57a09SHong Zhang mumps->id.rhs = (mumps_complex*)array; 6062907cef9SHong Zhang #else 607a5e57a09SHong Zhang mumps->id.rhs = (mumps_double_complex*)array; 6082907cef9SHong Zhang #endif 609397b6df1SKris Buschelman #else 610a5e57a09SHong Zhang mumps->id.rhs = array; 611397b6df1SKris Buschelman #endif 612397b6df1SKris Buschelman } 613397b6df1SKris Buschelman 614397b6df1SKris Buschelman /* solve phase */ 615329ec9b3SHong Zhang /*-------------*/ 616a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 617a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 618a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 619397b6df1SKris Buschelman 620a5e57a09SHong Zhang if 
(mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 621a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 622a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 623a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 624397b6df1SKris Buschelman } 625a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 626a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 627a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 628a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 629a5e57a09SHong Zhang } 630a5e57a09SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 631a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 6326bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 6336bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 6342205254eSKarl Rupp 635a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 636397b6df1SKris Buschelman } 637a5e57a09SHong Zhang 638a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 639a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 640329ec9b3SHong Zhang } 641397b6df1SKris Buschelman PetscFunctionReturn(0); 642397b6df1SKris Buschelman } 643397b6df1SKris Buschelman 64451d5961aSHong Zhang #undef __FUNCT__ 64551d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 64651d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 64751d5961aSHong Zhang { 648a5e57a09SHong Zhang Mat_MUMPS 
*mumps=(Mat_MUMPS*)A->spptr; 64951d5961aSHong Zhang PetscErrorCode ierr; 65051d5961aSHong Zhang 65151d5961aSHong Zhang PetscFunctionBegin; 652a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 6530ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 654a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 65551d5961aSHong Zhang PetscFunctionReturn(0); 65651d5961aSHong Zhang } 65751d5961aSHong Zhang 658e0b74bf9SHong Zhang #undef __FUNCT__ 659e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 660e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 661e0b74bf9SHong Zhang { 662bda8bf91SBarry Smith PetscErrorCode ierr; 663bda8bf91SBarry Smith PetscBool flg; 6644e34a73bSHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 665801fbe65SHong Zhang PetscInt i,nrhs,m,M,mx; 6662cd7d884SHong Zhang PetscScalar *array,*bray; 667bda8bf91SBarry Smith 668e0b74bf9SHong Zhang PetscFunctionBegin; 6690298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 670801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 6710298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 672801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)X),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 673801fbe65SHong Zhang if (B->rmap->n != X->rmap->n) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B and X must have same row distribution"); 6744e34a73bSHong Zhang 6752cd7d884SHong Zhang ierr = MatGetLocalSize(B,&m,NULL);CHKERRQ(ierr); 6762cd7d884SHong Zhang ierr = MatGetSize(B,&M,&nrhs);CHKERRQ(ierr); 6774e34a73bSHong Zhang 6782cd7d884SHong Zhang if (mumps->size == 1) { 6792cd7d884SHong Zhang /* copy B to X */ 6802cd7d884SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 6812cd7d884SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 
6822cd7d884SHong Zhang for (i=0; i<M*nrhs; i++) array[i] = bray[i]; 6832cd7d884SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 6842cd7d884SHong Zhang 6852cd7d884SHong Zhang mumps->id.nrhs = nrhs; 6862cd7d884SHong Zhang mumps->id.lrhs = M; 6872cd7d884SHong Zhang #if defined(PETSC_USE_COMPLEX) 6882cd7d884SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 6892cd7d884SHong Zhang mumps->id.rhs = (mumps_complex*)array; 6902cd7d884SHong Zhang #else 6912cd7d884SHong Zhang mumps->id.rhs = (mumps_double_complex*)array; 6922cd7d884SHong Zhang #endif 6932cd7d884SHong Zhang #else 6942cd7d884SHong Zhang mumps->id.rhs = array; 6952cd7d884SHong Zhang #endif 696801fbe65SHong Zhang 6972cd7d884SHong Zhang /* solve phase */ 6982cd7d884SHong Zhang /*-------------*/ 6992cd7d884SHong Zhang mumps->id.job = JOB_SOLVE; 7002cd7d884SHong Zhang PetscMUMPS_c(&mumps->id); 7012cd7d884SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 7022cd7d884SHong Zhang 7032cd7d884SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 704801fbe65SHong Zhang } else { /************** parallel case ***************/ 705*74f0fcc7SHong Zhang PetscInt lsol_loc,*isol_loc,*idx,*iidx,*idxx; 706*74f0fcc7SHong Zhang PetscScalar *sol_loc; 707801fbe65SHong Zhang IS is_to,is_from; 708801fbe65SHong Zhang PetscInt k,proc,j; 709801fbe65SHong Zhang const PetscInt *rstart; 710*74f0fcc7SHong Zhang Vec v_mpi,bb_seq; 711*74f0fcc7SHong Zhang VecScatter scat_rhss, scat_sols; 712801fbe65SHong Zhang 713801fbe65SHong Zhang /* create x_seq to hold local solution */ 714801fbe65SHong Zhang lsol_loc = nrhs*mumps->id.INFO(23); /* length of sol_loc */ 715801fbe65SHong Zhang 716801fbe65SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); //save it for MatSovle()!!! 
717801fbe65SHong Zhang 718801fbe65SHong Zhang ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&isol_loc);CHKERRQ(ierr); 719801fbe65SHong Zhang #if defined(PETSC_USE_COMPLEX) 720801fbe65SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 721801fbe65SHong Zhang mumps->id.sol_loc = (mumps_complex*)sol_loc; 722801fbe65SHong Zhang #else 723801fbe65SHong Zhang mumps->id.sol_loc = (mumps_double_complex*)sol_loc; 724801fbe65SHong Zhang #endif 725801fbe65SHong Zhang #else 726801fbe65SHong Zhang mumps->id.sol_loc = sol_loc; 727801fbe65SHong Zhang #endif 728801fbe65SHong Zhang mumps->id.isol_loc = isol_loc; 729801fbe65SHong Zhang 730801fbe65SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 731801fbe65SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 7322cd7d884SHong Zhang 733*74f0fcc7SHong Zhang /* copy rhs matrix B into vector v_mpi */ 734801fbe65SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 735*74f0fcc7SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)B),1,nrhs*m,nrhs*M,(const PetscScalar*)bray,&v_mpi);CHKERRQ(ierr); 736801fbe65SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 737801fbe65SHong Zhang 738*74f0fcc7SHong Zhang /* scatter v_mpi to bb_seq because MUMPS only supports centralized rhs */ 739*74f0fcc7SHong Zhang /* idx: maps from k-th index of v_mpi to (i,j)-th global entry of B; 740801fbe65SHong Zhang iidx: inverse of idx, will be used by scattering xx_seq -> X */ 741801fbe65SHong Zhang ierr = PetscMalloc2(nrhs*M,&idx,nrhs*M,&iidx);CHKERRQ(ierr); 742801fbe65SHong Zhang ierr = MatGetOwnershipRanges(B,&rstart);CHKERRQ(ierr); 743801fbe65SHong Zhang k = 0; 744801fbe65SHong Zhang for (proc=0; proc<mumps->size; proc++){ 745801fbe65SHong Zhang for (j=0; j<nrhs; j++){ 746801fbe65SHong Zhang for (i=rstart[proc]; i<rstart[proc+1]; i++){ 747801fbe65SHong Zhang iidx[j*M + i] = k; 748801fbe65SHong Zhang idx[k++] = j*M + i; 749801fbe65SHong Zhang } 750801fbe65SHong Zhang } 
7512cd7d884SHong Zhang } 7522cd7d884SHong Zhang 753801fbe65SHong Zhang if (!mumps->myid) { 754*74f0fcc7SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,nrhs*M,&bb_seq);CHKERRQ(ierr); 755801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*M,idx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 756801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*M,0,1,&is_from);CHKERRQ(ierr); 757801fbe65SHong Zhang } else { 758*74f0fcc7SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&bb_seq);CHKERRQ(ierr); 759801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_to);CHKERRQ(ierr); 760801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_from);CHKERRQ(ierr); 761801fbe65SHong Zhang } 762*74f0fcc7SHong Zhang ierr = VecScatterCreate(v_mpi,is_from,bb_seq,is_to,&scat_rhss);CHKERRQ(ierr); 763*74f0fcc7SHong Zhang ierr = VecScatterBegin(scat_rhss,v_mpi,bb_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 764801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 765801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 766*74f0fcc7SHong Zhang ierr = VecScatterEnd(scat_rhss,v_mpi,bb_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 767801fbe65SHong Zhang 768801fbe65SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 769*74f0fcc7SHong Zhang ierr = VecGetArray(bb_seq,&bray);CHKERRQ(ierr); 770801fbe65SHong Zhang mumps->id.nrhs = nrhs; 771801fbe65SHong Zhang mumps->id.lrhs = M; 772801fbe65SHong Zhang #if defined(PETSC_USE_COMPLEX) 773801fbe65SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 774801fbe65SHong Zhang mumps->id.rhs = (mumps_complex*)bray; 775801fbe65SHong Zhang #else 776801fbe65SHong Zhang mumps->id.rhs = (mumps_double_complex*)bray; 777801fbe65SHong Zhang #endif 778801fbe65SHong Zhang #else 779801fbe65SHong Zhang mumps->id.rhs = bray; 780801fbe65SHong Zhang #endif 781*74f0fcc7SHong Zhang ierr = VecRestoreArray(bb_seq,&bray);CHKERRQ(ierr); 782801fbe65SHong Zhang } 783801fbe65SHong Zhang 784801fbe65SHong Zhang /* solve phase 
*/ 785801fbe65SHong Zhang /*-------------*/ 786801fbe65SHong Zhang mumps->id.job = JOB_SOLVE; 787801fbe65SHong Zhang PetscMUMPS_c(&mumps->id); 788801fbe65SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 789801fbe65SHong Zhang 790801fbe65SHong Zhang /* put mumps distributed solution to petsc vector xx_mpi, which shares local arrays with solution matrix X */ 791*74f0fcc7SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 792*74f0fcc7SHong Zhang ierr = MatGetLocalSize(X,&mx,NULL);CHKERRQ(ierr); 793*74f0fcc7SHong Zhang ierr = VecPlaceArray(v_mpi,array);CHKERRQ(ierr); 794801fbe65SHong Zhang 795801fbe65SHong Zhang /* create scatter scat_sols */ 796801fbe65SHong Zhang ierr = PetscMalloc1(nrhs*mumps->id.lsol_loc,&idxx);CHKERRQ(ierr); 797801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*mumps->id.lsol_loc,0,1,&is_from);CHKERRQ(ierr); 798801fbe65SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 799801fbe65SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 800801fbe65SHong Zhang idxx[i] = iidx[mumps->id.isol_loc[i]]; 801801fbe65SHong Zhang for (j=1; j<nrhs; j++){ 802801fbe65SHong Zhang idxx[j*mumps->id.lsol_loc+i] = iidx[mumps->id.isol_loc[i]+j*M]; 803801fbe65SHong Zhang } 804801fbe65SHong Zhang } 805801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*mumps->id.lsol_loc,idxx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 806*74f0fcc7SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_from,v_mpi,is_to,&scat_sols);CHKERRQ(ierr); 807*74f0fcc7SHong Zhang ierr = VecScatterBegin(scat_sols,mumps->x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 808801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 809801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 810*74f0fcc7SHong Zhang ierr = VecScatterEnd(scat_sols,mumps->x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 811801fbe65SHong Zhang 
812801fbe65SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 813801fbe65SHong Zhang //ierr = PetscFree2(sol_loc,isol_loc);CHKERRQ(ierr); 814801fbe65SHong Zhang ierr = PetscFree2(idx,iidx);CHKERRQ(ierr); 815801fbe65SHong Zhang ierr = PetscFree(idxx);CHKERRQ(ierr); 816*74f0fcc7SHong Zhang ierr = VecDestroy(&v_mpi);CHKERRQ(ierr); 817*74f0fcc7SHong Zhang ierr = VecDestroy(&bb_seq);CHKERRQ(ierr); 818*74f0fcc7SHong Zhang ierr = VecScatterDestroy(&scat_rhss);CHKERRQ(ierr); 819*74f0fcc7SHong Zhang ierr = VecScatterDestroy(&scat_sols);CHKERRQ(ierr); 820801fbe65SHong Zhang } 821e0b74bf9SHong Zhang PetscFunctionReturn(0); 822e0b74bf9SHong Zhang } 823e0b74bf9SHong Zhang 824ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 825a58c3f20SHong Zhang /* 826a58c3f20SHong Zhang input: 827a58c3f20SHong Zhang F: numeric factor 828a58c3f20SHong Zhang output: 829a58c3f20SHong Zhang nneg: total number of negative pivots 830a58c3f20SHong Zhang nzero: 0 831a58c3f20SHong Zhang npos: (global dimension of F) - nneg 832a58c3f20SHong Zhang */ 833a58c3f20SHong Zhang 834a58c3f20SHong Zhang #undef __FUNCT__ 835a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 836dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 837a58c3f20SHong Zhang { 838a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 839dfbe8321SBarry Smith PetscErrorCode ierr; 840c1490034SHong Zhang PetscMPIInt size; 841a58c3f20SHong Zhang 842a58c3f20SHong Zhang PetscFunctionBegin; 843ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 844bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 845a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. 
-mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 846ed85ac9fSHong Zhang 847710ac8efSHong Zhang if (nneg) *nneg = mumps->id.INFOG(12); 848ed85ac9fSHong Zhang if (nzero || npos) { 849ed85ac9fSHong Zhang if (mumps->id.ICNTL(24) != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"-mat_mumps_icntl_24 must be set as 1 for null pivot row detection"); 850710ac8efSHong Zhang if (nzero) *nzero = mumps->id.INFOG(28); 851710ac8efSHong Zhang if (npos) *npos = F->rmap->N - (mumps->id.INFOG(12) + mumps->id.INFOG(28)); 852a58c3f20SHong Zhang } 853a58c3f20SHong Zhang PetscFunctionReturn(0); 854a58c3f20SHong Zhang } 855ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 856a58c3f20SHong Zhang 857397b6df1SKris Buschelman #undef __FUNCT__ 858f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 8590481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 860af281ebdSHong Zhang { 861a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->spptr; 8626849ba73SBarry Smith PetscErrorCode ierr; 863e09efc27SHong Zhang Mat F_diag; 864ace3abfcSBarry Smith PetscBool isMPIAIJ; 865397b6df1SKris Buschelman 866397b6df1SKris Buschelman PetscFunctionBegin; 867a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 868397b6df1SKris Buschelman 869397b6df1SKris Buschelman /* numerical factorization phase */ 870329ec9b3SHong Zhang /*-------------------------------*/ 871a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 8724e34a73bSHong Zhang if (!mumps->id.ICNTL(18)) { /* A is centralized */ 873a5e57a09SHong Zhang if (!mumps->myid) { 874397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 8752907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 876a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 8772907cef9SHong Zhang #else 878a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 
8792907cef9SHong Zhang #endif 880397b6df1SKris Buschelman #else 881a5e57a09SHong Zhang mumps->id.a = mumps->val; 882397b6df1SKris Buschelman #endif 883397b6df1SKris Buschelman } 884397b6df1SKris Buschelman } else { 885397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 8862907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 887a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 8882907cef9SHong Zhang #else 889a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 8902907cef9SHong Zhang #endif 891397b6df1SKris Buschelman #else 892a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 893397b6df1SKris Buschelman #endif 894397b6df1SKris Buschelman } 895a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 896a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 897151787a6SHong Zhang if (mumps->id.INFO(1) == -13) { 898151787a6SHong Zhang if (mumps->id.INFO(2) < 0) { 899151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",-mumps->id.INFO(2)); 900151787a6SHong Zhang } else { 901151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d bytes\n",mumps->id.INFO(2)); 902151787a6SHong Zhang } 903151787a6SHong Zhang } else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2)); 904397b6df1SKris Buschelman } 905a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 906397b6df1SKris Buschelman 907dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 908a5e57a09SHong Zhang mumps->matstruc = SAME_NONZERO_PATTERN; 909a5e57a09SHong Zhang mumps->CleanUpMUMPS = PETSC_TRUE; 91067877ebaSShri Abhyankar 911a5e57a09SHong Zhang if (mumps->size > 1) { 
91267877ebaSShri Abhyankar PetscInt lsol_loc; 91367877ebaSShri Abhyankar PetscScalar *sol_loc; 9142205254eSKarl Rupp 915c2093ab7SHong Zhang ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 916c2093ab7SHong Zhang if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A; 917c2093ab7SHong Zhang else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A; 918c2093ab7SHong Zhang F_diag->assembled = PETSC_TRUE; 919c2093ab7SHong Zhang 920c2093ab7SHong Zhang /* distributed solution; Create x_seq=sol_loc for repeated use */ 921c2093ab7SHong Zhang if (mumps->x_seq) { 922c2093ab7SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 923c2093ab7SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 924c2093ab7SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 925c2093ab7SHong Zhang } 926a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 927dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 928a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 92967877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 9302907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 931a5e57a09SHong Zhang mumps->id.sol_loc = (mumps_complex*)sol_loc; 9322907cef9SHong Zhang #else 933a5e57a09SHong Zhang mumps->id.sol_loc = (mumps_double_complex*)sol_loc; 9342907cef9SHong Zhang #endif 93567877ebaSShri Abhyankar #else 936a5e57a09SHong Zhang mumps->id.sol_loc = sol_loc; 93767877ebaSShri Abhyankar #endif 938a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 93967877ebaSShri Abhyankar } 940397b6df1SKris Buschelman PetscFunctionReturn(0); 941397b6df1SKris Buschelman } 942397b6df1SKris Buschelman 9439a2535b5SHong Zhang /* Sets MUMPS options from the options database */ 944dcd589f8SShri Abhyankar #undef __FUNCT__ 9459a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 9469a2535b5SHong Zhang PetscErrorCode 
PetscSetMUMPSFromOptions(Mat F, Mat A) 947dcd589f8SShri Abhyankar { 9489a2535b5SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 949dcd589f8SShri Abhyankar PetscErrorCode ierr; 950dcd589f8SShri Abhyankar PetscInt icntl; 951ace3abfcSBarry Smith PetscBool flg; 952dcd589f8SShri Abhyankar 953dcd589f8SShri Abhyankar PetscFunctionBegin; 954ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 9559a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 9569a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 9579a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 9589a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 9599a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 9609a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 961dcd589f8SShri Abhyankar 9629a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 9639a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 9649a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 9659a2535b5SHong Zhang 966d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 9679a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 9689a2535b5SHong Zhang 969d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): computes a 
symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 970dcd589f8SShri Abhyankar if (flg) { 9712205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 9722205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 973dcd589f8SShri Abhyankar } 974e0b74bf9SHong Zhang 9750298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 976d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_9","ICNTL(9): computes the solution using A or A^T","None",mumps->id.ICNTL(9),&mumps->id.ICNTL(9),NULL);CHKERRQ(ierr); handled by MatSolveTranspose_MUMPS() */ 9770298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 978d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to an error analysis (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 979d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): an ordering strategy for symmetric matrices (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 980d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 981d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage increase in the estimated working space","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 982d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): computes the Schur 
complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 9834e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_20","ICNTL(20): the format (dense or sparse) of the right-hand sides","None",mumps->id.ICNTL(20),&mumps->id.ICNTL(20),NULL);CHKERRQ(ierr); -- sparse rhs is not supported in PETSc API */ 984d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_21","ICNTL(21): the distribution (centralized or distributed) of the solution vectors","None",mumps->id.ICNTL(21),&mumps->id.ICNTL(21),NULL);CHKERRQ(ierr); we only use distributed solution vector */ 9859a2535b5SHong Zhang 986d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core factorization and solve (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 9870298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 9880298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 9899a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 9909a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 991d7ebd59bSHong Zhang } 992d7ebd59bSHong Zhang 993d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): compute a solution of a deficient matrix and a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 994d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): drives the solution phase if a Schur complement matrix","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 9952cd7d884SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): the blocking size for multiple right-hand 
sides","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 9960298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 997d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 9980298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 999d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): indicates which factors may be discarded during factorization","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 10004e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_32","ICNTL(32): performs the forward elemination of the right-hand sides during factorization","None",mumps->id.ICNTL(32),&mumps->id.ICNTL(32),NULL);CHKERRQ(ierr); -- not supported by PETSc API */ 10010298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 1002dcd589f8SShri Abhyankar 10030298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 10040298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 10050298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 10060298fd71SBarry Smith ierr = 
PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 10070298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 1008e5bb22a1SHong Zhang 10090298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 1010dcd589f8SShri Abhyankar PetscOptionsEnd(); 1011dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1012dcd589f8SShri Abhyankar } 1013dcd589f8SShri Abhyankar 1014dcd589f8SShri Abhyankar #undef __FUNCT__ 1015dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 1016f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 1017dcd589f8SShri Abhyankar { 1018dcd589f8SShri Abhyankar PetscErrorCode ierr; 1019dcd589f8SShri Abhyankar 1020dcd589f8SShri Abhyankar PetscFunctionBegin; 1021ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 1022ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 1023ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 10242205254eSKarl Rupp 1025f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 1026f697e70eSHong Zhang 1027f697e70eSHong Zhang mumps->id.job = JOB_INIT; 1028f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 1029f697e70eSHong Zhang mumps->id.sym = mumps->sym; 10302907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 1031f697e70eSHong Zhang 1032f697e70eSHong Zhang mumps->CleanUpMUMPS = PETSC_FALSE; 10330298fd71SBarry Smith mumps->scat_rhs = NULL; 10340298fd71SBarry Smith mumps->scat_sol = NULL; 10359a2535b5SHong Zhang 103670544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 
10379a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 10389a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 10399a2535b5SHong Zhang if (mumps->size == 1) { 10409a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 10419a2535b5SHong Zhang } else { 10429a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 10434e34a73bSHong Zhang mumps->id.ICNTL(20) = 0; /* rhs is in dense format */ 104470544d5fSHong Zhang mumps->id.ICNTL(21) = 1; /* distributed solution */ 10459a2535b5SHong Zhang } 1046dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1047dcd589f8SShri Abhyankar } 1048dcd589f8SShri Abhyankar 1049a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 1050397b6df1SKris Buschelman #undef __FUNCT__ 1051f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 10520481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1053b24902e0SBarry Smith { 1054a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1055dcd589f8SShri Abhyankar PetscErrorCode ierr; 105667877ebaSShri Abhyankar Vec b; 105767877ebaSShri Abhyankar IS is_iden; 105867877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1059397b6df1SKris Buschelman 1060397b6df1SKris Buschelman PetscFunctionBegin; 1061a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1062dcd589f8SShri Abhyankar 10639a2535b5SHong Zhang /* Set MUMPS options from the options database */ 10649a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1065dcd589f8SShri Abhyankar 1066a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1067dcd589f8SShri Abhyankar 106867877ebaSShri Abhyankar /* analysis phase */ 106967877ebaSShri Abhyankar /*----------------*/ 1070a5e57a09SHong Zhang mumps->id.job = 
JOB_FACTSYMBOLIC; 1071a5e57a09SHong Zhang mumps->id.n = M; 1072a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 107367877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1074a5e57a09SHong Zhang if (!mumps->myid) { 1075a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1076a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 107767877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 10782907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1079a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 10802907cef9SHong Zhang #else 1081a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 10822907cef9SHong Zhang #endif 108367877ebaSShri Abhyankar #else 1084a5e57a09SHong Zhang mumps->id.a = mumps->val; 108567877ebaSShri Abhyankar #endif 108667877ebaSShri Abhyankar } 1087a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */ 10885248a706SHong Zhang /* 10895248a706SHong Zhang PetscBool flag; 10905248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 10915248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 10925248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 10935248a706SHong Zhang */ 1094a5e57a09SHong Zhang if (!mumps->myid) { 1095e0b74bf9SHong Zhang const PetscInt *idx; 1096e0b74bf9SHong Zhang PetscInt i,*perm_in; 10972205254eSKarl Rupp 1098785e854fSJed Brown ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr); 1099e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 11002205254eSKarl Rupp 1101a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 1102e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! 
*/ 1103e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 1104e0b74bf9SHong Zhang } 1105e0b74bf9SHong Zhang } 110667877ebaSShri Abhyankar } 110767877ebaSShri Abhyankar break; 110867877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1109a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1110a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1111a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 111267877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 11132907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1114a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 11152907cef9SHong Zhang #else 1116a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 11172907cef9SHong Zhang #endif 111867877ebaSShri Abhyankar #else 1119a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 112067877ebaSShri Abhyankar #endif 112167877ebaSShri Abhyankar } 112267877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. 
Create scatter scat_rhs for repeated use in MatSolve() */ 1123a5e57a09SHong Zhang if (!mumps->myid) { 11242cd7d884SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->rmap->N,&mumps->b_seq);CHKERRQ(ierr); 11252cd7d884SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,A->rmap->N,0,1,&is_iden);CHKERRQ(ierr); 112667877ebaSShri Abhyankar } else { 1127a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 112867877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 112967877ebaSShri Abhyankar } 11302a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1131a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 11326bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 11336bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 113467877ebaSShri Abhyankar break; 113567877ebaSShri Abhyankar } 1136a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1137a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 113867877ebaSShri Abhyankar 1139719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1140dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 114151d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 11424e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 1143b24902e0SBarry Smith PetscFunctionReturn(0); 1144b24902e0SBarry Smith } 1145b24902e0SBarry Smith 1146450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 1147450b117fSShri Abhyankar #undef __FUNCT__ 1148450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 1149450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1150450b117fSShri Abhyankar { 1151a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1152dcd589f8SShri 
Abhyankar PetscErrorCode ierr; 115367877ebaSShri Abhyankar Vec b; 115467877ebaSShri Abhyankar IS is_iden; 115567877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1156450b117fSShri Abhyankar 1157450b117fSShri Abhyankar PetscFunctionBegin; 1158a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1159dcd589f8SShri Abhyankar 11609a2535b5SHong Zhang /* Set MUMPS options from the options database */ 11619a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1162dcd589f8SShri Abhyankar 1163a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 116467877ebaSShri Abhyankar 116567877ebaSShri Abhyankar /* analysis phase */ 116667877ebaSShri Abhyankar /*----------------*/ 1167a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1168a5e57a09SHong Zhang mumps->id.n = M; 1169a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 117067877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1171a5e57a09SHong Zhang if (!mumps->myid) { 1172a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1173a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 117467877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 11752907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1176a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 11772907cef9SHong Zhang #else 1178a5e57a09SHong Zhang mumps->id.a = (mumps_double_complex*)mumps->val; 11792907cef9SHong Zhang #endif 118067877ebaSShri Abhyankar #else 1181a5e57a09SHong Zhang mumps->id.a = mumps->val; 118267877ebaSShri Abhyankar #endif 118367877ebaSShri Abhyankar } 118467877ebaSShri Abhyankar } 118567877ebaSShri Abhyankar break; 118667877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1187a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1188a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1189a5e57a09SHong Zhang 
if (mumps->id.ICNTL(6)>1) { 119067877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 11912907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1192a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 11932907cef9SHong Zhang #else 1194a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 11952907cef9SHong Zhang #endif 119667877ebaSShri Abhyankar #else 1197a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 119867877ebaSShri Abhyankar #endif 119967877ebaSShri Abhyankar } 120067877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1201a5e57a09SHong Zhang if (!mumps->myid) { 1202a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 120367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 120467877ebaSShri Abhyankar } else { 1205a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 120667877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 120767877ebaSShri Abhyankar } 12082a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1209a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 12106bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 12116bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 121267877ebaSShri Abhyankar break; 121367877ebaSShri Abhyankar } 1214a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1215a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 121667877ebaSShri Abhyankar 1217450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1218dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 121951d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1220450b117fSShri 
Abhyankar PetscFunctionReturn(0); 1221450b117fSShri Abhyankar } 1222b24902e0SBarry Smith 1223141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1224397b6df1SKris Buschelman #undef __FUNCT__ 122567877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 122667877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1227b24902e0SBarry Smith { 1228a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1229dcd589f8SShri Abhyankar PetscErrorCode ierr; 123067877ebaSShri Abhyankar Vec b; 123167877ebaSShri Abhyankar IS is_iden; 123267877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1233397b6df1SKris Buschelman 1234397b6df1SKris Buschelman PetscFunctionBegin; 1235a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1236dcd589f8SShri Abhyankar 12379a2535b5SHong Zhang /* Set MUMPS options from the options database */ 12389a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1239dcd589f8SShri Abhyankar 1240a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1241dcd589f8SShri Abhyankar 124267877ebaSShri Abhyankar /* analysis phase */ 124367877ebaSShri Abhyankar /*----------------*/ 1244a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1245a5e57a09SHong Zhang mumps->id.n = M; 1246a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 124767877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1248a5e57a09SHong Zhang if (!mumps->myid) { 1249a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1250a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 125167877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 12522907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1253a5e57a09SHong Zhang mumps->id.a = (mumps_complex*)mumps->val; 12542907cef9SHong Zhang #else 1255a5e57a09SHong Zhang 
mumps->id.a = (mumps_double_complex*)mumps->val; 12562907cef9SHong Zhang #endif 125767877ebaSShri Abhyankar #else 1258a5e57a09SHong Zhang mumps->id.a = mumps->val; 125967877ebaSShri Abhyankar #endif 126067877ebaSShri Abhyankar } 126167877ebaSShri Abhyankar } 126267877ebaSShri Abhyankar break; 126367877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1264a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1265a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1266a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 126767877ebaSShri Abhyankar #if defined(PETSC_USE_COMPLEX) 12682907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 1269a5e57a09SHong Zhang mumps->id.a_loc = (mumps_complex*)mumps->val; 12702907cef9SHong Zhang #else 1271a5e57a09SHong Zhang mumps->id.a_loc = (mumps_double_complex*)mumps->val; 12722907cef9SHong Zhang #endif 127367877ebaSShri Abhyankar #else 1274a5e57a09SHong Zhang mumps->id.a_loc = mumps->val; 127567877ebaSShri Abhyankar #endif 127667877ebaSShri Abhyankar } 127767877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. 
Create scatter scat_rhs for repeated use in MatSolve() */ 1278a5e57a09SHong Zhang if (!mumps->myid) { 1279a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 128067877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 128167877ebaSShri Abhyankar } else { 1282a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 128367877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 128467877ebaSShri Abhyankar } 12852a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1286a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 12876bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 12886bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 128967877ebaSShri Abhyankar break; 129067877ebaSShri Abhyankar } 1291a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1292a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 129367877ebaSShri Abhyankar 12942792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1295dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 129651d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 12974e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 12984e34a73bSHong Zhang #if defined(PETSC_USE_COMPLEX) 12990298fd71SBarry Smith F->ops->getinertia = NULL; 13004e34a73bSHong Zhang #else 13014e34a73bSHong Zhang F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1302db4efbfdSBarry Smith #endif 1303b24902e0SBarry Smith PetscFunctionReturn(0); 1304b24902e0SBarry Smith } 1305b24902e0SBarry Smith 13064e34a73bSHong Zhang //update!!! 
1307397b6df1SKris Buschelman #undef __FUNCT__ 130864e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 130964e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 131074ed9c26SBarry Smith { 1311f6c57405SHong Zhang PetscErrorCode ierr; 131264e6c443SBarry Smith PetscBool iascii; 131364e6c443SBarry Smith PetscViewerFormat format; 1314a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 1315f6c57405SHong Zhang 1316f6c57405SHong Zhang PetscFunctionBegin; 131764e6c443SBarry Smith /* check if matrix is mumps type */ 131864e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 131964e6c443SBarry Smith 1320251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 132164e6c443SBarry Smith if (iascii) { 132264e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 132364e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 132464e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1325a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1326a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1327a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1328a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1329a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1330a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1331a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 
1332a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1333a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1334a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1335a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1336a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1337a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1338a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1339a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1340a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1341a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1342a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1343a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1344f6c57405SHong Zhang } 1345a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1346a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1347a5e57a09SHong Zhang ierr = 
PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1348f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1349a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1350a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1351a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1352a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (somumpstion struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1353a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1354a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1355c0165424SHong Zhang 1356a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1357a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1358a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1359a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1360a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1361a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr); 136242179a6aSHong Zhang 1363a5e57a09SHong 
Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1364a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1365a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1366f6c57405SHong Zhang 1367a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1368a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1369a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absomumpste pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1370a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (vamumpse of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1371a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1372f6c57405SHong Zhang 1373f6c57405SHong Zhang /* infomation local to each processor */ 137434ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 13757b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 1376a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 137734ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 137834ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1379a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g 
\n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 138034ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 138134ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1382a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 138334ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1384f6c57405SHong Zhang 138534ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1386a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 138734ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1388f6c57405SHong Zhang 138934ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1390a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 139134ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1392f6c57405SHong Zhang 139334ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1394a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 139534ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 13967b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr); 1397f6c57405SHong Zhang 1398a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1399a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 
1400a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1401a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1402a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1403f6c57405SHong Zhang 1404a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1405a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1406a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1407a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1408a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1409a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1410a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1411a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d 
\n",mumps->id.INFOG(10));CHKERRQ(ierr); 1412a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1413a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1414a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1415a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1416a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1417a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1418a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 1419a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1420a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr); 1421a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1422a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) 
(size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1423a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1424a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1425a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1426a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 142740d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(28) (after factorization: number of null pivots encountered): %d\n",mumps->id.INFOG(28));CHKERRQ(ierr); 142840d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(29) (after factorization: effective number of entries in the factors (sum over all processors)): %d\n",mumps->id.INFOG(29));CHKERRQ(ierr); 142940d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(30, 31) (after solution: size in Mbytes of memory used during solution phase): %d, %d\n",mumps->id.INFOG(30),mumps->id.INFOG(31));CHKERRQ(ierr); 143040d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(32) (after analysis: type of analysis done): %d\n",mumps->id.INFOG(32));CHKERRQ(ierr); 143140d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(33) (value used for ICNTL(8)): %d\n",mumps->id.INFOG(33));CHKERRQ(ierr); 143240d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(34) (exponent of the determinant if determinant is requested): %d\n",mumps->id.INFOG(34));CHKERRQ(ierr); 1433f6c57405SHong Zhang } 1434f6c57405SHong Zhang 
} 1435cb828f0fSHong Zhang } 1436f6c57405SHong Zhang PetscFunctionReturn(0); 1437f6c57405SHong Zhang } 1438f6c57405SHong Zhang 143935bd34faSBarry Smith #undef __FUNCT__ 144035bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 144135bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 144235bd34faSBarry Smith { 1443cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 144435bd34faSBarry Smith 144535bd34faSBarry Smith PetscFunctionBegin; 144635bd34faSBarry Smith info->block_size = 1.0; 1447cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1448cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 144935bd34faSBarry Smith info->nz_unneeded = 0.0; 145035bd34faSBarry Smith info->assemblies = 0.0; 145135bd34faSBarry Smith info->mallocs = 0.0; 145235bd34faSBarry Smith info->memory = 0.0; 145335bd34faSBarry Smith info->fill_ratio_given = 0; 145435bd34faSBarry Smith info->fill_ratio_needed = 0; 145535bd34faSBarry Smith info->factor_mallocs = 0; 145635bd34faSBarry Smith PetscFunctionReturn(0); 145735bd34faSBarry Smith } 145835bd34faSBarry Smith 14595ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 14605ccb76cbSHong Zhang #undef __FUNCT__ 14615ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 14625ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 14635ccb76cbSHong Zhang { 1464a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 14655ccb76cbSHong Zhang 14665ccb76cbSHong Zhang PetscFunctionBegin; 1467a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 14685ccb76cbSHong Zhang PetscFunctionReturn(0); 14695ccb76cbSHong Zhang } 14705ccb76cbSHong Zhang 14715ccb76cbSHong Zhang #undef __FUNCT__ 1472bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl_MUMPS" 1473bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt *ival) 1474bc6112feSHong Zhang { 1475bc6112feSHong 
Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1476bc6112feSHong Zhang 1477bc6112feSHong Zhang PetscFunctionBegin; 1478bc6112feSHong Zhang *ival = mumps->id.ICNTL(icntl); 1479bc6112feSHong Zhang PetscFunctionReturn(0); 1480bc6112feSHong Zhang } 1481bc6112feSHong Zhang 1482bc6112feSHong Zhang #undef __FUNCT__ 14835ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 14845ccb76cbSHong Zhang /*@ 14855ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 14865ccb76cbSHong Zhang 14875ccb76cbSHong Zhang Logically Collective on Mat 14885ccb76cbSHong Zhang 14895ccb76cbSHong Zhang Input Parameters: 14905ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 14915ccb76cbSHong Zhang . icntl - index of MUMPS parameter array ICNTL() 14925ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 14935ccb76cbSHong Zhang 14945ccb76cbSHong Zhang Options Database: 14955ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 14965ccb76cbSHong Zhang 14975ccb76cbSHong Zhang Level: beginner 14985ccb76cbSHong Zhang 14995ccb76cbSHong Zhang References: MUMPS Users' Guide 15005ccb76cbSHong Zhang 15015ccb76cbSHong Zhang .seealso: MatGetFactor() 15025ccb76cbSHong Zhang @*/ 15035ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 15045ccb76cbSHong Zhang { 15055ccb76cbSHong Zhang PetscErrorCode ierr; 15065ccb76cbSHong Zhang 15075ccb76cbSHong Zhang PetscFunctionBegin; 15085ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 15095ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 15105ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 15115ccb76cbSHong Zhang PetscFunctionReturn(0); 15125ccb76cbSHong Zhang } 15135ccb76cbSHong Zhang 1514bc6112feSHong Zhang #undef __FUNCT__ 1515bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl" 1516a21f80fcSHong Zhang /*@ 1517a21f80fcSHong Zhang MatMumpsGetIcntl - Get MUMPS 
parameter ICNTL() 1518a21f80fcSHong Zhang 1519a21f80fcSHong Zhang Logically Collective on Mat 1520a21f80fcSHong Zhang 1521a21f80fcSHong Zhang Input Parameters: 1522a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1523a21f80fcSHong Zhang - icntl - index of MUMPS parameter array ICNTL() 1524a21f80fcSHong Zhang 1525a21f80fcSHong Zhang Output Parameter: 1526a21f80fcSHong Zhang . ival - value of MUMPS ICNTL(icntl) 1527a21f80fcSHong Zhang 1528a21f80fcSHong Zhang Level: beginner 1529a21f80fcSHong Zhang 1530a21f80fcSHong Zhang References: MUMPS Users' Guide 1531a21f80fcSHong Zhang 1532a21f80fcSHong Zhang .seealso: MatGetFactor() 1533a21f80fcSHong Zhang @*/ 1534bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl(Mat F,PetscInt icntl,PetscInt *ival) 1535bc6112feSHong Zhang { 1536bc6112feSHong Zhang PetscErrorCode ierr; 1537bc6112feSHong Zhang 1538bc6112feSHong Zhang PetscFunctionBegin; 1539bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 1540bc6112feSHong Zhang PetscValidIntPointer(ival,3); 1541bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetIcntl_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 1542bc6112feSHong Zhang PetscFunctionReturn(0); 1543bc6112feSHong Zhang } 1544bc6112feSHong Zhang 15458928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 15468928b65cSHong Zhang #undef __FUNCT__ 15478928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 15488928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 15498928b65cSHong Zhang { 15508928b65cSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 15518928b65cSHong Zhang 15528928b65cSHong Zhang PetscFunctionBegin; 15538928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 15548928b65cSHong Zhang PetscFunctionReturn(0); 15558928b65cSHong Zhang } 15568928b65cSHong Zhang 15578928b65cSHong Zhang #undef __FUNCT__ 1558bc6112feSHong Zhang #define 
__FUNCT__ "MatMumpsGetCntl_MUMPS" 1559bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal *val) 1560bc6112feSHong Zhang { 1561bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1562bc6112feSHong Zhang 1563bc6112feSHong Zhang PetscFunctionBegin; 1564bc6112feSHong Zhang *val = mumps->id.CNTL(icntl); 1565bc6112feSHong Zhang PetscFunctionReturn(0); 1566bc6112feSHong Zhang } 1567bc6112feSHong Zhang 1568bc6112feSHong Zhang #undef __FUNCT__ 15698928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 15708928b65cSHong Zhang /*@ 15718928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 15728928b65cSHong Zhang 15738928b65cSHong Zhang Logically Collective on Mat 15748928b65cSHong Zhang 15758928b65cSHong Zhang Input Parameters: 15768928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 15778928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 15788928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 15798928b65cSHong Zhang 15808928b65cSHong Zhang Options Database: 15818928b65cSHong Zhang . 
-mat_mumps_cntl_<icntl> <val> 15828928b65cSHong Zhang 15838928b65cSHong Zhang Level: beginner 15848928b65cSHong Zhang 15858928b65cSHong Zhang References: MUMPS Users' Guide 15868928b65cSHong Zhang 15878928b65cSHong Zhang .seealso: MatGetFactor() 15888928b65cSHong Zhang @*/ 15898928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 15908928b65cSHong Zhang { 15918928b65cSHong Zhang PetscErrorCode ierr; 15928928b65cSHong Zhang 15938928b65cSHong Zhang PetscFunctionBegin; 15948928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 1595bc6112feSHong Zhang PetscValidLogicalCollectiveReal(F,val,3); 15968928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 15978928b65cSHong Zhang PetscFunctionReturn(0); 15988928b65cSHong Zhang } 15998928b65cSHong Zhang 1600bc6112feSHong Zhang #undef __FUNCT__ 1601bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl" 1602a21f80fcSHong Zhang /*@ 1603a21f80fcSHong Zhang MatMumpsGetCntl - Get MUMPS parameter CNTL() 1604a21f80fcSHong Zhang 1605a21f80fcSHong Zhang Logically Collective on Mat 1606a21f80fcSHong Zhang 1607a21f80fcSHong Zhang Input Parameters: 1608a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1609a21f80fcSHong Zhang - icntl - index of MUMPS parameter array CNTL() 1610a21f80fcSHong Zhang 1611a21f80fcSHong Zhang Output Parameter: 1612a21f80fcSHong Zhang . 
val - value of MUMPS CNTL(icntl) 1613a21f80fcSHong Zhang 1614a21f80fcSHong Zhang Level: beginner 1615a21f80fcSHong Zhang 1616a21f80fcSHong Zhang References: MUMPS Users' Guide 1617a21f80fcSHong Zhang 1618a21f80fcSHong Zhang .seealso: MatGetFactor() 1619a21f80fcSHong Zhang @*/ 1620bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl(Mat F,PetscInt icntl,PetscReal *val) 1621bc6112feSHong Zhang { 1622bc6112feSHong Zhang PetscErrorCode ierr; 1623bc6112feSHong Zhang 1624bc6112feSHong Zhang PetscFunctionBegin; 1625bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 1626bc6112feSHong Zhang PetscValidRealPointer(val,3); 1627bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetCntl_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 1628bc6112feSHong Zhang PetscFunctionReturn(0); 1629bc6112feSHong Zhang } 1630bc6112feSHong Zhang 1631bc6112feSHong Zhang #undef __FUNCT__ 1632ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo_MUMPS" 1633ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo_MUMPS(Mat F,PetscInt icntl,PetscInt *info) 1634bc6112feSHong Zhang { 1635bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1636bc6112feSHong Zhang 1637bc6112feSHong Zhang PetscFunctionBegin; 1638bc6112feSHong Zhang *info = mumps->id.INFO(icntl); 1639bc6112feSHong Zhang PetscFunctionReturn(0); 1640bc6112feSHong Zhang } 1641bc6112feSHong Zhang 1642bc6112feSHong Zhang #undef __FUNCT__ 1643ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog_MUMPS" 1644ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog_MUMPS(Mat F,PetscInt icntl,PetscInt *infog) 1645bc6112feSHong Zhang { 1646bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1647bc6112feSHong Zhang 1648bc6112feSHong Zhang PetscFunctionBegin; 1649bc6112feSHong Zhang *infog = mumps->id.INFOG(icntl); 1650bc6112feSHong Zhang PetscFunctionReturn(0); 1651bc6112feSHong Zhang } 1652bc6112feSHong Zhang 1653bc6112feSHong Zhang #undef __FUNCT__ 1654ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo_MUMPS" 
1655ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfo) 1656bc6112feSHong Zhang { 1657bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1658bc6112feSHong Zhang 1659bc6112feSHong Zhang PetscFunctionBegin; 1660bc6112feSHong Zhang *rinfo = mumps->id.RINFO(icntl); 1661bc6112feSHong Zhang PetscFunctionReturn(0); 1662bc6112feSHong Zhang } 1663bc6112feSHong Zhang 1664bc6112feSHong Zhang #undef __FUNCT__ 1665ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog_MUMPS" 1666ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfog) 1667bc6112feSHong Zhang { 1668bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1669bc6112feSHong Zhang 1670bc6112feSHong Zhang PetscFunctionBegin; 1671bc6112feSHong Zhang *rinfog = mumps->id.RINFOG(icntl); 1672bc6112feSHong Zhang PetscFunctionReturn(0); 1673bc6112feSHong Zhang } 1674bc6112feSHong Zhang 1675bc6112feSHong Zhang #undef __FUNCT__ 1676ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo" 1677a21f80fcSHong Zhang /*@ 1678a21f80fcSHong Zhang MatMumpsGetInfo - Get MUMPS parameter INFO() 1679a21f80fcSHong Zhang 1680a21f80fcSHong Zhang Logically Collective on Mat 1681a21f80fcSHong Zhang 1682a21f80fcSHong Zhang Input Parameters: 1683a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1684a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFO() 1685a21f80fcSHong Zhang 1686a21f80fcSHong Zhang Output Parameter: 1687a21f80fcSHong Zhang . 
ival - value of MUMPS INFO(icntl) 1688a21f80fcSHong Zhang 1689a21f80fcSHong Zhang Level: beginner 1690a21f80fcSHong Zhang 1691a21f80fcSHong Zhang References: MUMPS Users' Guide 1692a21f80fcSHong Zhang 1693a21f80fcSHong Zhang .seealso: MatGetFactor() 1694a21f80fcSHong Zhang @*/ 1695ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo(Mat F,PetscInt icntl,PetscInt *ival) 1696bc6112feSHong Zhang { 1697bc6112feSHong Zhang PetscErrorCode ierr; 1698bc6112feSHong Zhang 1699bc6112feSHong Zhang PetscFunctionBegin; 1700ca810319SHong Zhang PetscValidIntPointer(ival,3); 1701ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfo_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 1702bc6112feSHong Zhang PetscFunctionReturn(0); 1703bc6112feSHong Zhang } 1704bc6112feSHong Zhang 1705bc6112feSHong Zhang #undef __FUNCT__ 1706ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog" 1707a21f80fcSHong Zhang /*@ 1708a21f80fcSHong Zhang MatMumpsGetInfog - Get MUMPS parameter INFOG() 1709a21f80fcSHong Zhang 1710a21f80fcSHong Zhang Logically Collective on Mat 1711a21f80fcSHong Zhang 1712a21f80fcSHong Zhang Input Parameters: 1713a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1714a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFOG() 1715a21f80fcSHong Zhang 1716a21f80fcSHong Zhang Output Parameter: 1717a21f80fcSHong Zhang . 
ival - value of MUMPS INFOG(icntl) 1718a21f80fcSHong Zhang 1719a21f80fcSHong Zhang Level: beginner 1720a21f80fcSHong Zhang 1721a21f80fcSHong Zhang References: MUMPS Users' Guide 1722a21f80fcSHong Zhang 1723a21f80fcSHong Zhang .seealso: MatGetFactor() 1724a21f80fcSHong Zhang @*/ 1725ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog(Mat F,PetscInt icntl,PetscInt *ival) 1726bc6112feSHong Zhang { 1727bc6112feSHong Zhang PetscErrorCode ierr; 1728bc6112feSHong Zhang 1729bc6112feSHong Zhang PetscFunctionBegin; 1730ca810319SHong Zhang PetscValidIntPointer(ival,3); 1731ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfog_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 1732bc6112feSHong Zhang PetscFunctionReturn(0); 1733bc6112feSHong Zhang } 1734bc6112feSHong Zhang 1735bc6112feSHong Zhang #undef __FUNCT__ 1736ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo" 1737a21f80fcSHong Zhang /*@ 1738a21f80fcSHong Zhang MatMumpsGetRinfo - Get MUMPS parameter RINFO() 1739a21f80fcSHong Zhang 1740a21f80fcSHong Zhang Logically Collective on Mat 1741a21f80fcSHong Zhang 1742a21f80fcSHong Zhang Input Parameters: 1743a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1744a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFO() 1745a21f80fcSHong Zhang 1746a21f80fcSHong Zhang Output Parameter: 1747a21f80fcSHong Zhang . 
val - value of MUMPS RINFO(icntl) 1748a21f80fcSHong Zhang 1749a21f80fcSHong Zhang Level: beginner 1750a21f80fcSHong Zhang 1751a21f80fcSHong Zhang References: MUMPS Users' Guide 1752a21f80fcSHong Zhang 1753a21f80fcSHong Zhang .seealso: MatGetFactor() 1754a21f80fcSHong Zhang @*/ 1755ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo(Mat F,PetscInt icntl,PetscReal *val) 1756bc6112feSHong Zhang { 1757bc6112feSHong Zhang PetscErrorCode ierr; 1758bc6112feSHong Zhang 1759bc6112feSHong Zhang PetscFunctionBegin; 1760bc6112feSHong Zhang PetscValidRealPointer(val,3); 1761ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfo_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 1762bc6112feSHong Zhang PetscFunctionReturn(0); 1763bc6112feSHong Zhang } 1764bc6112feSHong Zhang 1765bc6112feSHong Zhang #undef __FUNCT__ 1766ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog" 1767a21f80fcSHong Zhang /*@ 1768a21f80fcSHong Zhang MatMumpsGetRinfog - Get MUMPS parameter RINFOG() 1769a21f80fcSHong Zhang 1770a21f80fcSHong Zhang Logically Collective on Mat 1771a21f80fcSHong Zhang 1772a21f80fcSHong Zhang Input Parameters: 1773a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 1774a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFOG() 1775a21f80fcSHong Zhang 1776a21f80fcSHong Zhang Output Parameter: 1777a21f80fcSHong Zhang . 
val - value of MUMPS RINFOG(icntl) 1778a21f80fcSHong Zhang 1779a21f80fcSHong Zhang Level: beginner 1780a21f80fcSHong Zhang 1781a21f80fcSHong Zhang References: MUMPS Users' Guide 1782a21f80fcSHong Zhang 1783a21f80fcSHong Zhang .seealso: MatGetFactor() 1784a21f80fcSHong Zhang @*/ 1785ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog(Mat F,PetscInt icntl,PetscReal *val) 1786bc6112feSHong Zhang { 1787bc6112feSHong Zhang PetscErrorCode ierr; 1788bc6112feSHong Zhang 1789bc6112feSHong Zhang PetscFunctionBegin; 1790bc6112feSHong Zhang PetscValidRealPointer(val,3); 1791ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfog_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 1792bc6112feSHong Zhang PetscFunctionReturn(0); 1793bc6112feSHong Zhang } 1794bc6112feSHong Zhang 179524b6179bSKris Buschelman /*MC 17962692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 179724b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 179824b6179bSKris Buschelman 179941c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 180024b6179bSKris Buschelman 180124b6179bSKris Buschelman Options Database Keys: 18024e34a73bSHong Zhang + -mat_mumps_icntl_1 <6>: ICNTL(1): output stream for error messages (None) 18034e34a73bSHong Zhang . -mat_mumps_icntl_2 <0>: ICNTL(2): output stream for diagnostic printing, statistics, and warning (None) 18044e34a73bSHong Zhang . -mat_mumps_icntl_3 <0>: ICNTL(3): output stream for global information, collected on the host (None) 18054e34a73bSHong Zhang . -mat_mumps_icntl_4 <0>: ICNTL(4): level of printing (0 to 4) (None) 18064e34a73bSHong Zhang . -mat_mumps_icntl_6 <7>: ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7) (None) 18074e34a73bSHong Zhang . -mat_mumps_icntl_7 <7>: ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis (None) 18084e34a73bSHong Zhang . 
-mat_mumps_icntl_8 <77>: ICNTL(8): scaling strategy (-2 to 8 or 77) (None) 18094e34a73bSHong Zhang . -mat_mumps_icntl_10 <0>: ICNTL(10): max num of refinements (None) 18104e34a73bSHong Zhang . -mat_mumps_icntl_11 <0>: ICNTL(11): statistics related to an error analysis (via -ksp_view) (None) 18114e34a73bSHong Zhang . -mat_mumps_icntl_12 <1>: ICNTL(12): an ordering strategy for symmetric matrices (0 to 3) (None) 18124e34a73bSHong Zhang . -mat_mumps_icntl_13 <0>: ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting (None) 18134e34a73bSHong Zhang . -mat_mumps_icntl_14 <20>: ICNTL(14): percentage increase in the estimated working space (None) 18144e34a73bSHong Zhang . -mat_mumps_icntl_19 <0>: ICNTL(19): computes the Schur complement (None) 18154e34a73bSHong Zhang . -mat_mumps_icntl_22 <0>: ICNTL(22): in-core/out-of-core factorization and solve (0 or 1) (None) 18164e34a73bSHong Zhang . -mat_mumps_icntl_23 <0>: ICNTL(23): max size of the working memory (MB) that can be allocated per processor (None) 18174e34a73bSHong Zhang . -mat_mumps_icntl_24 <0>: ICNTL(24): detection of null pivot rows (0 or 1) (None) 18184e34a73bSHong Zhang . -mat_mumps_icntl_25 <0>: ICNTL(25): compute a solution of a deficient matrix and a null space basis (None) 18194e34a73bSHong Zhang . -mat_mumps_icntl_26 <0>: ICNTL(26): drives the solution phase if a Schur complement matrix (None) 18204e34a73bSHong Zhang . -mat_mumps_icntl_28 <1>: ICNTL(28): use 1 for sequential analysis and ICNTL(7) ordering, or 2 for parallel analysis and ICNTL(29) ordering (None) 18214e34a73bSHong Zhang . -mat_mumps_icntl_29 <0>: ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis (None) 18224e34a73bSHong Zhang . -mat_mumps_icntl_30 <0>: ICNTL(30): compute user-specified set of entries in inv(A) (None) 18234e34a73bSHong Zhang . -mat_mumps_icntl_31 <0>: ICNTL(31): indicates which factors may be discarded during factorization (None) 18244e34a73bSHong Zhang .
-mat_mumps_icntl_33 <0>: ICNTL(33): compute determinant (None) 18254e34a73bSHong Zhang . -mat_mumps_cntl_1 <0.01>: CNTL(1): relative pivoting threshold (None) 18264e34a73bSHong Zhang . -mat_mumps_cntl_2 <1.49012e-08>: CNTL(2): stopping criterion of refinement (None) 18274e34a73bSHong Zhang . -mat_mumps_cntl_3 <0>: CNTL(3): absolute pivoting threshold (None) 18284e34a73bSHong Zhang . -mat_mumps_cntl_4 <-1>: CNTL(4): value for static pivoting (None) 18294e34a73bSHong Zhang - -mat_mumps_cntl_5 <0>: CNTL(5): fixation for null pivots (None) 183024b6179bSKris Buschelman 183124b6179bSKris Buschelman Level: beginner 183224b6179bSKris Buschelman 183341c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 183441c8de11SBarry Smith 183524b6179bSKris Buschelman M*/ 183624b6179bSKris Buschelman 183735bd34faSBarry Smith #undef __FUNCT__ 183835bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 1839f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 184035bd34faSBarry Smith { 184135bd34faSBarry Smith PetscFunctionBegin; 18422692d6eeSBarry Smith *type = MATSOLVERMUMPS; 184335bd34faSBarry Smith PetscFunctionReturn(0); 184435bd34faSBarry Smith } 184535bd34faSBarry Smith 1846bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 18472877fffaSHong Zhang #undef __FUNCT__ 1848bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 18498cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 18502877fffaSHong Zhang { 18512877fffaSHong Zhang Mat B; 18522877fffaSHong Zhang PetscErrorCode ierr; 18532877fffaSHong Zhang Mat_MUMPS *mumps; 1854ace3abfcSBarry Smith PetscBool isSeqAIJ; 18552877fffaSHong Zhang 18562877fffaSHong Zhang PetscFunctionBegin; 18572877fffaSHong Zhang /* Create the factorization matrix */ 1858251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 
1859ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 18602877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 18612877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 1862bccb9932SShri Abhyankar if (isSeqAIJ) { 18630298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr); 1864bccb9932SShri Abhyankar } else { 18650298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr); 1866bccb9932SShri Abhyankar } 18672877fffaSHong Zhang 1868b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 18692205254eSKarl Rupp 18702877fffaSHong Zhang B->ops->view = MatView_MUMPS; 187135bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 187220be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 18732205254eSKarl Rupp 1874bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 1875bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 1876bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 1877bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 1878bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 1879bc6112feSHong Zhang 1880ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 1881ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 1882ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 
1883ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 1884450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 1885450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 1886d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 1887bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 1888bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 1889746480a1SHong Zhang mumps->sym = 0; 1890dcd589f8SShri Abhyankar } else { 189167877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 1892450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 1893bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 1894bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 18956fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 18966fdc2a6dSBarry Smith else mumps->sym = 2; 1897450b117fSShri Abhyankar } 18982877fffaSHong Zhang 18992877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 1900bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 19012877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 19022877fffaSHong Zhang B->spptr = (void*)mumps; 19032205254eSKarl Rupp 1904f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1905746480a1SHong Zhang 19062877fffaSHong Zhang *F = B; 19072877fffaSHong Zhang PetscFunctionReturn(0); 19082877fffaSHong Zhang } 19092877fffaSHong Zhang 1910bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 19112877fffaSHong Zhang #undef __FUNCT__ 1912bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 19138cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 19142877fffaSHong Zhang { 19152877fffaSHong Zhang Mat B; 19162877fffaSHong Zhang 
PetscErrorCode ierr; 19172877fffaSHong Zhang Mat_MUMPS *mumps; 1918ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 19192877fffaSHong Zhang 19202877fffaSHong Zhang PetscFunctionBegin; 1921ce94432eSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 1922ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 1923251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 19242877fffaSHong Zhang /* Create the factorization matrix */ 1925ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 19262877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 19272877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 1928b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 1929bccb9932SShri Abhyankar if (isSeqSBAIJ) { 19300298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr); 19312205254eSKarl Rupp 193216ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 1933dcd589f8SShri Abhyankar } else { 19340298fd71SBarry Smith ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr); 19352205254eSKarl Rupp 1936bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 1937bccb9932SShri Abhyankar } 1938bccb9932SShri Abhyankar 193967877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 1940bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 194120be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 19422205254eSKarl Rupp 1943bdf89e91SBarry Smith ierr = 
PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 1944b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 1945b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 1946b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 1947b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 1948bc6112feSHong Zhang 1949ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 1950ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 1951ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 1952ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 19532205254eSKarl Rupp 1954f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 19556fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 19566fdc2a6dSBarry Smith else mumps->sym = 2; 1957a214ac2aSShri Abhyankar 1958bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 1959bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 1960f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 19612877fffaSHong Zhang B->spptr = (void*)mumps; 19622205254eSKarl Rupp 1963f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 1964746480a1SHong Zhang 19652877fffaSHong Zhang *F = B; 19662877fffaSHong Zhang PetscFunctionReturn(0); 19672877fffaSHong Zhang } 196897969023SHong Zhang 1969450b117fSShri Abhyankar #undef __FUNCT__ 1970bccb9932SShri Abhyankar #define 
__FUNCT__ "MatGetFactor_baij_mumps" 19718cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 197267877ebaSShri Abhyankar { 197367877ebaSShri Abhyankar Mat B; 197467877ebaSShri Abhyankar PetscErrorCode ierr; 197567877ebaSShri Abhyankar Mat_MUMPS *mumps; 1976ace3abfcSBarry Smith PetscBool isSeqBAIJ; 197767877ebaSShri Abhyankar 197867877ebaSShri Abhyankar PetscFunctionBegin; 197967877ebaSShri Abhyankar /* Create the factorization matrix */ 1980251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 1981ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 198267877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 198367877ebaSShri Abhyankar ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 1984bccb9932SShri Abhyankar if (isSeqBAIJ) { 19850298fd71SBarry Smith ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr); 1986bccb9932SShri Abhyankar } else { 19870298fd71SBarry Smith ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr); 1988bccb9932SShri Abhyankar } 1989450b117fSShri Abhyankar 1990b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 1991450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 1992450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 1993450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 1994bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 1995bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 1996746480a1SHong Zhang mumps->sym = 0; 1997f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 1998bccb9932SShri Abhyankar 1999450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 
200020be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 20012205254eSKarl Rupp 2002bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 2003bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2004bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2005bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2006bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2007bc6112feSHong Zhang 2008ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2009ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2010ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2011ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 2012450b117fSShri Abhyankar 2013450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 2014bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2015450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 2016450b117fSShri Abhyankar B->spptr = (void*)mumps; 20172205254eSKarl Rupp 2018f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2019746480a1SHong Zhang 2020450b117fSShri Abhyankar *F = B; 2021450b117fSShri Abhyankar PetscFunctionReturn(0); 2022450b117fSShri Abhyankar } 202342c9c57cSBarry Smith 202442c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 202542c9c57cSBarry Smith PETSC_EXTERN 
PetscErrorCode MatGetFactor_baij_mumps(Mat,MatFactorType,Mat*); 202642c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat,MatFactorType,Mat*); 202742c9c57cSBarry Smith 202842c9c57cSBarry Smith #undef __FUNCT__ 202942c9c57cSBarry Smith #define __FUNCT__ "MatSolverPackageRegister_MUMPS" 203029b38603SBarry Smith PETSC_EXTERN PetscErrorCode MatSolverPackageRegister_MUMPS(void) 203142c9c57cSBarry Smith { 203242c9c57cSBarry Smith PetscErrorCode ierr; 203342c9c57cSBarry Smith 203442c9c57cSBarry Smith PetscFunctionBegin; 203542c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ, MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 203642c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 203742c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ, MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 203842c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 203942c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPISBAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 204042c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ, MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 204142c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 204242c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ, MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 204342c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 204442c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQSBAIJ, MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 204542c9c57cSBarry Smith 
PetscFunctionReturn(0); 204642c9c57cSBarry Smith } 204742c9c57cSBarry Smith 2048