11c2a3de1SBarry Smith 2397b6df1SKris Buschelman /* 3c2b5dc30SHong Zhang Provides an interface to the MUMPS sparse solver 4397b6df1SKris Buschelman */ 551d5961aSHong Zhang 6c6db04a5SJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> /*I "petscmat.h" I*/ 7c6db04a5SJed Brown #include <../src/mat/impls/sbaij/mpi/mpisbaij.h> 8b5fa320bSStefano Zampini #include <petscblaslapack.h> 9397b6df1SKris Buschelman 10397b6df1SKris Buschelman EXTERN_C_BEGIN 11397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 122907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 132907cef9SHong Zhang #include <cmumps_c.h> 142907cef9SHong Zhang #else 15c6db04a5SJed Brown #include <zmumps_c.h> 162907cef9SHong Zhang #endif 172907cef9SHong Zhang #else 182907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 192907cef9SHong Zhang #include <smumps_c.h> 20397b6df1SKris Buschelman #else 21c6db04a5SJed Brown #include <dmumps_c.h> 22397b6df1SKris Buschelman #endif 232907cef9SHong Zhang #endif 24397b6df1SKris Buschelman EXTERN_C_END 25397b6df1SKris Buschelman #define JOB_INIT -1 263d472b54SHong Zhang #define JOB_FACTSYMBOLIC 1 273d472b54SHong Zhang #define JOB_FACTNUMERIC 2 283d472b54SHong Zhang #define JOB_SOLVE 3 29397b6df1SKris Buschelman #define JOB_END -2 303d472b54SHong Zhang 312907cef9SHong Zhang /* calls to MUMPS */ 322907cef9SHong Zhang #if defined(PETSC_USE_COMPLEX) 332907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 342907cef9SHong Zhang #define PetscMUMPS_c cmumps_c 352907cef9SHong Zhang #else 362907cef9SHong Zhang #define PetscMUMPS_c zmumps_c 372907cef9SHong Zhang #endif 382907cef9SHong Zhang #else 392907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 402907cef9SHong Zhang #define PetscMUMPS_c smumps_c 412907cef9SHong Zhang #else 422907cef9SHong Zhang #define PetscMUMPS_c dmumps_c 432907cef9SHong Zhang #endif 442907cef9SHong Zhang #endif 452907cef9SHong Zhang 46940cd9d6SSatish Balay /* declare MumpsScalar */ 47940cd9d6SSatish Balay #if defined(PETSC_USE_COMPLEX) 48940cd9d6SSatish Balay #if defined(PETSC_USE_REAL_SINGLE) 49940cd9d6SSatish Balay #define MumpsScalar mumps_complex 50940cd9d6SSatish Balay #else 51940cd9d6SSatish Balay #define MumpsScalar mumps_double_complex 52940cd9d6SSatish Balay #endif 53940cd9d6SSatish Balay #else 54940cd9d6SSatish Balay #define MumpsScalar PetscScalar 55940cd9d6SSatish Balay #endif 563d472b54SHong Zhang 57397b6df1SKris Buschelman /* macros s.t. indices match MUMPS documentation */ 58397b6df1SKris Buschelman #define ICNTL(I) icntl[(I)-1] 59397b6df1SKris Buschelman #define CNTL(I) cntl[(I)-1] 60397b6df1SKris Buschelman #define INFOG(I) infog[(I)-1] 61a7aca84bSHong Zhang #define INFO(I) info[(I)-1] 62397b6df1SKris Buschelman #define RINFOG(I) rinfog[(I)-1] 63adc1d99fSHong Zhang #define RINFO(I) rinfo[(I)-1] 64397b6df1SKris Buschelman 65397b6df1SKris Buschelman typedef struct { 66397b6df1SKris Buschelman #if defined(PETSC_USE_COMPLEX) 672907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 682907cef9SHong Zhang CMUMPS_STRUC_C id; 692907cef9SHong Zhang #else 70397b6df1SKris Buschelman ZMUMPS_STRUC_C id; 712907cef9SHong Zhang #endif 722907cef9SHong Zhang #else 732907cef9SHong Zhang #if defined(PETSC_USE_REAL_SINGLE) 742907cef9SHong Zhang SMUMPS_STRUC_C id; 75397b6df1SKris Buschelman #else 76397b6df1SKris Buschelman DMUMPS_STRUC_C id; 77397b6df1SKris Buschelman #endif 782907cef9SHong Zhang #endif 792907cef9SHong Zhang 80397b6df1SKris Buschelman MatStructure matstruc; 81c1490034SHong Zhang PetscMPIInt myid,size; 82a5e57a09SHong Zhang PetscInt *irn,*jcn,nz,sym; 83397b6df1SKris Buschelman PetscScalar *val; 84397b6df1SKris Buschelman MPI_Comm comm_mumps; 856f3cc6f9SBarry Smith PetscBool isAIJ; 86a5e57a09SHong Zhang PetscInt ICNTL9_pre; /* check if ICNTL(9) is changed from previous MatSolve */ 87801fbe65SHong Zhang VecScatter scat_rhs, scat_sol; /* used by MatSolve() */ 88801fbe65SHong Zhang Vec b_seq,x_seq; 89b34f08ffSHong Zhang PetscInt ninfo,*info; /* display INFO */ 90b5fa320bSStefano Zampini PetscInt sizeredrhs; 91b5fa320bSStefano Zampini PetscInt *schur_pivots; 9259ac8732SStefano Zampini PetscInt schur_B_lwork; 93b5fa320bSStefano Zampini PetscScalar *schur_work; 9459ac8732SStefano Zampini PetscScalar *schur_sol; 9559ac8732SStefano Zampini PetscInt schur_sizesol; 9659ac8732SStefano Zampini PetscBool schur_factored; 9759ac8732SStefano Zampini PetscBool schur_inverted; 982205254eSKarl Rupp 99bf0cc555SLisandro Dalcin PetscErrorCode (*Destroy)(Mat); 100bccb9932SShri Abhyankar PetscErrorCode (*ConvertToTriples)(Mat, int, MatReuse, int*, int**, int**, PetscScalar**); 101f0c56d0fSKris Buschelman } Mat_MUMPS; 102f0c56d0fSKris Buschelman 10309573ac7SBarry Smith extern PetscErrorCode MatDuplicate_MUMPS(Mat,MatDuplicateOption,Mat*); 104b24902e0SBarry Smith 10559ac8732SStefano Zampini #undef __FUNCT__ 10659ac8732SStefano Zampini #define __FUNCT__ "MatMumpsResetSchur_Private" 10759ac8732SStefano Zampini static PetscErrorCode MatMumpsResetSchur_Private(Mat_MUMPS* mumps) 108b5fa320bSStefano Zampini { 109b5fa320bSStefano Zampini PetscErrorCode ierr; 110b5fa320bSStefano Zampini 111b5fa320bSStefano Zampini PetscFunctionBegin; 11259ac8732SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 11359ac8732SStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 11459ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 11559ac8732SStefano Zampini ierr = PetscFree(mumps->schur_pivots);CHKERRQ(ierr); 11659ac8732SStefano Zampini ierr = PetscFree(mumps->schur_work);CHKERRQ(ierr); 11759ac8732SStefano Zampini mumps->id.size_schur = 0; 11859ac8732SStefano Zampini mumps->id.ICNTL(19) = 0; 11959ac8732SStefano Zampini PetscFunctionReturn(0); 12059ac8732SStefano Zampini } 12159ac8732SStefano Zampini 12259ac8732SStefano Zampini #undef __FUNCT__ 12359ac8732SStefano Zampini #define __FUNCT__ "MatMumpsFactorSchur_Private" 12459ac8732SStefano Zampini static PetscErrorCode MatMumpsFactorSchur_Private(Mat_MUMPS* mumps) 12559ac8732SStefano Zampini { 12659ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 12759ac8732SStefano Zampini PetscErrorCode ierr; 12859ac8732SStefano Zampini 12959ac8732SStefano Zampini PetscFunctionBegin; 13059ac8732SStefano Zampini if (mumps->schur_factored) { 13159ac8732SStefano Zampini PetscFunctionReturn(0); 13259ac8732SStefano Zampini } 13359ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 13459ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 13559ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 13659ac8732SStefano Zampini if (!mumps->schur_pivots) { 13759ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 13859ac8732SStefano Zampini } 13959ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 14059ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrf",LAPACKgetrf_(&B_N,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&B_ierr)); 14159ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 14259ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRF Lapack routine %d",(int)B_ierr); 14359ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 14459ac8732SStefano Zampini char ord[2]; 14559ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 14659ac8732SStefano Zampini sprintf(ord,"L"); 14759ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 14859ac8732SStefano Zampini sprintf(ord,"U"); 14959ac8732SStefano Zampini } 15059ac8732SStefano Zampini if (mumps->id.sym == 2) { 15159ac8732SStefano Zampini if (!mumps->schur_pivots) { 15259ac8732SStefano Zampini PetscScalar lwork; 15359ac8732SStefano Zampini 15459ac8732SStefano Zampini ierr = PetscMalloc1(B_N,&mumps->schur_pivots);CHKERRQ(ierr); 15559ac8732SStefano Zampini mumps->schur_B_lwork=-1; 15659ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 15759ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 15859ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 15959ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYTRF Lapack routine %d",(int)B_ierr); 16059ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 16159ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 16259ac8732SStefano Zampini } 16359ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrf",LAPACKsytrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 16559ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 16659ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRF Lapack routine %d",(int)B_ierr); 16759ac8732SStefano Zampini } else { 16859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 16959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrf",LAPACKpotrf_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_slda,&B_ierr)); 17059ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 17159ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRF Lapack routine %d",(int)B_ierr); 17259ac8732SStefano Zampini } 17359ac8732SStefano Zampini } 17459ac8732SStefano Zampini mumps->schur_factored = PETSC_TRUE; 17559ac8732SStefano Zampini PetscFunctionReturn(0); 17659ac8732SStefano Zampini } 17759ac8732SStefano Zampini 17859ac8732SStefano Zampini #undef __FUNCT__ 17959ac8732SStefano Zampini #define __FUNCT__ "MatMumpsInvertSchur_Private" 18059ac8732SStefano Zampini static PetscErrorCode MatMumpsInvertSchur_Private(Mat_MUMPS* mumps) 18159ac8732SStefano Zampini { 18259ac8732SStefano Zampini PetscBLASInt B_N,B_ierr,B_slda; 18359ac8732SStefano Zampini PetscErrorCode ierr; 18459ac8732SStefano Zampini 18559ac8732SStefano Zampini PetscFunctionBegin; 18659ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 18759ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 18859ac8732SStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 18959ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 19059ac8732SStefano Zampini if (!mumps->schur_work) { 19159ac8732SStefano Zampini PetscScalar lwork; 19259ac8732SStefano Zampini 19359ac8732SStefano Zampini mumps->schur_B_lwork = -1; 19459ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 19559ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,&lwork,&mumps->schur_B_lwork,&B_ierr)); 19659ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 19759ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to GETRI Lapack routine %d",(int)B_ierr); 19859ac8732SStefano Zampini ierr = PetscBLASIntCast((PetscInt)PetscRealPart(lwork),&mumps->schur_B_lwork);CHKERRQ(ierr); 19959ac8732SStefano Zampini ierr = PetscMalloc1(mumps->schur_B_lwork,&mumps->schur_work);CHKERRQ(ierr); 20059ac8732SStefano Zampini } 20159ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20259ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetri",LAPACKgetri_(&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&mumps->schur_B_lwork,&B_ierr)); 20359ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20459ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRI Lapack routine %d",(int)B_ierr); 20559ac8732SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 20659ac8732SStefano Zampini char ord[2]; 20759ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 20859ac8732SStefano Zampini sprintf(ord,"L"); 20959ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 21059ac8732SStefano Zampini sprintf(ord,"U"); 21159ac8732SStefano Zampini } 21259ac8732SStefano Zampini if (mumps->id.sym == 2) { 21359ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytri",LAPACKsytri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,mumps->schur_pivots,mumps->schur_work,&B_ierr)); 21559ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 21659ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRI Lapack routine %d",(int)B_ierr); 21759ac8732SStefano Zampini } else { 21859ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotri",LAPACKpotri_(ord,&B_N,(PetscScalar*)mumps->id.schur,&B_N,&B_ierr)); 22059ac8732SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22159ac8732SStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRI Lapack routine %d",(int)B_ierr); 22259ac8732SStefano Zampini } 22359ac8732SStefano Zampini } 22459ac8732SStefano Zampini mumps->schur_inverted = PETSC_TRUE; 22559ac8732SStefano Zampini PetscFunctionReturn(0); 22659ac8732SStefano Zampini } 22759ac8732SStefano Zampini 22859ac8732SStefano Zampini #undef __FUNCT__ 22959ac8732SStefano Zampini #define __FUNCT__ "MatMumpsSolveSchur_Private" 230e807eca7SStefano Zampini static PetscErrorCode MatMumpsSolveSchur_Private(Mat_MUMPS* mumps, PetscBool sol_in_redrhs) 23159ac8732SStefano Zampini { 23259ac8732SStefano Zampini PetscBLASInt B_N,B_Nrhs,B_ierr,B_slda,B_rlda; 23359ac8732SStefano Zampini PetscScalar one=1.,zero=0.; 23459ac8732SStefano Zampini PetscErrorCode ierr; 23559ac8732SStefano Zampini 23659ac8732SStefano Zampini PetscFunctionBegin; 23759ac8732SStefano Zampini ierr = MatMumpsFactorSchur_Private(mumps);CHKERRQ(ierr); 238b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.size_schur,&B_N);CHKERRQ(ierr); 239b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.schur_lld,&B_slda);CHKERRQ(ierr); 240b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.nrhs,&B_Nrhs);CHKERRQ(ierr); 241b5fa320bSStefano Zampini ierr = PetscBLASIntCast(mumps->id.lredrhs,&B_rlda);CHKERRQ(ierr); 24259ac8732SStefano Zampini if (mumps->schur_inverted) { 24359ac8732SStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 24459ac8732SStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 24559ac8732SStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 24659ac8732SStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 24759ac8732SStefano Zampini mumps->schur_sizesol = sizesol; 248b5fa320bSStefano Zampini } 24959ac8732SStefano Zampini if (!mumps->sym) { 25059ac8732SStefano Zampini char type[2]; 251b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 25259ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 25359ac8732SStefano Zampini sprintf(type,"N"); 254b5fa320bSStefano Zampini } else { 25559ac8732SStefano Zampini sprintf(type,"T"); 256b5fa320bSStefano Zampini } 25759ac8732SStefano Zampini } else { /* stored by columns */ 25859ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 25959ac8732SStefano Zampini sprintf(type,"T"); 26059ac8732SStefano Zampini } else { 26159ac8732SStefano Zampini sprintf(type,"N"); 26259ac8732SStefano Zampini } 26359ac8732SStefano Zampini } 26459ac8732SStefano Zampini PetscStackCallBLAS("BLASgemm",BLASgemm_(type,"N",&B_N,&B_Nrhs,&B_N,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 26559ac8732SStefano Zampini } else { 26659ac8732SStefano Zampini char ord[2]; 26759ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 26859ac8732SStefano Zampini sprintf(ord,"L"); 26959ac8732SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 27059ac8732SStefano Zampini sprintf(ord,"U"); 27159ac8732SStefano Zampini } 27259ac8732SStefano Zampini PetscStackCallBLAS("BLASsymm",BLASsymm_("L",ord,&B_N,&B_Nrhs,&one,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&zero,mumps->schur_sol,&B_rlda)); 27359ac8732SStefano Zampini } 274e807eca7SStefano Zampini if (sol_in_redrhs) { 27559ac8732SStefano Zampini ierr = PetscMemcpy(mumps->id.redrhs,mumps->schur_sol,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 276e807eca7SStefano Zampini } 277a12f35bfSStefano Zampini } else { /* Schur complement has not been inverted */ 278a12f35bfSStefano Zampini MumpsScalar *orhs=NULL; 279a12f35bfSStefano Zampini 280a12f35bfSStefano Zampini if (!sol_in_redrhs) { 281a12f35bfSStefano Zampini PetscInt sizesol = B_Nrhs*B_N; 282a12f35bfSStefano Zampini if (!mumps->schur_sol || sizesol > mumps->schur_sizesol) { 283a12f35bfSStefano Zampini ierr = PetscFree(mumps->schur_sol);CHKERRQ(ierr); 284a12f35bfSStefano Zampini ierr = PetscMalloc1(sizesol,&mumps->schur_sol);CHKERRQ(ierr); 285a12f35bfSStefano Zampini mumps->schur_sizesol = sizesol; 286a12f35bfSStefano Zampini } 287a12f35bfSStefano Zampini orhs = mumps->id.redrhs; 288a12f35bfSStefano Zampini ierr = PetscMemcpy(mumps->schur_sol,mumps->id.redrhs,sizesol*sizeof(PetscScalar));CHKERRQ(ierr); 289a12f35bfSStefano Zampini mumps->id.redrhs = (MumpsScalar*)mumps->schur_sol; 290a12f35bfSStefano Zampini } 29159ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full Schur matrix */ 29259ac8732SStefano Zampini char type[2]; 29359ac8732SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 29459ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 29559ac8732SStefano Zampini sprintf(type,"N"); 29659ac8732SStefano Zampini } else { 29759ac8732SStefano Zampini sprintf(type,"T"); 29859ac8732SStefano Zampini } 29959ac8732SStefano Zampini } else { /* stored by columns */ 30059ac8732SStefano Zampini if (!mumps->id.ICNTL(9)) { /* transpose solve */ 30159ac8732SStefano Zampini sprintf(type,"T"); 30259ac8732SStefano Zampini } else { 30359ac8732SStefano Zampini sprintf(type,"N"); 30459ac8732SStefano Zampini } 30559ac8732SStefano Zampini } 30659ac8732SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 30759ac8732SStefano Zampini PetscStackCallBLAS("LAPACKgetrs",LAPACKgetrs_(type,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 308b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 309b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GETRS Lapack routine %d",(int)B_ierr); 310b5fa320bSStefano Zampini } else { /* either full or lower-triangular (not packed) */ 311b5fa320bSStefano Zampini char ord[2]; 312b5fa320bSStefano Zampini if (mumps->id.ICNTL(19) == 2 || mumps->id.ICNTL(19) == 3) { /* lower triangular stored by columns or full matrix */ 313b5fa320bSStefano Zampini sprintf(ord,"L"); 314b5fa320bSStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 315b5fa320bSStefano Zampini sprintf(ord,"U"); 316b5fa320bSStefano Zampini } 317b5fa320bSStefano Zampini if (mumps->id.sym == 2) { 318b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 31959ac8732SStefano Zampini PetscStackCallBLAS("LAPACKsytrs",LAPACKsytrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,mumps->schur_pivots,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 320b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 321b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYTRS Lapack routine %d",(int)B_ierr); 322b5fa320bSStefano Zampini } else { 323b5fa320bSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 32459ac8732SStefano Zampini PetscStackCallBLAS("LAPACKpotrs",LAPACKpotrs_(ord,&B_N,&B_Nrhs,(PetscScalar*)mumps->id.schur,&B_slda,(PetscScalar*)mumps->id.redrhs,&B_rlda,&B_ierr)); 325b5fa320bSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 326b5fa320bSStefano Zampini if (B_ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in POTRS Lapack routine %d",(int)B_ierr); 327b5fa320bSStefano Zampini } 328b5fa320bSStefano Zampini } 329e807eca7SStefano Zampini if (!sol_in_redrhs) { 330a12f35bfSStefano Zampini mumps->id.redrhs = orhs; 331e807eca7SStefano Zampini } 33259ac8732SStefano Zampini } 333b5fa320bSStefano Zampini PetscFunctionReturn(0); 334b5fa320bSStefano Zampini } 335b5fa320bSStefano Zampini 33659ac8732SStefano Zampini #undef __FUNCT__ 33759ac8732SStefano Zampini #define __FUNCT__ "MatMumpsHandleSchur_Private" 338b8f61ee1SStefano Zampini static PetscErrorCode MatMumpsHandleSchur_Private(Mat_MUMPS* mumps, PetscBool expansion) 339b5fa320bSStefano Zampini { 340b5fa320bSStefano Zampini PetscErrorCode ierr; 341b5fa320bSStefano Zampini 342b5fa320bSStefano Zampini PetscFunctionBegin; 343b5fa320bSStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing when Schur complement has not been computed */ 344b5fa320bSStefano Zampini PetscFunctionReturn(0); 345b5fa320bSStefano Zampini } 346b8f61ee1SStefano Zampini if (!expansion) { /* prepare for the condensation step */ 347b5fa320bSStefano Zampini PetscInt sizeredrhs = mumps->id.nrhs*mumps->id.size_schur; 348b5fa320bSStefano Zampini /* allocate MUMPS internal array to store reduced right-hand sides */ 349b5fa320bSStefano Zampini if (!mumps->id.redrhs || sizeredrhs > mumps->sizeredrhs) { 350b5fa320bSStefano Zampini ierr = PetscFree(mumps->id.redrhs);CHKERRQ(ierr); 351b5fa320bSStefano Zampini mumps->id.lredrhs = mumps->id.size_schur; 352b5fa320bSStefano Zampini ierr = PetscMalloc1(mumps->id.nrhs*mumps->id.lredrhs,&mumps->id.redrhs);CHKERRQ(ierr); 353b5fa320bSStefano Zampini mumps->sizeredrhs = mumps->id.nrhs*mumps->id.lredrhs; 354b5fa320bSStefano Zampini } 355b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 1; /* condensation phase */ 356b5fa320bSStefano Zampini } else { /* prepare for the expansion step */ 357b8f61ee1SStefano Zampini /* solve Schur complement (this has to be done by the MUMPS user, so basically us) */ 358e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 359b5fa320bSStefano Zampini mumps->id.ICNTL(26) = 2; /* expansion phase */ 360b5fa320bSStefano Zampini PetscMUMPS_c(&mumps->id); 361b5fa320bSStefano Zampini if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 362b5fa320bSStefano Zampini /* restore defaults */ 363b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 364b5fa320bSStefano Zampini } 365b5fa320bSStefano Zampini PetscFunctionReturn(0); 366b5fa320bSStefano Zampini } 367b5fa320bSStefano Zampini 368397b6df1SKris Buschelman /* 369d341cd04SHong Zhang MatConvertToTriples_A_B - convert Petsc matrix to triples: row[nz], col[nz], val[nz] 370d341cd04SHong Zhang 371397b6df1SKris Buschelman input: 37267877ebaSShri Abhyankar A - matrix in aij,baij or sbaij (bs=1) format 373397b6df1SKris Buschelman shift - 0: C style output triple; 1: Fortran style output triple. 374bccb9932SShri Abhyankar reuse - MAT_INITIAL_MATRIX: spaces are allocated and values are set for the triple 375bccb9932SShri Abhyankar MAT_REUSE_MATRIX: only the values in v array are updated 376397b6df1SKris Buschelman output: 377397b6df1SKris Buschelman nnz - dim of r, c, and v (number of local nonzero entries of A) 378397b6df1SKris Buschelman r, c, v - row and col index, matrix values (matrix triples) 379eb9baa12SBarry Smith 380eb9baa12SBarry Smith The returned values r, c, and sometimes v are obtained in a single PetscMalloc(). Then in MatDestroy_MUMPS() it is 381eb9baa12SBarry Smith freed with PetscFree((mumps->irn); This is not ideal code, the fact that v is ONLY sometimes part of mumps->irn means 382eb9baa12SBarry Smith that the PetscMalloc() cannot easily be replaced with a PetscMalloc3(). 383eb9baa12SBarry Smith 384397b6df1SKris Buschelman */ 38516ebf90aSShri Abhyankar 38616ebf90aSShri Abhyankar #undef __FUNCT__ 38716ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqaij" 388bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 389b24902e0SBarry Smith { 390185f6596SHong Zhang const PetscInt *ai,*aj,*ajj,M=A->rmap->n; 39167877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 392dfbe8321SBarry Smith PetscErrorCode ierr; 393c1490034SHong Zhang PetscInt *row,*col; 39416ebf90aSShri Abhyankar Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 395397b6df1SKris Buschelman 396397b6df1SKris Buschelman PetscFunctionBegin; 39716ebf90aSShri Abhyankar *v=aa->a; 398bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 3992205254eSKarl Rupp nz = aa->nz; 4002205254eSKarl Rupp ai = aa->i; 4012205254eSKarl Rupp aj = aa->j; 40216ebf90aSShri Abhyankar *nnz = nz; 403785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 404185f6596SHong Zhang col = row + nz; 405185f6596SHong Zhang 40616ebf90aSShri Abhyankar nz = 0; 40716ebf90aSShri Abhyankar for (i=0; i<M; i++) { 40816ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 40967877ebaSShri Abhyankar ajj = aj + ai[i]; 41067877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 41167877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 41216ebf90aSShri Abhyankar } 41316ebf90aSShri Abhyankar } 41416ebf90aSShri Abhyankar *r = row; *c = col; 41516ebf90aSShri Abhyankar } 41616ebf90aSShri Abhyankar PetscFunctionReturn(0); 41716ebf90aSShri Abhyankar } 418397b6df1SKris Buschelman 41916ebf90aSShri Abhyankar #undef __FUNCT__ 42067877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqbaij_seqaij" 421bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqbaij_seqaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 42267877ebaSShri Abhyankar { 42367877ebaSShri Abhyankar Mat_SeqBAIJ *aa=(Mat_SeqBAIJ*)A->data; 42433d57670SJed Brown const PetscInt *ai,*aj,*ajj,bs2 = aa->bs2; 42533d57670SJed Brown PetscInt bs,M,nz,idx=0,rnz,i,j,k,m; 42667877ebaSShri Abhyankar PetscErrorCode ierr; 42767877ebaSShri Abhyankar PetscInt *row,*col; 42867877ebaSShri Abhyankar 42967877ebaSShri Abhyankar PetscFunctionBegin; 43033d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 43133d57670SJed Brown M = A->rmap->N/bs; 432cf3759fdSShri Abhyankar *v = aa->a; 433bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 434cf3759fdSShri Abhyankar ai = aa->i; aj = aa->j; 43567877ebaSShri Abhyankar nz = bs2*aa->nz; 43667877ebaSShri Abhyankar *nnz = nz; 437785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 438185f6596SHong Zhang col = row + nz; 439185f6596SHong Zhang 44067877ebaSShri Abhyankar for (i=0; i<M; i++) { 44167877ebaSShri Abhyankar ajj = aj + ai[i]; 44267877ebaSShri Abhyankar rnz = ai[i+1] - ai[i]; 44367877ebaSShri Abhyankar for (k=0; k<rnz; k++) { 44467877ebaSShri Abhyankar for (j=0; j<bs; j++) { 44567877ebaSShri Abhyankar for (m=0; m<bs; m++) { 44667877ebaSShri Abhyankar row[idx] = i*bs + m + shift; 447cf3759fdSShri Abhyankar col[idx++] = bs*(ajj[k]) + j + shift; 44867877ebaSShri Abhyankar } 44967877ebaSShri Abhyankar } 45067877ebaSShri Abhyankar } 45167877ebaSShri Abhyankar } 452cf3759fdSShri Abhyankar *r = row; *c = col; 45367877ebaSShri Abhyankar } 45467877ebaSShri Abhyankar PetscFunctionReturn(0); 45567877ebaSShri Abhyankar } 45667877ebaSShri Abhyankar 45767877ebaSShri Abhyankar #undef __FUNCT__ 45816ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqsbaij_seqsbaij" 459bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqsbaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 46016ebf90aSShri Abhyankar { 46167877ebaSShri Abhyankar const PetscInt *ai, *aj,*ajj,M=A->rmap->n; 46267877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 46316ebf90aSShri Abhyankar PetscErrorCode ierr; 46416ebf90aSShri Abhyankar PetscInt *row,*col; 46516ebf90aSShri Abhyankar Mat_SeqSBAIJ *aa=(Mat_SeqSBAIJ*)A->data; 46616ebf90aSShri Abhyankar 46716ebf90aSShri Abhyankar PetscFunctionBegin; 468882afa5aSHong Zhang *v = aa->a; 469bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 4702205254eSKarl Rupp nz = aa->nz; 4712205254eSKarl Rupp ai = aa->i; 4722205254eSKarl Rupp aj = aa->j; 4732205254eSKarl Rupp *v = aa->a; 47416ebf90aSShri Abhyankar *nnz = nz; 475785e854fSJed Brown ierr = PetscMalloc1(2*nz, &row);CHKERRQ(ierr); 476185f6596SHong Zhang col = row + nz; 477185f6596SHong Zhang 47816ebf90aSShri Abhyankar nz = 0; 47916ebf90aSShri Abhyankar for (i=0; i<M; i++) { 48016ebf90aSShri Abhyankar rnz = ai[i+1] - ai[i]; 48167877ebaSShri Abhyankar ajj = aj + ai[i]; 48267877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 48367877ebaSShri Abhyankar row[nz] = i+shift; col[nz++] = ajj[j] + shift; 48416ebf90aSShri Abhyankar } 48516ebf90aSShri Abhyankar } 48616ebf90aSShri Abhyankar *r = row; *c = col; 48716ebf90aSShri Abhyankar } 48816ebf90aSShri Abhyankar PetscFunctionReturn(0); 48916ebf90aSShri Abhyankar } 49016ebf90aSShri Abhyankar 49116ebf90aSShri Abhyankar #undef __FUNCT__ 49216ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_seqaij_seqsbaij" 493bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_seqaij_seqsbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 49416ebf90aSShri Abhyankar { 49567877ebaSShri Abhyankar const PetscInt *ai,*aj,*ajj,*adiag,M=A->rmap->n; 49667877ebaSShri Abhyankar PetscInt nz,rnz,i,j; 49767877ebaSShri Abhyankar const PetscScalar *av,*v1; 49816ebf90aSShri Abhyankar PetscScalar *val; 49916ebf90aSShri Abhyankar PetscErrorCode ierr; 50016ebf90aSShri Abhyankar PetscInt *row,*col; 501829b1710SHong Zhang Mat_SeqAIJ *aa=(Mat_SeqAIJ*)A->data; 50216ebf90aSShri Abhyankar 50316ebf90aSShri Abhyankar PetscFunctionBegin; 50416ebf90aSShri Abhyankar ai =aa->i; aj=aa->j;av=aa->a; 50516ebf90aSShri Abhyankar adiag=aa->diag; 506bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 507829b1710SHong Zhang /* count nz in the uppper triangular part of A */ 508829b1710SHong Zhang nz = 0; 509829b1710SHong Zhang for (i=0; i<M; i++) nz += ai[i+1] - adiag[i]; 51016ebf90aSShri Abhyankar *nnz = nz; 511829b1710SHong Zhang 512185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 513185f6596SHong Zhang col = row + nz; 514185f6596SHong Zhang val = (PetscScalar*)(col + nz); 515185f6596SHong Zhang 51616ebf90aSShri Abhyankar nz = 0; 51716ebf90aSShri Abhyankar for (i=0; i<M; i++) { 51816ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 51967877ebaSShri Abhyankar ajj = aj + adiag[i]; 520cf3759fdSShri Abhyankar v1 = av + adiag[i]; 52167877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 52267877ebaSShri Abhyankar row[nz] = i+shift; col[nz] = ajj[j] + shift; val[nz++] = v1[j]; 52316ebf90aSShri Abhyankar } 52416ebf90aSShri Abhyankar } 52516ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 526397b6df1SKris Buschelman } else { 52716ebf90aSShri Abhyankar nz = 0; val = *v; 52816ebf90aSShri Abhyankar for (i=0; i <M; i++) { 52916ebf90aSShri Abhyankar rnz = ai[i+1] - adiag[i]; 53067877ebaSShri Abhyankar ajj = aj + adiag[i]; 53167877ebaSShri Abhyankar v1 = av + adiag[i]; 53267877ebaSShri Abhyankar for (j=0; j<rnz; j++) { 53367877ebaSShri Abhyankar val[nz++] = v1[j]; 53416ebf90aSShri Abhyankar } 53516ebf90aSShri Abhyankar } 53616ebf90aSShri Abhyankar } 53716ebf90aSShri Abhyankar PetscFunctionReturn(0); 53816ebf90aSShri Abhyankar } 53916ebf90aSShri Abhyankar 54016ebf90aSShri Abhyankar #undef __FUNCT__ 54116ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpisbaij_mpisbaij" 542bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpisbaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 54316ebf90aSShri Abhyankar { 54416ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 54516ebf90aSShri Abhyankar PetscErrorCode ierr; 54616ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 54716ebf90aSShri Abhyankar PetscInt *row,*col; 54816ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 54916ebf90aSShri Abhyankar PetscScalar *val; 550397b6df1SKris Buschelman Mat_MPISBAIJ *mat = (Mat_MPISBAIJ*)A->data; 551397b6df1SKris Buschelman Mat_SeqSBAIJ *aa = (Mat_SeqSBAIJ*)(mat->A)->data; 552397b6df1SKris Buschelman Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 55316ebf90aSShri Abhyankar 55416ebf90aSShri Abhyankar PetscFunctionBegin; 555d0f46423SBarry Smith ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 556397b6df1SKris Buschelman av=aa->a; bv=bb->a; 557397b6df1SKris Buschelman 5582205254eSKarl Rupp garray = mat->garray; 5592205254eSKarl Rupp 560bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 56116ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 56216ebf90aSShri Abhyankar *nnz = nz; 563185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 564185f6596SHong Zhang col = row + nz; 565185f6596SHong Zhang val = (PetscScalar*)(col + nz); 566185f6596SHong Zhang 567397b6df1SKris Buschelman *r = row; *c = col; *v = val; 568397b6df1SKris Buschelman } else { 569397b6df1SKris Buschelman row = *r; col = *c; val = *v; 570397b6df1SKris Buschelman } 571397b6df1SKris Buschelman 572028e57e8SHong Zhang jj = 0; irow = rstart; 573397b6df1SKris Buschelman for (i=0; i<m; i++) { 574397b6df1SKris Buschelman ajj = aj + ai[i]; /* ptr to the beginning of this row */ 575397b6df1SKris Buschelman countA = ai[i+1] - ai[i]; 576397b6df1SKris Buschelman countB = bi[i+1] - bi[i]; 577397b6df1SKris Buschelman bjj = bj + bi[i]; 57816ebf90aSShri Abhyankar v1 = av + ai[i]; 57916ebf90aSShri Abhyankar v2 = bv + bi[i]; 580397b6df1SKris Buschelman 581397b6df1SKris Buschelman /* A-part */ 582397b6df1SKris Buschelman for (j=0; j<countA; j++) { 583bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 584397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 585397b6df1SKris Buschelman } 58616ebf90aSShri Abhyankar val[jj++] = v1[j]; 587397b6df1SKris Buschelman } 58816ebf90aSShri Abhyankar 58916ebf90aSShri Abhyankar /* B-part */ 59016ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 591bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 592397b6df1SKris Buschelman row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 593397b6df1SKris Buschelman } 59416ebf90aSShri Abhyankar val[jj++] = v2[j]; 59516ebf90aSShri Abhyankar } 59616ebf90aSShri Abhyankar irow++; 59716ebf90aSShri Abhyankar } 59816ebf90aSShri Abhyankar PetscFunctionReturn(0); 59916ebf90aSShri Abhyankar } 60016ebf90aSShri Abhyankar 60116ebf90aSShri Abhyankar #undef __FUNCT__ 60216ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpiaij" 603bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 60416ebf90aSShri Abhyankar { 60516ebf90aSShri Abhyankar const PetscInt *ai, *aj, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 60616ebf90aSShri Abhyankar PetscErrorCode ierr; 60716ebf90aSShri Abhyankar PetscInt rstart,nz,i,j,jj,irow,countA,countB; 60816ebf90aSShri Abhyankar PetscInt *row,*col; 60916ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 61016ebf90aSShri Abhyankar PetscScalar *val; 61116ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 61216ebf90aSShri Abhyankar Mat_SeqAIJ *aa = (Mat_SeqAIJ*)(mat->A)->data; 61316ebf90aSShri Abhyankar Mat_SeqAIJ *bb = (Mat_SeqAIJ*)(mat->B)->data; 61416ebf90aSShri Abhyankar 61516ebf90aSShri Abhyankar PetscFunctionBegin; 61616ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; bi=bb->i; bj=bb->j; rstart= A->rmap->rstart; 61716ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 61816ebf90aSShri Abhyankar 6192205254eSKarl Rupp garray = mat->garray; 6202205254eSKarl Rupp 621bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 62216ebf90aSShri Abhyankar nz = aa->nz + bb->nz; 62316ebf90aSShri Abhyankar *nnz = nz; 624185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 625185f6596SHong Zhang col = row + nz; 626185f6596SHong Zhang val = (PetscScalar*)(col + nz); 627185f6596SHong Zhang 62816ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 62916ebf90aSShri Abhyankar } else { 63016ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 63116ebf90aSShri Abhyankar } 63216ebf90aSShri Abhyankar 63316ebf90aSShri Abhyankar jj = 0; irow = rstart; 63416ebf90aSShri Abhyankar for (i=0; i<m; i++) { 63516ebf90aSShri Abhyankar ajj = aj + ai[i]; /* ptr to the beginning of this row */ 63616ebf90aSShri Abhyankar countA = ai[i+1] - ai[i]; 63716ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 63816ebf90aSShri Abhyankar bjj = bj + bi[i]; 63916ebf90aSShri Abhyankar v1 = av + ai[i]; 64016ebf90aSShri Abhyankar v2 = bv + bi[i]; 64116ebf90aSShri Abhyankar 64216ebf90aSShri Abhyankar /* A-part */ 64316ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 644bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 64516ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 64616ebf90aSShri Abhyankar } 64716ebf90aSShri Abhyankar val[jj++] = v1[j]; 64816ebf90aSShri Abhyankar } 64916ebf90aSShri Abhyankar 65016ebf90aSShri Abhyankar /* B-part */ 65116ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 652bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 65316ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 65416ebf90aSShri Abhyankar } 65516ebf90aSShri Abhyankar val[jj++] = v2[j]; 65616ebf90aSShri Abhyankar } 65716ebf90aSShri Abhyankar irow++; 65816ebf90aSShri Abhyankar } 65916ebf90aSShri Abhyankar PetscFunctionReturn(0); 66016ebf90aSShri Abhyankar } 66116ebf90aSShri Abhyankar 66216ebf90aSShri Abhyankar #undef __FUNCT__ 66367877ebaSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpibaij_mpiaij" 664bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpibaij_mpiaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 66567877ebaSShri Abhyankar { 66667877ebaSShri Abhyankar Mat_MPIBAIJ *mat = (Mat_MPIBAIJ*)A->data; 66767877ebaSShri Abhyankar Mat_SeqBAIJ *aa = (Mat_SeqBAIJ*)(mat->A)->data; 66867877ebaSShri Abhyankar Mat_SeqBAIJ *bb = (Mat_SeqBAIJ*)(mat->B)->data; 66967877ebaSShri Abhyankar const PetscInt *ai = aa->i, *bi = bb->i, *aj = aa->j, *bj = bb->j,*ajj, *bjj; 670d985c460SShri Abhyankar const PetscInt *garray = mat->garray,mbs=mat->mbs,rstart=A->rmap->rstart; 67133d57670SJed Brown const PetscInt bs2=mat->bs2; 67267877ebaSShri Abhyankar PetscErrorCode ierr; 67333d57670SJed Brown PetscInt bs,nz,i,j,k,n,jj,irow,countA,countB,idx; 67467877ebaSShri Abhyankar PetscInt *row,*col; 67567877ebaSShri Abhyankar const PetscScalar *av=aa->a, *bv=bb->a,*v1,*v2; 67667877ebaSShri Abhyankar PetscScalar *val; 67767877ebaSShri Abhyankar 67867877ebaSShri Abhyankar PetscFunctionBegin; 67933d57670SJed Brown ierr = MatGetBlockSize(A,&bs);CHKERRQ(ierr); 680bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 68167877ebaSShri Abhyankar nz = bs2*(aa->nz + bb->nz); 68267877ebaSShri Abhyankar *nnz = nz; 683185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 684185f6596SHong Zhang col = row + nz; 685185f6596SHong Zhang val = (PetscScalar*)(col + nz); 686185f6596SHong Zhang 68767877ebaSShri Abhyankar *r = row; *c = col; *v = val; 68867877ebaSShri Abhyankar } else { 68967877ebaSShri Abhyankar row = *r; col = *c; val = *v; 69067877ebaSShri Abhyankar } 69167877ebaSShri Abhyankar 692d985c460SShri Abhyankar jj = 0; irow = rstart; 69367877ebaSShri Abhyankar for (i=0; i<mbs; i++) { 69467877ebaSShri Abhyankar countA = ai[i+1] - ai[i]; 69567877ebaSShri Abhyankar countB = bi[i+1] - bi[i]; 69667877ebaSShri Abhyankar ajj = aj + ai[i]; 69767877ebaSShri Abhyankar bjj = bj + bi[i]; 69867877ebaSShri Abhyankar v1 = av + bs2*ai[i]; 69967877ebaSShri Abhyankar v2 = bv + bs2*bi[i]; 70067877ebaSShri Abhyankar 70167877ebaSShri Abhyankar idx = 0; 70267877ebaSShri Abhyankar /* A-part */ 70367877ebaSShri Abhyankar for (k=0; k<countA; k++) { 70467877ebaSShri Abhyankar for (j=0; j<bs; j++) { 70567877ebaSShri Abhyankar for (n=0; n<bs; n++) { 706bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 707d985c460SShri Abhyankar row[jj] = irow + n + shift; 708d985c460SShri Abhyankar col[jj] = rstart + bs*ajj[k] + j + shift; 70967877ebaSShri Abhyankar } 71067877ebaSShri Abhyankar val[jj++] = v1[idx++]; 71167877ebaSShri Abhyankar } 71267877ebaSShri Abhyankar } 71367877ebaSShri Abhyankar } 71467877ebaSShri Abhyankar 71567877ebaSShri Abhyankar idx = 0; 71667877ebaSShri Abhyankar /* B-part */ 71767877ebaSShri Abhyankar for (k=0; k<countB; k++) { 71867877ebaSShri Abhyankar for (j=0; j<bs; j++) { 71967877ebaSShri Abhyankar for (n=0; n<bs; n++) { 720bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 721d985c460SShri Abhyankar row[jj] = irow + n + shift; 722d985c460SShri Abhyankar col[jj] = bs*garray[bjj[k]] + j + shift; 72367877ebaSShri Abhyankar } 724d985c460SShri Abhyankar val[jj++] = v2[idx++]; 72567877ebaSShri Abhyankar } 72667877ebaSShri Abhyankar } 72767877ebaSShri Abhyankar } 728d985c460SShri Abhyankar irow += bs; 72967877ebaSShri Abhyankar } 73067877ebaSShri Abhyankar PetscFunctionReturn(0); 73167877ebaSShri Abhyankar } 73267877ebaSShri Abhyankar 73367877ebaSShri Abhyankar #undef __FUNCT__ 73416ebf90aSShri Abhyankar #define __FUNCT__ "MatConvertToTriples_mpiaij_mpisbaij" 735bccb9932SShri Abhyankar PetscErrorCode MatConvertToTriples_mpiaij_mpisbaij(Mat A,int shift,MatReuse reuse,int *nnz,int **r, int **c, PetscScalar **v) 73616ebf90aSShri Abhyankar { 73716ebf90aSShri Abhyankar const PetscInt *ai, *aj,*adiag, *bi, *bj,*garray,m=A->rmap->n,*ajj,*bjj; 73816ebf90aSShri Abhyankar PetscErrorCode ierr; 739e0bace9bSHong Zhang PetscInt rstart,nz,nza,nzb,i,j,jj,irow,countA,countB; 74016ebf90aSShri Abhyankar PetscInt *row,*col; 74116ebf90aSShri Abhyankar const PetscScalar *av, *bv,*v1,*v2; 74216ebf90aSShri Abhyankar PetscScalar *val; 74316ebf90aSShri Abhyankar Mat_MPIAIJ *mat = (Mat_MPIAIJ*)A->data; 74416ebf90aSShri Abhyankar Mat_SeqAIJ *aa =(Mat_SeqAIJ*)(mat->A)->data; 74516ebf90aSShri Abhyankar Mat_SeqAIJ *bb =(Mat_SeqAIJ*)(mat->B)->data; 74616ebf90aSShri Abhyankar 74716ebf90aSShri Abhyankar PetscFunctionBegin; 74816ebf90aSShri Abhyankar ai=aa->i; aj=aa->j; adiag=aa->diag; 74916ebf90aSShri Abhyankar bi=bb->i; bj=bb->j; garray = mat->garray; 75016ebf90aSShri Abhyankar av=aa->a; bv=bb->a; 7512205254eSKarl Rupp 75216ebf90aSShri Abhyankar rstart = A->rmap->rstart; 75316ebf90aSShri Abhyankar 754bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 755e0bace9bSHong Zhang nza = 0; /* num of upper triangular entries in mat->A, including diagonals */ 756e0bace9bSHong Zhang nzb = 0; /* num of upper triangular entries in mat->B */ 75716ebf90aSShri Abhyankar for (i=0; i<m; i++) { 758e0bace9bSHong Zhang nza += (ai[i+1] - adiag[i]); 75916ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 76016ebf90aSShri Abhyankar bjj = bj + bi[i]; 761e0bace9bSHong Zhang for (j=0; j<countB; j++) { 762e0bace9bSHong Zhang if (garray[bjj[j]] > rstart) nzb++; 763e0bace9bSHong Zhang } 764e0bace9bSHong Zhang } 76516ebf90aSShri Abhyankar 766e0bace9bSHong Zhang nz = nza + nzb; /* total nz of upper triangular part of mat */ 76716ebf90aSShri Abhyankar *nnz = nz; 768185f6596SHong Zhang ierr = PetscMalloc((2*nz*sizeof(PetscInt)+nz*sizeof(PetscScalar)), &row);CHKERRQ(ierr); 769185f6596SHong Zhang col = row + nz; 770185f6596SHong Zhang val = (PetscScalar*)(col + nz); 771185f6596SHong Zhang 77216ebf90aSShri Abhyankar *r = row; *c = col; *v = val; 77316ebf90aSShri Abhyankar } else { 77416ebf90aSShri Abhyankar row = *r; col = *c; val = *v; 77516ebf90aSShri Abhyankar } 77616ebf90aSShri Abhyankar 77716ebf90aSShri Abhyankar jj = 0; irow = rstart; 77816ebf90aSShri Abhyankar for (i=0; i<m; i++) { 77916ebf90aSShri Abhyankar ajj = aj + adiag[i]; /* ptr to the beginning of the diagonal of this row */ 78016ebf90aSShri Abhyankar v1 = av + adiag[i]; 78116ebf90aSShri Abhyankar countA = ai[i+1] - adiag[i]; 78216ebf90aSShri Abhyankar countB = bi[i+1] - bi[i]; 78316ebf90aSShri Abhyankar bjj = bj + bi[i]; 78416ebf90aSShri Abhyankar v2 = bv + bi[i]; 78516ebf90aSShri Abhyankar 78616ebf90aSShri Abhyankar /* A-part */ 78716ebf90aSShri Abhyankar for (j=0; j<countA; j++) { 788bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 78916ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = rstart + ajj[j] + shift; 79016ebf90aSShri Abhyankar } 79116ebf90aSShri Abhyankar val[jj++] = v1[j]; 79216ebf90aSShri Abhyankar } 79316ebf90aSShri Abhyankar 79416ebf90aSShri Abhyankar /* B-part */ 79516ebf90aSShri Abhyankar for (j=0; j < countB; j++) { 79616ebf90aSShri Abhyankar if (garray[bjj[j]] > rstart) { 797bccb9932SShri Abhyankar if (reuse == MAT_INITIAL_MATRIX) { 79816ebf90aSShri Abhyankar row[jj] = irow + shift; col[jj] = garray[bjj[j]] + shift; 79916ebf90aSShri Abhyankar } 80016ebf90aSShri Abhyankar val[jj++] = v2[j]; 80116ebf90aSShri Abhyankar } 802397b6df1SKris Buschelman } 803397b6df1SKris Buschelman irow++; 804397b6df1SKris Buschelman } 805397b6df1SKris Buschelman PetscFunctionReturn(0); 806397b6df1SKris Buschelman } 807397b6df1SKris Buschelman 808397b6df1SKris Buschelman #undef __FUNCT__ 80920be8e61SHong Zhang #define __FUNCT__ "MatGetDiagonal_MUMPS" 81020be8e61SHong Zhang PetscErrorCode MatGetDiagonal_MUMPS(Mat A,Vec v) 81120be8e61SHong Zhang { 81220be8e61SHong Zhang PetscFunctionBegin; 81320be8e61SHong Zhang SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Mat type: MUMPS factor"); 81420be8e61SHong Zhang PetscFunctionReturn(0); 81520be8e61SHong Zhang } 81620be8e61SHong Zhang 81720be8e61SHong Zhang #undef __FUNCT__ 8183924e44cSKris Buschelman #define __FUNCT__ "MatDestroy_MUMPS" 819dfbe8321SBarry Smith PetscErrorCode MatDestroy_MUMPS(Mat A) 820dfbe8321SBarry Smith { 821a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 822dfbe8321SBarry Smith PetscErrorCode ierr; 823b24902e0SBarry Smith 824397b6df1SKris Buschelman PetscFunctionBegin; 825a5e57a09SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 826a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_rhs);CHKERRQ(ierr); 827a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 828801fbe65SHong Zhang ierr = VecDestroy(&mumps->b_seq);CHKERRQ(ierr); 829a5e57a09SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 830a5e57a09SHong Zhang ierr = PetscFree(mumps->id.perm_in);CHKERRQ(ierr); 831a5e57a09SHong Zhang ierr = PetscFree(mumps->irn);CHKERRQ(ierr); 832b34f08ffSHong Zhang ierr = PetscFree(mumps->info);CHKERRQ(ierr); 83359ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 834a5e57a09SHong Zhang mumps->id.job = JOB_END; 835a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 8366f3cc6f9SBarry Smith ierr = MPI_Comm_free(&mumps->comm_mumps);CHKERRQ(ierr); 837a5e57a09SHong Zhang if (mumps->Destroy) { 838a5e57a09SHong Zhang ierr = (mumps->Destroy)(A);CHKERRQ(ierr); 839bf0cc555SLisandro Dalcin } 840bf0cc555SLisandro Dalcin ierr = PetscFree(A->spptr);CHKERRQ(ierr); 841bf0cc555SLisandro Dalcin 84297969023SHong Zhang /* clear composed functions */ 843bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSolverPackage_C",NULL);CHKERRQ(ierr); 8445a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorSetSchurIS_C",NULL);CHKERRQ(ierr); 8455a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorInvertSchurComplement_C",NULL);CHKERRQ(ierr); 8465a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorCreateSchurComplement_C",NULL);CHKERRQ(ierr); 8475a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorGetSchurComplement_C",NULL);CHKERRQ(ierr); 8485a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorSolveSchurComplement_C",NULL);CHKERRQ(ierr); 8495a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)A,"MatFactorSolveSchurComplementTranspose_C",NULL);CHKERRQ(ierr); 850bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetIcntl_C",NULL);CHKERRQ(ierr); 851bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetIcntl_C",NULL);CHKERRQ(ierr); 852bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsSetCntl_C",NULL);CHKERRQ(ierr); 853bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetCntl_C",NULL);CHKERRQ(ierr); 854ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfo_C",NULL);CHKERRQ(ierr); 855ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetInfog_C",NULL);CHKERRQ(ierr); 856ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfo_C",NULL);CHKERRQ(ierr); 857ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)A,"MatMumpsGetRinfog_C",NULL);CHKERRQ(ierr); 858397b6df1SKris Buschelman PetscFunctionReturn(0); 859397b6df1SKris Buschelman } 860397b6df1SKris Buschelman 861397b6df1SKris Buschelman #undef __FUNCT__ 862f6c57405SHong Zhang #define __FUNCT__ "MatSolve_MUMPS" 863b24902e0SBarry Smith PetscErrorCode MatSolve_MUMPS(Mat A,Vec b,Vec x) 864b24902e0SBarry Smith { 865a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 866d54de34fSKris Buschelman PetscScalar *array; 86767877ebaSShri Abhyankar Vec b_seq; 868329ec9b3SHong Zhang IS is_iden,is_petsc; 869dfbe8321SBarry Smith PetscErrorCode ierr; 870329ec9b3SHong Zhang PetscInt i; 871*cc86f929SStefano Zampini PetscBool second_solve = PETSC_FALSE; 872883f2eb9SBarry Smith static PetscBool cite1 = PETSC_FALSE,cite2 = PETSC_FALSE; 873397b6df1SKris Buschelman 874397b6df1SKris Buschelman PetscFunctionBegin; 875883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS01,\n author = {P.~R. Amestoy and I.~S. Duff and J.-Y. L'Excellent and J. Koster},\n title = {A fully asynchronous multifrontal solver using distributed dynamic scheduling},\n journal = {SIAM Journal on Matrix Analysis and Applications},\n volume = {23},\n number = {1},\n pages = {15--41},\n year = {2001}\n}\n",&cite1);CHKERRQ(ierr); 876883f2eb9SBarry Smith ierr = PetscCitationsRegister("@article{MUMPS02,\n author = {P.~R. Amestoy and A. Guermouche and J.-Y. L'Excellent and S. Pralet},\n title = {Hybrid scheduling for the parallel solution of linear systems},\n journal = {Parallel Computing},\n volume = {32},\n number = {2},\n pages = {136--156},\n year = {2006}\n}\n",&cite2);CHKERRQ(ierr); 877a5e57a09SHong Zhang mumps->id.nrhs = 1; 878a5e57a09SHong Zhang b_seq = mumps->b_seq; 879a5e57a09SHong Zhang if (mumps->size > 1) { 880329ec9b3SHong Zhang /* MUMPS only supports centralized rhs. Scatter b into a seqential rhs vector */ 881a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 882a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_rhs,b,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 883a5e57a09SHong Zhang if (!mumps->myid) {ierr = VecGetArray(b_seq,&array);CHKERRQ(ierr);} 884397b6df1SKris Buschelman } else { /* size == 1 */ 885397b6df1SKris Buschelman ierr = VecCopy(b,x);CHKERRQ(ierr); 886397b6df1SKris Buschelman ierr = VecGetArray(x,&array);CHKERRQ(ierr); 887397b6df1SKris Buschelman } 888a5e57a09SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 889a5e57a09SHong Zhang mumps->id.nrhs = 1; 890940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 891397b6df1SKris Buschelman } 892397b6df1SKris Buschelman 893*cc86f929SStefano Zampini /* 894*cc86f929SStefano Zampini handle condensation step of Schur complement (if any) 895*cc86f929SStefano Zampini We set by default ICNTL(26) == -1 when Schur indices have been provided by the user. 896*cc86f929SStefano Zampini According to MUMPS (5.0.0) manual, any value should be harmful during the factorization phase 897*cc86f929SStefano Zampini Unless the user provides a valid value for ICNTL(26), MatSolve and MatMatSolve routines solve the full system. 898*cc86f929SStefano Zampini This requires an extra call to PetscMUMPS_c and the computation of the factors for S 899*cc86f929SStefano Zampini */ 900*cc86f929SStefano Zampini if (mumps->id.ICNTL(26) < 0 || mumps->id.ICNTL(26) > 2) { 901*cc86f929SStefano Zampini second_solve = PETSC_TRUE; 902b8f61ee1SStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 903*cc86f929SStefano Zampini } 904397b6df1SKris Buschelman /* solve phase */ 905329ec9b3SHong Zhang /*-------------*/ 906a5e57a09SHong Zhang mumps->id.job = JOB_SOLVE; 907a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 908a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 909397b6df1SKris Buschelman 910b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 911*cc86f929SStefano Zampini if (second_solve) { 912b8f61ee1SStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 913*cc86f929SStefano Zampini } 914b5fa320bSStefano Zampini 915a5e57a09SHong Zhang if (mumps->size > 1) { /* convert mumps distributed solution to petsc mpi x */ 916a5e57a09SHong Zhang if (mumps->scat_sol && mumps->ICNTL9_pre != mumps->id.ICNTL(9)) { 917a5e57a09SHong Zhang /* when id.ICNTL(9) changes, the contents of lsol_loc may change (not its size, lsol_loc), recreates scat_sol */ 918a5e57a09SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 919397b6df1SKris Buschelman } 920a5e57a09SHong Zhang if (!mumps->scat_sol) { /* create scatter scat_sol */ 921a5e57a09SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,mumps->id.lsol_loc,0,1,&is_iden);CHKERRQ(ierr); /* from */ 922a5e57a09SHong Zhang for (i=0; i<mumps->id.lsol_loc; i++) { 923a5e57a09SHong Zhang mumps->id.isol_loc[i] -= 1; /* change Fortran style to C style */ 924a5e57a09SHong Zhang } 925a5e57a09SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,mumps->id.lsol_loc,mumps->id.isol_loc,PETSC_COPY_VALUES,&is_petsc);CHKERRQ(ierr); /* to */ 926a5e57a09SHong Zhang ierr = VecScatterCreate(mumps->x_seq,is_iden,x,is_petsc,&mumps->scat_sol);CHKERRQ(ierr); 9276bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 9286bf464f9SBarry Smith ierr = ISDestroy(&is_petsc);CHKERRQ(ierr); 9292205254eSKarl Rupp 930a5e57a09SHong Zhang mumps->ICNTL9_pre = mumps->id.ICNTL(9); /* save current value of id.ICNTL(9) */ 931397b6df1SKris Buschelman } 932a5e57a09SHong Zhang 933a5e57a09SHong Zhang ierr = VecScatterBegin(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 934a5e57a09SHong Zhang ierr = VecScatterEnd(mumps->scat_sol,mumps->x_seq,x,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 935329ec9b3SHong Zhang } 936397b6df1SKris Buschelman PetscFunctionReturn(0); 937397b6df1SKris Buschelman } 938397b6df1SKris Buschelman 93951d5961aSHong Zhang #undef __FUNCT__ 94051d5961aSHong Zhang #define __FUNCT__ "MatSolveTranspose_MUMPS" 94151d5961aSHong Zhang PetscErrorCode MatSolveTranspose_MUMPS(Mat A,Vec b,Vec x) 94251d5961aSHong Zhang { 943a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 94451d5961aSHong Zhang PetscErrorCode ierr; 94551d5961aSHong Zhang 94651d5961aSHong Zhang PetscFunctionBegin; 947a5e57a09SHong Zhang mumps->id.ICNTL(9) = 0; 9480ad0caddSJed Brown ierr = MatSolve_MUMPS(A,b,x);CHKERRQ(ierr); 949a5e57a09SHong Zhang mumps->id.ICNTL(9) = 1; 95051d5961aSHong Zhang PetscFunctionReturn(0); 95151d5961aSHong Zhang } 95251d5961aSHong Zhang 953e0b74bf9SHong Zhang #undef __FUNCT__ 954e0b74bf9SHong Zhang #define __FUNCT__ "MatMatSolve_MUMPS" 955e0b74bf9SHong Zhang PetscErrorCode MatMatSolve_MUMPS(Mat A,Mat B,Mat X) 956e0b74bf9SHong Zhang { 957bda8bf91SBarry Smith PetscErrorCode ierr; 958bda8bf91SBarry Smith PetscBool flg; 9594e34a73bSHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 960334c5f61SHong Zhang PetscInt i,nrhs,M; 9612cd7d884SHong Zhang PetscScalar *array,*bray; 962bda8bf91SBarry Smith 963e0b74bf9SHong Zhang PetscFunctionBegin; 9640298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)B,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 965801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B must be MATDENSE matrix"); 9660298fd71SBarry Smith ierr = PetscObjectTypeCompareAny((PetscObject)X,&flg,MATSEQDENSE,MATMPIDENSE,NULL);CHKERRQ(ierr); 967801fbe65SHong Zhang if (!flg) SETERRQ(PetscObjectComm((PetscObject)X),PETSC_ERR_ARG_WRONG,"Matrix X must be MATDENSE matrix"); 968801fbe65SHong Zhang if (B->rmap->n != X->rmap->n) SETERRQ(PetscObjectComm((PetscObject)B),PETSC_ERR_ARG_WRONG,"Matrix B and X must have same row distribution"); 9694e34a73bSHong Zhang 9702cd7d884SHong Zhang ierr = MatGetSize(B,&M,&nrhs);CHKERRQ(ierr); 971334c5f61SHong Zhang mumps->id.nrhs = nrhs; 972334c5f61SHong Zhang mumps->id.lrhs = M; 9734e34a73bSHong Zhang 9742cd7d884SHong Zhang if (mumps->size == 1) { 9752cd7d884SHong Zhang /* copy B to X */ 9762cd7d884SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 9772cd7d884SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 9786444a565SStefano Zampini ierr = PetscMemcpy(array,bray,M*nrhs*sizeof(PetscScalar));CHKERRQ(ierr); 9792cd7d884SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 980940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)array; 981b5fa320bSStefano Zampini /* handle condensation step of Schur complement (if any) */ 982b8f61ee1SStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 983801fbe65SHong Zhang 9842cd7d884SHong Zhang /* solve phase */ 9852cd7d884SHong Zhang /*-------------*/ 9862cd7d884SHong Zhang mumps->id.job = JOB_SOLVE; 9872cd7d884SHong Zhang PetscMUMPS_c(&mumps->id); 9882cd7d884SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 989b5fa320bSStefano Zampini 990b5fa320bSStefano Zampini /* handle expansion step of Schur complement (if any) */ 991b8f61ee1SStefano Zampini ierr = MatMumpsHandleSchur_Private(mumps,PETSC_TRUE);CHKERRQ(ierr); 9922cd7d884SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 993334c5f61SHong Zhang } else { /*--------- parallel case --------*/ 99471aed81dSHong Zhang PetscInt lsol_loc,nlsol_loc,*isol_loc,*idx,*iidx,*idxx,*isol_loc_save; 9951070efccSSatish Balay MumpsScalar *sol_loc,*sol_loc_save; 996801fbe65SHong Zhang IS is_to,is_from; 997334c5f61SHong Zhang PetscInt k,proc,j,m; 998801fbe65SHong Zhang const PetscInt *rstart; 999334c5f61SHong Zhang Vec v_mpi,b_seq,x_seq; 1000334c5f61SHong Zhang VecScatter scat_rhs,scat_sol; 1001801fbe65SHong Zhang 1002801fbe65SHong Zhang /* create x_seq to hold local solution */ 100371aed81dSHong Zhang isol_loc_save = mumps->id.isol_loc; /* save it for MatSovle() */ 100471aed81dSHong Zhang sol_loc_save = mumps->id.sol_loc; 1005801fbe65SHong Zhang 100671aed81dSHong Zhang lsol_loc = mumps->id.INFO(23); 100771aed81dSHong Zhang nlsol_loc = nrhs*lsol_loc; /* length of sol_loc */ 100871aed81dSHong Zhang ierr = PetscMalloc2(nlsol_loc,&sol_loc,nlsol_loc,&isol_loc);CHKERRQ(ierr); 1009940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1010801fbe65SHong Zhang mumps->id.isol_loc = isol_loc; 1011801fbe65SHong Zhang 10121070efccSSatish Balay ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,nlsol_loc,(PetscScalar*)sol_loc,&x_seq);CHKERRQ(ierr); 10132cd7d884SHong Zhang 101474f0fcc7SHong Zhang /* copy rhs matrix B into vector v_mpi */ 1015334c5f61SHong Zhang ierr = MatGetLocalSize(B,&m,NULL);CHKERRQ(ierr); 1016801fbe65SHong Zhang ierr = MatDenseGetArray(B,&bray);CHKERRQ(ierr); 101774f0fcc7SHong Zhang ierr = VecCreateMPIWithArray(PetscObjectComm((PetscObject)B),1,nrhs*m,nrhs*M,(const PetscScalar*)bray,&v_mpi);CHKERRQ(ierr); 1018801fbe65SHong Zhang ierr = MatDenseRestoreArray(B,&bray);CHKERRQ(ierr); 1019801fbe65SHong Zhang 1020334c5f61SHong Zhang /* scatter v_mpi to b_seq because MUMPS only supports centralized rhs */ 102174f0fcc7SHong Zhang /* idx: maps from k-th index of v_mpi to (i,j)-th global entry of B; 1022801fbe65SHong Zhang iidx: inverse of idx, will be used by scattering xx_seq -> X */ 1023801fbe65SHong Zhang ierr = PetscMalloc2(nrhs*M,&idx,nrhs*M,&iidx);CHKERRQ(ierr); 1024801fbe65SHong Zhang ierr = MatGetOwnershipRanges(B,&rstart);CHKERRQ(ierr); 1025801fbe65SHong Zhang k = 0; 1026801fbe65SHong Zhang for (proc=0; proc<mumps->size; proc++){ 1027801fbe65SHong Zhang for (j=0; j<nrhs; j++){ 1028801fbe65SHong Zhang for (i=rstart[proc]; i<rstart[proc+1]; i++){ 1029801fbe65SHong Zhang iidx[j*M + i] = k; 1030801fbe65SHong Zhang idx[k++] = j*M + i; 1031801fbe65SHong Zhang } 1032801fbe65SHong Zhang } 10332cd7d884SHong Zhang } 10342cd7d884SHong Zhang 1035801fbe65SHong Zhang if (!mumps->myid) { 1036334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,nrhs*M,&b_seq);CHKERRQ(ierr); 1037801fbe65SHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nrhs*M,idx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1038801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nrhs*M,0,1,&is_from);CHKERRQ(ierr); 1039801fbe65SHong Zhang } else { 1040334c5f61SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&b_seq);CHKERRQ(ierr); 1041801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_to);CHKERRQ(ierr); 1042801fbe65SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_from);CHKERRQ(ierr); 1043801fbe65SHong Zhang } 1044334c5f61SHong Zhang ierr = VecScatterCreate(v_mpi,is_from,b_seq,is_to,&scat_rhs);CHKERRQ(ierr); 1045334c5f61SHong Zhang ierr = VecScatterBegin(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1046801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1047801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1048334c5f61SHong Zhang ierr = VecScatterEnd(scat_rhs,v_mpi,b_seq,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1049801fbe65SHong Zhang 1050801fbe65SHong Zhang if (!mumps->myid) { /* define rhs on the host */ 1051334c5f61SHong Zhang ierr = VecGetArray(b_seq,&bray);CHKERRQ(ierr); 1052940cd9d6SSatish Balay mumps->id.rhs = (MumpsScalar*)bray; 1053334c5f61SHong Zhang ierr = VecRestoreArray(b_seq,&bray);CHKERRQ(ierr); 1054801fbe65SHong Zhang } 1055801fbe65SHong Zhang 1056801fbe65SHong Zhang /* solve phase */ 1057801fbe65SHong Zhang /*-------------*/ 1058801fbe65SHong Zhang mumps->id.job = JOB_SOLVE; 1059801fbe65SHong Zhang PetscMUMPS_c(&mumps->id); 1060801fbe65SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in solve phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 1061801fbe65SHong Zhang 1062334c5f61SHong Zhang /* scatter mumps distributed solution to petsc vector v_mpi, which shares local arrays with solution matrix X */ 106374f0fcc7SHong Zhang ierr = MatDenseGetArray(X,&array);CHKERRQ(ierr); 106474f0fcc7SHong Zhang ierr = VecPlaceArray(v_mpi,array);CHKERRQ(ierr); 1065801fbe65SHong Zhang 1066334c5f61SHong Zhang /* create scatter scat_sol */ 106771aed81dSHong Zhang ierr = PetscMalloc1(nlsol_loc,&idxx);CHKERRQ(ierr); 106871aed81dSHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,nlsol_loc,0,1,&is_from);CHKERRQ(ierr); 106971aed81dSHong Zhang for (i=0; i<lsol_loc; i++) { 1070334c5f61SHong Zhang isol_loc[i] -= 1; /* change Fortran style to C style */ 1071334c5f61SHong Zhang idxx[i] = iidx[isol_loc[i]]; 1072801fbe65SHong Zhang for (j=1; j<nrhs; j++){ 1073334c5f61SHong Zhang idxx[j*lsol_loc+i] = iidx[isol_loc[i]+j*M]; 1074801fbe65SHong Zhang } 1075801fbe65SHong Zhang } 107671aed81dSHong Zhang ierr = ISCreateGeneral(PETSC_COMM_SELF,nlsol_loc,idxx,PETSC_COPY_VALUES,&is_to);CHKERRQ(ierr); 1077334c5f61SHong Zhang ierr = VecScatterCreate(x_seq,is_from,v_mpi,is_to,&scat_sol);CHKERRQ(ierr); 1078334c5f61SHong Zhang ierr = VecScatterBegin(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1079801fbe65SHong Zhang ierr = ISDestroy(&is_from);CHKERRQ(ierr); 1080801fbe65SHong Zhang ierr = ISDestroy(&is_to);CHKERRQ(ierr); 1081334c5f61SHong Zhang ierr = VecScatterEnd(scat_sol,x_seq,v_mpi,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1082801fbe65SHong Zhang ierr = MatDenseRestoreArray(X,&array);CHKERRQ(ierr); 108371aed81dSHong Zhang 108471aed81dSHong Zhang /* free spaces */ 108571aed81dSHong Zhang mumps->id.sol_loc = sol_loc_save; 108671aed81dSHong Zhang mumps->id.isol_loc = isol_loc_save; 108771aed81dSHong Zhang 108871aed81dSHong Zhang ierr = PetscFree2(sol_loc,isol_loc);CHKERRQ(ierr); 1089801fbe65SHong Zhang ierr = PetscFree2(idx,iidx);CHKERRQ(ierr); 1090801fbe65SHong Zhang ierr = PetscFree(idxx);CHKERRQ(ierr); 109171aed81dSHong Zhang ierr = VecDestroy(&x_seq);CHKERRQ(ierr); 109274f0fcc7SHong Zhang ierr = VecDestroy(&v_mpi);CHKERRQ(ierr); 1093334c5f61SHong Zhang ierr = VecDestroy(&b_seq);CHKERRQ(ierr); 1094334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_rhs);CHKERRQ(ierr); 1095334c5f61SHong Zhang ierr = VecScatterDestroy(&scat_sol);CHKERRQ(ierr); 1096801fbe65SHong Zhang } 1097e0b74bf9SHong Zhang PetscFunctionReturn(0); 1098e0b74bf9SHong Zhang } 1099e0b74bf9SHong Zhang 1100ace3df97SHong Zhang #if !defined(PETSC_USE_COMPLEX) 1101a58c3f20SHong Zhang /* 1102a58c3f20SHong Zhang input: 1103a58c3f20SHong Zhang F: numeric factor 1104a58c3f20SHong Zhang output: 1105a58c3f20SHong Zhang nneg: total number of negative pivots 1106a58c3f20SHong Zhang nzero: 0 1107a58c3f20SHong Zhang npos: (global dimension of F) - nneg 1108a58c3f20SHong Zhang */ 1109a58c3f20SHong Zhang 1110a58c3f20SHong Zhang #undef __FUNCT__ 1111a58c3f20SHong Zhang #define __FUNCT__ "MatGetInertia_SBAIJMUMPS" 1112dfbe8321SBarry Smith PetscErrorCode MatGetInertia_SBAIJMUMPS(Mat F,int *nneg,int *nzero,int *npos) 1113a58c3f20SHong Zhang { 1114a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1115dfbe8321SBarry Smith PetscErrorCode ierr; 1116c1490034SHong Zhang PetscMPIInt size; 1117a58c3f20SHong Zhang 1118a58c3f20SHong Zhang PetscFunctionBegin; 1119ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)F),&size);CHKERRQ(ierr); 1120bcb30aebSHong Zhang /* MUMPS 4.3.1 calls ScaLAPACK when ICNTL(13)=0 (default), which does not offer the possibility to compute the inertia of a dense matrix. Set ICNTL(13)=1 to skip ScaLAPACK */ 1121a5e57a09SHong Zhang if (size > 1 && mumps->id.ICNTL(13) != 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"ICNTL(13)=%d. -mat_mumps_icntl_13 must be set as 1 for correct global matrix inertia\n",mumps->id.INFOG(13)); 1122ed85ac9fSHong Zhang 1123710ac8efSHong Zhang if (nneg) *nneg = mumps->id.INFOG(12); 1124ed85ac9fSHong Zhang if (nzero || npos) { 1125ed85ac9fSHong Zhang if (mumps->id.ICNTL(24) != 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"-mat_mumps_icntl_24 must be set as 1 for null pivot row detection"); 1126710ac8efSHong Zhang if (nzero) *nzero = mumps->id.INFOG(28); 1127710ac8efSHong Zhang if (npos) *npos = F->rmap->N - (mumps->id.INFOG(12) + mumps->id.INFOG(28)); 1128a58c3f20SHong Zhang } 1129a58c3f20SHong Zhang PetscFunctionReturn(0); 1130a58c3f20SHong Zhang } 1131ace3df97SHong Zhang #endif /* !defined(PETSC_USE_COMPLEX) */ 1132a58c3f20SHong Zhang 1133397b6df1SKris Buschelman #undef __FUNCT__ 1134f6c57405SHong Zhang #define __FUNCT__ "MatFactorNumeric_MUMPS" 11350481f469SBarry Smith PetscErrorCode MatFactorNumeric_MUMPS(Mat F,Mat A,const MatFactorInfo *info) 1136af281ebdSHong Zhang { 1137a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)(F)->spptr; 11386849ba73SBarry Smith PetscErrorCode ierr; 1139e09efc27SHong Zhang Mat F_diag; 1140ace3abfcSBarry Smith PetscBool isMPIAIJ; 1141397b6df1SKris Buschelman 1142397b6df1SKris Buschelman PetscFunctionBegin; 1143a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_REUSE_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1144397b6df1SKris Buschelman 1145397b6df1SKris Buschelman /* numerical factorization phase */ 1146329ec9b3SHong Zhang /*-------------------------------*/ 1147a5e57a09SHong Zhang mumps->id.job = JOB_FACTNUMERIC; 11484e34a73bSHong Zhang if (!mumps->id.ICNTL(18)) { /* A is centralized */ 1149a5e57a09SHong Zhang if (!mumps->myid) { 1150940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 1151397b6df1SKris Buschelman } 1152397b6df1SKris Buschelman } else { 1153940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 1154397b6df1SKris Buschelman } 1155a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1156a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) { 1157151787a6SHong Zhang if (mumps->id.INFO(1) == -13) { 1158151787a6SHong Zhang if (mumps->id.INFO(2) < 0) { 1159151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d megabytes\n",-mumps->id.INFO(2)); 1160151787a6SHong Zhang } else { 1161151787a6SHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: Cannot allocate required memory %d bytes\n",mumps->id.INFO(2)); 1162151787a6SHong Zhang } 1163151787a6SHong Zhang } else SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in numerical factorization phase: INFO(1)=%d, INFO(2)=%d\n",mumps->id.INFO(1),mumps->id.INFO(2)); 1164397b6df1SKris Buschelman } 1165a5e57a09SHong Zhang if (!mumps->myid && mumps->id.ICNTL(16) > 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB," mumps->id.ICNTL(16):=%d\n",mumps->id.INFOG(16)); 1166397b6df1SKris Buschelman 1167dcd589f8SShri Abhyankar (F)->assembled = PETSC_TRUE; 1168a5e57a09SHong Zhang mumps->matstruc = SAME_NONZERO_PATTERN; 1169b5fa320bSStefano Zampini mumps->schur_factored = PETSC_FALSE; 117059ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 117167877ebaSShri Abhyankar 1172066565c5SStefano Zampini /* just to be sure that ICNTL(19) value returned by a call from MatMumpsGetIcntl is always consistent */ 1173066565c5SStefano Zampini if (!mumps->sym && mumps->id.ICNTL(19) && mumps->id.ICNTL(19) != 1) mumps->id.ICNTL(19) = 3; 1174066565c5SStefano Zampini 1175a5e57a09SHong Zhang if (mumps->size > 1) { 117667877ebaSShri Abhyankar PetscInt lsol_loc; 117767877ebaSShri Abhyankar PetscScalar *sol_loc; 11782205254eSKarl Rupp 1179c2093ab7SHong Zhang ierr = PetscObjectTypeCompare((PetscObject)A,MATMPIAIJ,&isMPIAIJ);CHKERRQ(ierr); 1180c2093ab7SHong Zhang if (isMPIAIJ) F_diag = ((Mat_MPIAIJ*)(F)->data)->A; 1181c2093ab7SHong Zhang else F_diag = ((Mat_MPISBAIJ*)(F)->data)->A; 1182c2093ab7SHong Zhang F_diag->assembled = PETSC_TRUE; 1183c2093ab7SHong Zhang 1184c2093ab7SHong Zhang /* distributed solution; Create x_seq=sol_loc for repeated use */ 1185c2093ab7SHong Zhang if (mumps->x_seq) { 1186c2093ab7SHong Zhang ierr = VecScatterDestroy(&mumps->scat_sol);CHKERRQ(ierr); 1187c2093ab7SHong Zhang ierr = PetscFree2(mumps->id.sol_loc,mumps->id.isol_loc);CHKERRQ(ierr); 1188c2093ab7SHong Zhang ierr = VecDestroy(&mumps->x_seq);CHKERRQ(ierr); 1189c2093ab7SHong Zhang } 1190a5e57a09SHong Zhang lsol_loc = mumps->id.INFO(23); /* length of sol_loc */ 1191dcca6d9dSJed Brown ierr = PetscMalloc2(lsol_loc,&sol_loc,lsol_loc,&mumps->id.isol_loc);CHKERRQ(ierr); 1192a5e57a09SHong Zhang mumps->id.lsol_loc = lsol_loc; 1193940cd9d6SSatish Balay mumps->id.sol_loc = (MumpsScalar*)sol_loc; 1194a5e57a09SHong Zhang ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,1,lsol_loc,sol_loc,&mumps->x_seq);CHKERRQ(ierr); 119567877ebaSShri Abhyankar } 1196397b6df1SKris Buschelman PetscFunctionReturn(0); 1197397b6df1SKris Buschelman } 1198397b6df1SKris Buschelman 11999a2535b5SHong Zhang /* Sets MUMPS options from the options database */ 1200dcd589f8SShri Abhyankar #undef __FUNCT__ 12019a2535b5SHong Zhang #define __FUNCT__ "PetscSetMUMPSFromOptions" 12029a2535b5SHong Zhang PetscErrorCode PetscSetMUMPSFromOptions(Mat F, Mat A) 1203dcd589f8SShri Abhyankar { 12049a2535b5SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1205dcd589f8SShri Abhyankar PetscErrorCode ierr; 1206b34f08ffSHong Zhang PetscInt icntl,info[40],i,ninfo=40; 1207ace3abfcSBarry Smith PetscBool flg; 1208dcd589f8SShri Abhyankar 1209dcd589f8SShri Abhyankar PetscFunctionBegin; 1210ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)A),((PetscObject)A)->prefix,"MUMPS Options","Mat");CHKERRQ(ierr); 12119a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_1","ICNTL(1): output stream for error messages","None",mumps->id.ICNTL(1),&icntl,&flg);CHKERRQ(ierr); 12129a2535b5SHong Zhang if (flg) mumps->id.ICNTL(1) = icntl; 12139a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_2","ICNTL(2): output stream for diagnostic printing, statistics, and warning","None",mumps->id.ICNTL(2),&icntl,&flg);CHKERRQ(ierr); 12149a2535b5SHong Zhang if (flg) mumps->id.ICNTL(2) = icntl; 12159a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_3","ICNTL(3): output stream for global information, collected on the host","None",mumps->id.ICNTL(3),&icntl,&flg);CHKERRQ(ierr); 12169a2535b5SHong Zhang if (flg) mumps->id.ICNTL(3) = icntl; 1217dcd589f8SShri Abhyankar 12189a2535b5SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_4","ICNTL(4): level of printing (0 to 4)","None",mumps->id.ICNTL(4),&icntl,&flg);CHKERRQ(ierr); 12199a2535b5SHong Zhang if (flg) mumps->id.ICNTL(4) = icntl; 12209a2535b5SHong Zhang if (mumps->id.ICNTL(4) || PetscLogPrintInfo) mumps->id.ICNTL(3) = 6; /* resume MUMPS default id.ICNTL(3) = 6 */ 12219a2535b5SHong Zhang 1222d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_6","ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7)","None",mumps->id.ICNTL(6),&icntl,&flg);CHKERRQ(ierr); 12239a2535b5SHong Zhang if (flg) mumps->id.ICNTL(6) = icntl; 12249a2535b5SHong Zhang 1225d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_7","ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis","None",mumps->id.ICNTL(7),&icntl,&flg);CHKERRQ(ierr); 1226dcd589f8SShri Abhyankar if (flg) { 12272205254eSKarl Rupp if (icntl== 1 && mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"pivot order be set by the user in PERM_IN -- not supported by the PETSc/MUMPS interface\n"); 12282205254eSKarl Rupp else mumps->id.ICNTL(7) = icntl; 1229dcd589f8SShri Abhyankar } 1230e0b74bf9SHong Zhang 12310298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_8","ICNTL(8): scaling strategy (-2 to 8 or 77)","None",mumps->id.ICNTL(8),&mumps->id.ICNTL(8),NULL);CHKERRQ(ierr); 1232d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_9","ICNTL(9): computes the solution using A or A^T","None",mumps->id.ICNTL(9),&mumps->id.ICNTL(9),NULL);CHKERRQ(ierr); handled by MatSolveTranspose_MUMPS() */ 12330298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_10","ICNTL(10): max num of refinements","None",mumps->id.ICNTL(10),&mumps->id.ICNTL(10),NULL);CHKERRQ(ierr); 1234d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_11","ICNTL(11): statistics related to an error analysis (via -ksp_view)","None",mumps->id.ICNTL(11),&mumps->id.ICNTL(11),NULL);CHKERRQ(ierr); 1235d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_12","ICNTL(12): an ordering strategy for symmetric matrices (0 to 3)","None",mumps->id.ICNTL(12),&mumps->id.ICNTL(12),NULL);CHKERRQ(ierr); 1236d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_13","ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting","None",mumps->id.ICNTL(13),&mumps->id.ICNTL(13),NULL);CHKERRQ(ierr); 1237d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_14","ICNTL(14): percentage increase in the estimated working space","None",mumps->id.ICNTL(14),&mumps->id.ICNTL(14),NULL);CHKERRQ(ierr); 1238d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_19","ICNTL(19): computes the Schur complement","None",mumps->id.ICNTL(19),&mumps->id.ICNTL(19),NULL);CHKERRQ(ierr); 123959ac8732SStefano Zampini if (mumps->id.ICNTL(19) <= 0 || mumps->id.ICNTL(19) > 3) { /* reset any schur data (if any) */ 124059ac8732SStefano Zampini ierr = MatMumpsResetSchur_Private(mumps);CHKERRQ(ierr); 124159ac8732SStefano Zampini } 12424e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_20","ICNTL(20): the format (dense or sparse) of the right-hand sides","None",mumps->id.ICNTL(20),&mumps->id.ICNTL(20),NULL);CHKERRQ(ierr); -- sparse rhs is not supported in PETSc API */ 1243d341cd04SHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_21","ICNTL(21): the distribution (centralized or distributed) of the solution vectors","None",mumps->id.ICNTL(21),&mumps->id.ICNTL(21),NULL);CHKERRQ(ierr); we only use distributed solution vector */ 12449a2535b5SHong Zhang 1245d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_22","ICNTL(22): in-core/out-of-core factorization and solve (0 or 1)","None",mumps->id.ICNTL(22),&mumps->id.ICNTL(22),NULL);CHKERRQ(ierr); 12460298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_23","ICNTL(23): max size of the working memory (MB) that can allocate per processor","None",mumps->id.ICNTL(23),&mumps->id.ICNTL(23),NULL);CHKERRQ(ierr); 12470298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_24","ICNTL(24): detection of null pivot rows (0 or 1)","None",mumps->id.ICNTL(24),&mumps->id.ICNTL(24),NULL);CHKERRQ(ierr); 12489a2535b5SHong Zhang if (mumps->id.ICNTL(24)) { 12499a2535b5SHong Zhang mumps->id.ICNTL(13) = 1; /* turn-off ScaLAPACK to help with the correct detection of null pivots */ 1250d7ebd59bSHong Zhang } 1251d7ebd59bSHong Zhang 1252d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_25","ICNTL(25): compute a solution of a deficient matrix and a null space basis","None",mumps->id.ICNTL(25),&mumps->id.ICNTL(25),NULL);CHKERRQ(ierr); 1253d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_26","ICNTL(26): drives the solution phase if a Schur complement matrix","None",mumps->id.ICNTL(26),&mumps->id.ICNTL(26),NULL);CHKERRQ(ierr); 12542cd7d884SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_27","ICNTL(27): the blocking size for multiple right-hand sides","None",mumps->id.ICNTL(27),&mumps->id.ICNTL(27),NULL);CHKERRQ(ierr); 12550298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_28","ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering","None",mumps->id.ICNTL(28),&mumps->id.ICNTL(28),NULL);CHKERRQ(ierr); 1256d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_29","ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis","None",mumps->id.ICNTL(29),&mumps->id.ICNTL(29),NULL);CHKERRQ(ierr); 12570298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_30","ICNTL(30): compute user-specified set of entries in inv(A)","None",mumps->id.ICNTL(30),&mumps->id.ICNTL(30),NULL);CHKERRQ(ierr); 1258d341cd04SHong Zhang ierr = PetscOptionsInt("-mat_mumps_icntl_31","ICNTL(31): indicates which factors may be discarded during factorization","None",mumps->id.ICNTL(31),&mumps->id.ICNTL(31),NULL);CHKERRQ(ierr); 12594e34a73bSHong Zhang /* ierr = PetscOptionsInt("-mat_mumps_icntl_32","ICNTL(32): performs the forward elemination of the right-hand sides during factorization","None",mumps->id.ICNTL(32),&mumps->id.ICNTL(32),NULL);CHKERRQ(ierr); -- not supported by PETSc API */ 12600298fd71SBarry Smith ierr = PetscOptionsInt("-mat_mumps_icntl_33","ICNTL(33): compute determinant","None",mumps->id.ICNTL(33),&mumps->id.ICNTL(33),NULL);CHKERRQ(ierr); 1261dcd589f8SShri Abhyankar 12620298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_1","CNTL(1): relative pivoting threshold","None",mumps->id.CNTL(1),&mumps->id.CNTL(1),NULL);CHKERRQ(ierr); 12630298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_2","CNTL(2): stopping criterion of refinement","None",mumps->id.CNTL(2),&mumps->id.CNTL(2),NULL);CHKERRQ(ierr); 12640298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_3","CNTL(3): absolute pivoting threshold","None",mumps->id.CNTL(3),&mumps->id.CNTL(3),NULL);CHKERRQ(ierr); 12650298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_4","CNTL(4): value for static pivoting","None",mumps->id.CNTL(4),&mumps->id.CNTL(4),NULL);CHKERRQ(ierr); 12660298fd71SBarry Smith ierr = PetscOptionsReal("-mat_mumps_cntl_5","CNTL(5): fixation for null pivots","None",mumps->id.CNTL(5),&mumps->id.CNTL(5),NULL);CHKERRQ(ierr); 1267e5bb22a1SHong Zhang 12680298fd71SBarry Smith ierr = PetscOptionsString("-mat_mumps_ooc_tmpdir", "out of core directory", "None", mumps->id.ooc_tmpdir, mumps->id.ooc_tmpdir, 256, NULL); 1269b34f08ffSHong Zhang 127016d797efSHong Zhang ierr = PetscOptionsIntArray("-mat_mumps_view_info","request INFO local to each processor","",info,&ninfo,NULL);CHKERRQ(ierr); 1271b34f08ffSHong Zhang if (ninfo) { 1272b34f08ffSHong Zhang if (ninfo > 40) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"number of INFO %d must <= 40\n",ninfo); 1273b34f08ffSHong Zhang ierr = PetscMalloc1(ninfo,&mumps->info);CHKERRQ(ierr); 1274b34f08ffSHong Zhang mumps->ninfo = ninfo; 1275b34f08ffSHong Zhang for (i=0; i<ninfo; i++) { 1276b34f08ffSHong Zhang if (info[i] < 0 || info[i]>40) { 1277b34f08ffSHong Zhang SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"index of INFO %d must between 1 and 40\n",ninfo); 1278b34f08ffSHong Zhang } else { 1279b34f08ffSHong Zhang mumps->info[i] = info[i]; 1280b34f08ffSHong Zhang } 1281b34f08ffSHong Zhang } 1282b34f08ffSHong Zhang } 1283b34f08ffSHong Zhang 1284dcd589f8SShri Abhyankar PetscOptionsEnd(); 1285dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1286dcd589f8SShri Abhyankar } 1287dcd589f8SShri Abhyankar 1288dcd589f8SShri Abhyankar #undef __FUNCT__ 1289dcd589f8SShri Abhyankar #define __FUNCT__ "PetscInitializeMUMPS" 1290f697e70eSHong Zhang PetscErrorCode PetscInitializeMUMPS(Mat A,Mat_MUMPS *mumps) 1291dcd589f8SShri Abhyankar { 1292dcd589f8SShri Abhyankar PetscErrorCode ierr; 1293dcd589f8SShri Abhyankar 1294dcd589f8SShri Abhyankar PetscFunctionBegin; 1295ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)A), &mumps->myid); 1296ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)A),&mumps->size);CHKERRQ(ierr); 1297ce94432eSBarry Smith ierr = MPI_Comm_dup(PetscObjectComm((PetscObject)A),&(mumps->comm_mumps));CHKERRQ(ierr); 12982205254eSKarl Rupp 1299f697e70eSHong Zhang mumps->id.comm_fortran = MPI_Comm_c2f(mumps->comm_mumps); 1300f697e70eSHong Zhang 1301f697e70eSHong Zhang mumps->id.job = JOB_INIT; 1302f697e70eSHong Zhang mumps->id.par = 1; /* host participates factorizaton and solve */ 1303f697e70eSHong Zhang mumps->id.sym = mumps->sym; 13042907cef9SHong Zhang PetscMUMPS_c(&mumps->id); 1305f697e70eSHong Zhang 13060298fd71SBarry Smith mumps->scat_rhs = NULL; 13070298fd71SBarry Smith mumps->scat_sol = NULL; 13089a2535b5SHong Zhang 130970544d5fSHong Zhang /* set PETSc-MUMPS default options - override MUMPS default */ 13109a2535b5SHong Zhang mumps->id.ICNTL(3) = 0; 13119a2535b5SHong Zhang mumps->id.ICNTL(4) = 0; 13129a2535b5SHong Zhang if (mumps->size == 1) { 13139a2535b5SHong Zhang mumps->id.ICNTL(18) = 0; /* centralized assembled matrix input */ 13149a2535b5SHong Zhang } else { 13159a2535b5SHong Zhang mumps->id.ICNTL(18) = 3; /* distributed assembled matrix input */ 13164e34a73bSHong Zhang mumps->id.ICNTL(20) = 0; /* rhs is in dense format */ 131770544d5fSHong Zhang mumps->id.ICNTL(21) = 1; /* distributed solution */ 13189a2535b5SHong Zhang } 13196444a565SStefano Zampini 13206444a565SStefano Zampini /* schur */ 13216444a565SStefano Zampini mumps->id.size_schur = 0; 13226444a565SStefano Zampini mumps->id.listvar_schur = NULL; 13236444a565SStefano Zampini mumps->id.schur = NULL; 1324b5fa320bSStefano Zampini mumps->sizeredrhs = 0; 1325b5fa320bSStefano Zampini mumps->schur_pivots = NULL; 1326b5fa320bSStefano Zampini mumps->schur_work = NULL; 132759ac8732SStefano Zampini mumps->schur_sol = NULL; 132859ac8732SStefano Zampini mumps->schur_sizesol = 0; 132959ac8732SStefano Zampini mumps->schur_factored = PETSC_FALSE; 133059ac8732SStefano Zampini mumps->schur_inverted = PETSC_FALSE; 1331dcd589f8SShri Abhyankar PetscFunctionReturn(0); 1332dcd589f8SShri Abhyankar } 1333dcd589f8SShri Abhyankar 1334a5e57a09SHong Zhang /* Note Petsc r(=c) permutation is used when mumps->id.ICNTL(7)==1 with centralized assembled matrix input; otherwise r and c are ignored */ 1335397b6df1SKris Buschelman #undef __FUNCT__ 1336f0c56d0fSKris Buschelman #define __FUNCT__ "MatLUFactorSymbolic_AIJMUMPS" 13370481f469SBarry Smith PetscErrorCode MatLUFactorSymbolic_AIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1338b24902e0SBarry Smith { 1339a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1340dcd589f8SShri Abhyankar PetscErrorCode ierr; 134167877ebaSShri Abhyankar Vec b; 134267877ebaSShri Abhyankar IS is_iden; 134367877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1344397b6df1SKris Buschelman 1345397b6df1SKris Buschelman PetscFunctionBegin; 1346a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1347dcd589f8SShri Abhyankar 13489a2535b5SHong Zhang /* Set MUMPS options from the options database */ 13499a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1350dcd589f8SShri Abhyankar 1351a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1352dcd589f8SShri Abhyankar 135367877ebaSShri Abhyankar /* analysis phase */ 135467877ebaSShri Abhyankar /*----------------*/ 1355a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1356a5e57a09SHong Zhang mumps->id.n = M; 1357a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 135867877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1359a5e57a09SHong Zhang if (!mumps->myid) { 1360a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1361a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1362940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 136367877ebaSShri Abhyankar } 1364a5e57a09SHong Zhang if (mumps->id.ICNTL(7) == 1) { /* use user-provide matrix ordering - assuming r = c ordering */ 13655248a706SHong Zhang /* 13665248a706SHong Zhang PetscBool flag; 13675248a706SHong Zhang ierr = ISEqual(r,c,&flag);CHKERRQ(ierr); 13685248a706SHong Zhang if (!flag) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"row_perm != col_perm"); 13695248a706SHong Zhang ierr = ISView(r,PETSC_VIEWER_STDOUT_SELF); 13705248a706SHong Zhang */ 1371a5e57a09SHong Zhang if (!mumps->myid) { 1372e0b74bf9SHong Zhang const PetscInt *idx; 1373e0b74bf9SHong Zhang PetscInt i,*perm_in; 13742205254eSKarl Rupp 1375785e854fSJed Brown ierr = PetscMalloc1(M,&perm_in);CHKERRQ(ierr); 1376e0b74bf9SHong Zhang ierr = ISGetIndices(r,&idx);CHKERRQ(ierr); 13772205254eSKarl Rupp 1378a5e57a09SHong Zhang mumps->id.perm_in = perm_in; 1379e0b74bf9SHong Zhang for (i=0; i<M; i++) perm_in[i] = idx[i]+1; /* perm_in[]: start from 1, not 0! */ 1380e0b74bf9SHong Zhang ierr = ISRestoreIndices(r,&idx);CHKERRQ(ierr); 1381e0b74bf9SHong Zhang } 1382e0b74bf9SHong Zhang } 138367877ebaSShri Abhyankar } 138467877ebaSShri Abhyankar break; 138567877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1386a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1387a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1388a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1389940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 139067877ebaSShri Abhyankar } 139167877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1392a5e57a09SHong Zhang if (!mumps->myid) { 13932cd7d884SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->rmap->N,&mumps->b_seq);CHKERRQ(ierr); 13942cd7d884SHong Zhang ierr = ISCreateStride(PETSC_COMM_SELF,A->rmap->N,0,1,&is_iden);CHKERRQ(ierr); 139567877ebaSShri Abhyankar } else { 1396a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 139767877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 139867877ebaSShri Abhyankar } 13992a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1400a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14016bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14026bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 140367877ebaSShri Abhyankar break; 140467877ebaSShri Abhyankar } 1405a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1406a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 140767877ebaSShri Abhyankar 1408719d5645SBarry Smith F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1409dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 141051d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 14114e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 1412b24902e0SBarry Smith PetscFunctionReturn(0); 1413b24902e0SBarry Smith } 1414b24902e0SBarry Smith 1415450b117fSShri Abhyankar /* Note the Petsc r and c permutations are ignored */ 1416450b117fSShri Abhyankar #undef __FUNCT__ 1417450b117fSShri Abhyankar #define __FUNCT__ "MatLUFactorSymbolic_BAIJMUMPS" 1418450b117fSShri Abhyankar PetscErrorCode MatLUFactorSymbolic_BAIJMUMPS(Mat F,Mat A,IS r,IS c,const MatFactorInfo *info) 1419450b117fSShri Abhyankar { 1420a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1421dcd589f8SShri Abhyankar PetscErrorCode ierr; 142267877ebaSShri Abhyankar Vec b; 142367877ebaSShri Abhyankar IS is_iden; 142467877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1425450b117fSShri Abhyankar 1426450b117fSShri Abhyankar PetscFunctionBegin; 1427a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1428dcd589f8SShri Abhyankar 14299a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14309a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1431dcd589f8SShri Abhyankar 1432a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 143367877ebaSShri Abhyankar 143467877ebaSShri Abhyankar /* analysis phase */ 143567877ebaSShri Abhyankar /*----------------*/ 1436a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1437a5e57a09SHong Zhang mumps->id.n = M; 1438a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 143967877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1440a5e57a09SHong Zhang if (!mumps->myid) { 1441a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1442a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1443940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 144467877ebaSShri Abhyankar } 144567877ebaSShri Abhyankar } 144667877ebaSShri Abhyankar break; 144767877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1448a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1449a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1450a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1451940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 145267877ebaSShri Abhyankar } 145367877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1454a5e57a09SHong Zhang if (!mumps->myid) { 1455a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 145667877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 145767877ebaSShri Abhyankar } else { 1458a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 145967877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 146067877ebaSShri Abhyankar } 14612a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1462a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 14636bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 14646bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 146567877ebaSShri Abhyankar break; 146667877ebaSShri Abhyankar } 1467a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1468a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 146967877ebaSShri Abhyankar 1470450b117fSShri Abhyankar F->ops->lufactornumeric = MatFactorNumeric_MUMPS; 1471dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 147251d5961aSHong Zhang F->ops->solvetranspose = MatSolveTranspose_MUMPS; 1473450b117fSShri Abhyankar PetscFunctionReturn(0); 1474450b117fSShri Abhyankar } 1475b24902e0SBarry Smith 1476141f4205SHong Zhang /* Note the Petsc r permutation and factor info are ignored */ 1477397b6df1SKris Buschelman #undef __FUNCT__ 147867877ebaSShri Abhyankar #define __FUNCT__ "MatCholeskyFactorSymbolic_MUMPS" 147967877ebaSShri Abhyankar PetscErrorCode MatCholeskyFactorSymbolic_MUMPS(Mat F,Mat A,IS r,const MatFactorInfo *info) 1480b24902e0SBarry Smith { 1481a5e57a09SHong Zhang Mat_MUMPS *mumps = (Mat_MUMPS*)F->spptr; 1482dcd589f8SShri Abhyankar PetscErrorCode ierr; 148367877ebaSShri Abhyankar Vec b; 148467877ebaSShri Abhyankar IS is_iden; 148567877ebaSShri Abhyankar const PetscInt M = A->rmap->N; 1486397b6df1SKris Buschelman 1487397b6df1SKris Buschelman PetscFunctionBegin; 1488a5e57a09SHong Zhang mumps->matstruc = DIFFERENT_NONZERO_PATTERN; 1489dcd589f8SShri Abhyankar 14909a2535b5SHong Zhang /* Set MUMPS options from the options database */ 14919a2535b5SHong Zhang ierr = PetscSetMUMPSFromOptions(F,A);CHKERRQ(ierr); 1492dcd589f8SShri Abhyankar 1493a5e57a09SHong Zhang ierr = (*mumps->ConvertToTriples)(A, 1, MAT_INITIAL_MATRIX, &mumps->nz, &mumps->irn, &mumps->jcn, &mumps->val);CHKERRQ(ierr); 1494dcd589f8SShri Abhyankar 149567877ebaSShri Abhyankar /* analysis phase */ 149667877ebaSShri Abhyankar /*----------------*/ 1497a5e57a09SHong Zhang mumps->id.job = JOB_FACTSYMBOLIC; 1498a5e57a09SHong Zhang mumps->id.n = M; 1499a5e57a09SHong Zhang switch (mumps->id.ICNTL(18)) { 150067877ebaSShri Abhyankar case 0: /* centralized assembled matrix input */ 1501a5e57a09SHong Zhang if (!mumps->myid) { 1502a5e57a09SHong Zhang mumps->id.nz =mumps->nz; mumps->id.irn=mumps->irn; mumps->id.jcn=mumps->jcn; 1503a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1504940cd9d6SSatish Balay mumps->id.a = (MumpsScalar*)mumps->val; 150567877ebaSShri Abhyankar } 150667877ebaSShri Abhyankar } 150767877ebaSShri Abhyankar break; 150867877ebaSShri Abhyankar case 3: /* distributed assembled matrix input (size>1) */ 1509a5e57a09SHong Zhang mumps->id.nz_loc = mumps->nz; 1510a5e57a09SHong Zhang mumps->id.irn_loc=mumps->irn; mumps->id.jcn_loc=mumps->jcn; 1511a5e57a09SHong Zhang if (mumps->id.ICNTL(6)>1) { 1512940cd9d6SSatish Balay mumps->id.a_loc = (MumpsScalar*)mumps->val; 151367877ebaSShri Abhyankar } 151467877ebaSShri Abhyankar /* MUMPS only supports centralized rhs. Create scatter scat_rhs for repeated use in MatSolve() */ 1515a5e57a09SHong Zhang if (!mumps->myid) { 1516a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,A->cmap->N,&mumps->b_seq);CHKERRQ(ierr); 151767877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,A->cmap->N,0,1,&is_iden);CHKERRQ(ierr); 151867877ebaSShri Abhyankar } else { 1519a5e57a09SHong Zhang ierr = VecCreateSeq(PETSC_COMM_SELF,0,&mumps->b_seq);CHKERRQ(ierr); 152067877ebaSShri Abhyankar ierr = ISCreateStride(PETSC_COMM_SELF,0,0,1,&is_iden);CHKERRQ(ierr); 152167877ebaSShri Abhyankar } 15222a7a6963SBarry Smith ierr = MatCreateVecs(A,NULL,&b);CHKERRQ(ierr); 1523a5e57a09SHong Zhang ierr = VecScatterCreate(b,is_iden,mumps->b_seq,is_iden,&mumps->scat_rhs);CHKERRQ(ierr); 15246bf464f9SBarry Smith ierr = ISDestroy(&is_iden);CHKERRQ(ierr); 15256bf464f9SBarry Smith ierr = VecDestroy(&b);CHKERRQ(ierr); 152667877ebaSShri Abhyankar break; 152767877ebaSShri Abhyankar } 1528a5e57a09SHong Zhang PetscMUMPS_c(&mumps->id); 1529a5e57a09SHong Zhang if (mumps->id.INFOG(1) < 0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error reported by MUMPS in analysis phase: INFOG(1)=%d\n",mumps->id.INFOG(1)); 153067877ebaSShri Abhyankar 15312792810eSHong Zhang F->ops->choleskyfactornumeric = MatFactorNumeric_MUMPS; 1532dcd589f8SShri Abhyankar F->ops->solve = MatSolve_MUMPS; 153351d5961aSHong Zhang F->ops->solvetranspose = MatSolve_MUMPS; 15344e34a73bSHong Zhang F->ops->matsolve = MatMatSolve_MUMPS; 15354e34a73bSHong Zhang #if defined(PETSC_USE_COMPLEX) 15360298fd71SBarry Smith F->ops->getinertia = NULL; 15374e34a73bSHong Zhang #else 15384e34a73bSHong Zhang F->ops->getinertia = MatGetInertia_SBAIJMUMPS; 1539db4efbfdSBarry Smith #endif 1540b24902e0SBarry Smith PetscFunctionReturn(0); 1541b24902e0SBarry Smith } 1542b24902e0SBarry Smith 1543397b6df1SKris Buschelman #undef __FUNCT__ 154464e6c443SBarry Smith #define __FUNCT__ "MatView_MUMPS" 154564e6c443SBarry Smith PetscErrorCode MatView_MUMPS(Mat A,PetscViewer viewer) 154674ed9c26SBarry Smith { 1547f6c57405SHong Zhang PetscErrorCode ierr; 154864e6c443SBarry Smith PetscBool iascii; 154964e6c443SBarry Smith PetscViewerFormat format; 1550a5e57a09SHong Zhang Mat_MUMPS *mumps=(Mat_MUMPS*)A->spptr; 1551f6c57405SHong Zhang 1552f6c57405SHong Zhang PetscFunctionBegin; 155364e6c443SBarry Smith /* check if matrix is mumps type */ 155464e6c443SBarry Smith if (A->ops->solve != MatSolve_MUMPS) PetscFunctionReturn(0); 155564e6c443SBarry Smith 1556251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 155764e6c443SBarry Smith if (iascii) { 155864e6c443SBarry Smith ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 155964e6c443SBarry Smith if (format == PETSC_VIEWER_ASCII_INFO) { 156064e6c443SBarry Smith ierr = PetscViewerASCIIPrintf(viewer,"MUMPS run parameters:\n");CHKERRQ(ierr); 1561a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," SYM (matrix type): %d \n",mumps->id.sym);CHKERRQ(ierr); 1562a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," PAR (host participation): %d \n",mumps->id.par);CHKERRQ(ierr); 1563a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(1) (output for error): %d \n",mumps->id.ICNTL(1));CHKERRQ(ierr); 1564a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(2) (output of diagnostic msg): %d \n",mumps->id.ICNTL(2));CHKERRQ(ierr); 1565a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(3) (output for global info): %d \n",mumps->id.ICNTL(3));CHKERRQ(ierr); 1566a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(4) (level of printing): %d \n",mumps->id.ICNTL(4));CHKERRQ(ierr); 1567a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(5) (input mat struct): %d \n",mumps->id.ICNTL(5));CHKERRQ(ierr); 1568a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(6) (matrix prescaling): %d \n",mumps->id.ICNTL(6));CHKERRQ(ierr); 1569a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(7) (sequentia matrix ordering):%d \n",mumps->id.ICNTL(7));CHKERRQ(ierr); 1570a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(8) (scalling strategy): %d \n",mumps->id.ICNTL(8));CHKERRQ(ierr); 1571a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(10) (max num of refinements): %d \n",mumps->id.ICNTL(10));CHKERRQ(ierr); 1572a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(11) (error analysis): %d \n",mumps->id.ICNTL(11));CHKERRQ(ierr); 1573a5e57a09SHong Zhang if (mumps->id.ICNTL(11)>0) { 1574a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(4) (inf norm of input mat): %g\n",mumps->id.RINFOG(4));CHKERRQ(ierr); 1575a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(5) (inf norm of solution): %g\n",mumps->id.RINFOG(5));CHKERRQ(ierr); 1576a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(6) (inf norm of residual): %g\n",mumps->id.RINFOG(6));CHKERRQ(ierr); 1577a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(7),RINFOG(8) (backward error est): %g, %g\n",mumps->id.RINFOG(7),mumps->id.RINFOG(8));CHKERRQ(ierr); 1578a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(9) (error estimate): %g \n",mumps->id.RINFOG(9));CHKERRQ(ierr); 1579a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(10),RINFOG(11)(condition numbers): %g, %g\n",mumps->id.RINFOG(10),mumps->id.RINFOG(11));CHKERRQ(ierr); 1580f6c57405SHong Zhang } 1581a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(12) (efficiency control): %d \n",mumps->id.ICNTL(12));CHKERRQ(ierr); 1582a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(13) (efficiency control): %d \n",mumps->id.ICNTL(13));CHKERRQ(ierr); 1583a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(14) (percentage of estimated workspace increase): %d \n",mumps->id.ICNTL(14));CHKERRQ(ierr); 1584f6c57405SHong Zhang /* ICNTL(15-17) not used */ 1585a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(18) (input mat struct): %d \n",mumps->id.ICNTL(18));CHKERRQ(ierr); 1586a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(19) (Shur complement info): %d \n",mumps->id.ICNTL(19));CHKERRQ(ierr); 1587a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(20) (rhs sparse pattern): %d \n",mumps->id.ICNTL(20));CHKERRQ(ierr); 1588ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," ICNTL(21) (solution struct): %d \n",mumps->id.ICNTL(21));CHKERRQ(ierr); 1589a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(22) (in-core/out-of-core facility): %d \n",mumps->id.ICNTL(22));CHKERRQ(ierr); 1590a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(23) (max size of memory can be allocated locally):%d \n",mumps->id.ICNTL(23));CHKERRQ(ierr); 1591c0165424SHong Zhang 1592a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(24) (detection of null pivot rows): %d \n",mumps->id.ICNTL(24));CHKERRQ(ierr); 1593a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(25) (computation of a null space basis): %d \n",mumps->id.ICNTL(25));CHKERRQ(ierr); 1594a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(26) (Schur options for rhs or solution): %d \n",mumps->id.ICNTL(26));CHKERRQ(ierr); 1595a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(27) (experimental parameter): %d \n",mumps->id.ICNTL(27));CHKERRQ(ierr); 1596a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(28) (use parallel or sequential ordering): %d \n",mumps->id.ICNTL(28));CHKERRQ(ierr); 1597a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(29) (parallel ordering): %d \n",mumps->id.ICNTL(29));CHKERRQ(ierr); 159842179a6aSHong Zhang 1599a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(30) (user-specified set of entries in inv(A)): %d \n",mumps->id.ICNTL(30));CHKERRQ(ierr); 1600a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(31) (factors is discarded in the solve phase): %d \n",mumps->id.ICNTL(31));CHKERRQ(ierr); 1601a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," ICNTL(33) (compute determinant): %d \n",mumps->id.ICNTL(33));CHKERRQ(ierr); 1602f6c57405SHong Zhang 1603a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(1) (relative pivoting threshold): %g \n",mumps->id.CNTL(1));CHKERRQ(ierr); 1604a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(2) (stopping criterion of refinement): %g \n",mumps->id.CNTL(2));CHKERRQ(ierr); 1605ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(3) (absolute pivoting threshold): %g \n",mumps->id.CNTL(3));CHKERRQ(ierr); 1606ca3dc52bSPierre Jolivet ierr = PetscViewerASCIIPrintf(viewer," CNTL(4) (value of static pivoting): %g \n",mumps->id.CNTL(4));CHKERRQ(ierr); 1607a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," CNTL(5) (fixation for null pivots): %g \n",mumps->id.CNTL(5));CHKERRQ(ierr); 1608f6c57405SHong Zhang 1609f6c57405SHong Zhang /* infomation local to each processor */ 161034ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(1) (local estimated flops for the elimination after analysis): \n");CHKERRQ(ierr); 16111575c14dSBarry Smith ierr = PetscViewerASCIIPushSynchronized(viewer);CHKERRQ(ierr); 1612a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(1));CHKERRQ(ierr); 161334ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 161434ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(2) (local estimated flops for the assembly after factorization): \n");CHKERRQ(ierr); 1615a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(2));CHKERRQ(ierr); 161634ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 161734ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " RINFO(3) (local estimated flops for the elimination after factorization): \n");CHKERRQ(ierr); 1618a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %g \n",mumps->myid,mumps->id.RINFO(3));CHKERRQ(ierr); 161934ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1620f6c57405SHong Zhang 162134ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(15) (estimated size of (in MB) MUMPS internal data for running numerical factorization): \n");CHKERRQ(ierr); 1622a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(15));CHKERRQ(ierr); 162334ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1624f6c57405SHong Zhang 162534ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(16) (size of (in MB) MUMPS internal data used during numerical factorization): \n");CHKERRQ(ierr); 1626a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(16));CHKERRQ(ierr); 162734ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1628f6c57405SHong Zhang 162934ed7027SBarry Smith ierr = PetscViewerASCIIPrintf(viewer, " INFO(23) (num of pivots eliminated on this processor after factorization): \n");CHKERRQ(ierr); 1630a5e57a09SHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(23));CHKERRQ(ierr); 163134ed7027SBarry Smith ierr = PetscViewerFlush(viewer); 1632b34f08ffSHong Zhang 1633b34f08ffSHong Zhang if (mumps->ninfo && mumps->ninfo <= 40){ 1634b34f08ffSHong Zhang PetscInt i; 1635b34f08ffSHong Zhang for (i=0; i<mumps->ninfo; i++){ 1636b34f08ffSHong Zhang ierr = PetscViewerASCIIPrintf(viewer, " INFO(%d): \n",mumps->info[i]);CHKERRQ(ierr); 1637b34f08ffSHong Zhang ierr = PetscViewerASCIISynchronizedPrintf(viewer," [%d] %d \n",mumps->myid,mumps->id.INFO(mumps->info[i]));CHKERRQ(ierr); 1638b34f08ffSHong Zhang ierr = PetscViewerFlush(viewer); 1639b34f08ffSHong Zhang } 1640b34f08ffSHong Zhang } 1641b34f08ffSHong Zhang 1642b34f08ffSHong Zhang 16431575c14dSBarry Smith ierr = PetscViewerASCIIPopSynchronized(viewer);CHKERRQ(ierr); 1644f6c57405SHong Zhang 1645a5e57a09SHong Zhang if (!mumps->myid) { /* information from the host */ 1646a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(1) (global estimated flops for the elimination after analysis): %g \n",mumps->id.RINFOG(1));CHKERRQ(ierr); 1647a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(2) (global estimated flops for the assembly after factorization): %g \n",mumps->id.RINFOG(2));CHKERRQ(ierr); 1648a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," RINFOG(3) (global estimated flops for the elimination after factorization): %g \n",mumps->id.RINFOG(3));CHKERRQ(ierr); 1649a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," (RINFOG(12) RINFOG(13))*2^INFOG(34) (determinant): (%g,%g)*(2^%d)\n",mumps->id.RINFOG(12),mumps->id.RINFOG(13),mumps->id.INFOG(34));CHKERRQ(ierr); 1650f6c57405SHong Zhang 1651a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(3) (estimated real workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(3));CHKERRQ(ierr); 1652a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(4) (estimated integer workspace for factors on all processors after analysis): %d \n",mumps->id.INFOG(4));CHKERRQ(ierr); 1653a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(5) (estimated maximum front size in the complete tree): %d \n",mumps->id.INFOG(5));CHKERRQ(ierr); 1654a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(6) (number of nodes in the complete tree): %d \n",mumps->id.INFOG(6));CHKERRQ(ierr); 1655a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(7) (ordering option effectively use after analysis): %d \n",mumps->id.INFOG(7));CHKERRQ(ierr); 1656a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(8) (structural symmetry in percent of the permuted matrix after analysis): %d \n",mumps->id.INFOG(8));CHKERRQ(ierr); 1657a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(9) (total real/complex workspace to store the matrix factors after factorization): %d \n",mumps->id.INFOG(9));CHKERRQ(ierr); 1658a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(10) (total integer space store the matrix factors after factorization): %d \n",mumps->id.INFOG(10));CHKERRQ(ierr); 1659a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(11) (order of largest frontal matrix after factorization): %d \n",mumps->id.INFOG(11));CHKERRQ(ierr); 1660a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(12) (number of off-diagonal pivots): %d \n",mumps->id.INFOG(12));CHKERRQ(ierr); 1661a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(13) (number of delayed pivots after factorization): %d \n",mumps->id.INFOG(13));CHKERRQ(ierr); 1662a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(14) (number of memory compress after factorization): %d \n",mumps->id.INFOG(14));CHKERRQ(ierr); 1663a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(15) (number of steps of iterative refinement after solution): %d \n",mumps->id.INFOG(15));CHKERRQ(ierr); 1664a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(16) (estimated size (in MB) of all MUMPS internal data for factorization after analysis: value on the most memory consuming processor): %d \n",mumps->id.INFOG(16));CHKERRQ(ierr); 1665a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(17) (estimated size of all MUMPS internal data for factorization after analysis: sum over all processors): %d \n",mumps->id.INFOG(17));CHKERRQ(ierr); 1666a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(18) (size of all MUMPS internal data allocated during factorization: value on the most memory consuming processor): %d \n",mumps->id.INFOG(18));CHKERRQ(ierr); 1667a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(19) (size of all MUMPS internal data allocated during factorization: sum over all processors): %d \n",mumps->id.INFOG(19));CHKERRQ(ierr); 1668a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(20) (estimated number of entries in the factors): %d \n",mumps->id.INFOG(20));CHKERRQ(ierr); 1669a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(21) (size in MB of memory effectively used during factorization - value on the most memory consuming processor): %d \n",mumps->id.INFOG(21));CHKERRQ(ierr); 1670a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(22) (size in MB of memory effectively used during factorization - sum over all processors): %d \n",mumps->id.INFOG(22));CHKERRQ(ierr); 1671a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(23) (after analysis: value of ICNTL(6) effectively used): %d \n",mumps->id.INFOG(23));CHKERRQ(ierr); 1672a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(24) (after analysis: value of ICNTL(12) effectively used): %d \n",mumps->id.INFOG(24));CHKERRQ(ierr); 1673a5e57a09SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(25) (after factorization: number of pivots modified by static pivoting): %d \n",mumps->id.INFOG(25));CHKERRQ(ierr); 167440d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(28) (after factorization: number of null pivots encountered): %d\n",mumps->id.INFOG(28));CHKERRQ(ierr); 167540d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(29) (after factorization: effective number of entries in the factors (sum over all processors)): %d\n",mumps->id.INFOG(29));CHKERRQ(ierr); 167640d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(30, 31) (after solution: size in Mbytes of memory used during solution phase): %d, %d\n",mumps->id.INFOG(30),mumps->id.INFOG(31));CHKERRQ(ierr); 167740d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(32) (after analysis: type of analysis done): %d\n",mumps->id.INFOG(32));CHKERRQ(ierr); 167840d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(33) (value used for ICNTL(8)): %d\n",mumps->id.INFOG(33));CHKERRQ(ierr); 167940d435e3SHong Zhang ierr = PetscViewerASCIIPrintf(viewer," INFOG(34) (exponent of the determinant if determinant is requested): %d\n",mumps->id.INFOG(34));CHKERRQ(ierr); 1680f6c57405SHong Zhang } 1681f6c57405SHong Zhang } 1682cb828f0fSHong Zhang } 1683f6c57405SHong Zhang PetscFunctionReturn(0); 1684f6c57405SHong Zhang } 1685f6c57405SHong Zhang 168635bd34faSBarry Smith #undef __FUNCT__ 168735bd34faSBarry Smith #define __FUNCT__ "MatGetInfo_MUMPS" 168835bd34faSBarry Smith PetscErrorCode MatGetInfo_MUMPS(Mat A,MatInfoType flag,MatInfo *info) 168935bd34faSBarry Smith { 1690cb828f0fSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)A->spptr; 169135bd34faSBarry Smith 169235bd34faSBarry Smith PetscFunctionBegin; 169335bd34faSBarry Smith info->block_size = 1.0; 1694cb828f0fSHong Zhang info->nz_allocated = mumps->id.INFOG(20); 1695cb828f0fSHong Zhang info->nz_used = mumps->id.INFOG(20); 169635bd34faSBarry Smith info->nz_unneeded = 0.0; 169735bd34faSBarry Smith info->assemblies = 0.0; 169835bd34faSBarry Smith info->mallocs = 0.0; 169935bd34faSBarry Smith info->memory = 0.0; 170035bd34faSBarry Smith info->fill_ratio_given = 0; 170135bd34faSBarry Smith info->fill_ratio_needed = 0; 170235bd34faSBarry Smith info->factor_mallocs = 0; 170335bd34faSBarry Smith PetscFunctionReturn(0); 170435bd34faSBarry Smith } 170535bd34faSBarry Smith 17065ccb76cbSHong Zhang /* -------------------------------------------------------------------------------------------*/ 17075ccb76cbSHong Zhang #undef __FUNCT__ 17088e7ba810SStefano Zampini #define __FUNCT__ "MatFactorSetSchurIS_MUMPS" 17098e7ba810SStefano Zampini PetscErrorCode MatFactorSetSchurIS_MUMPS(Mat F, IS is) 17106444a565SStefano Zampini { 17116444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17128e7ba810SStefano Zampini const PetscInt *idxs; 17138e7ba810SStefano Zampini PetscInt size,i; 17146444a565SStefano Zampini PetscErrorCode ierr; 17156444a565SStefano Zampini 17166444a565SStefano Zampini PetscFunctionBegin; 171759ac8732SStefano Zampini if (mumps->size > 1) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"MUMPS parallel Schur complements not yet supported from PETSc\n"); 17188e7ba810SStefano Zampini ierr = ISGetLocalSize(is,&size);CHKERRQ(ierr); 17196444a565SStefano Zampini if (mumps->id.size_schur != size) { 17206444a565SStefano Zampini ierr = PetscFree2(mumps->id.listvar_schur,mumps->id.schur);CHKERRQ(ierr); 17216444a565SStefano Zampini mumps->id.size_schur = size; 17226444a565SStefano Zampini mumps->id.schur_lld = size; 17236444a565SStefano Zampini ierr = PetscMalloc2(size,&mumps->id.listvar_schur,size*size,&mumps->id.schur);CHKERRQ(ierr); 17246444a565SStefano Zampini } 17258e7ba810SStefano Zampini ierr = ISGetIndices(is,&idxs);CHKERRQ(ierr); 17266444a565SStefano Zampini ierr = PetscMemcpy(mumps->id.listvar_schur,idxs,size*sizeof(PetscInt));CHKERRQ(ierr); 17278e7ba810SStefano Zampini /* MUMPS expects Fortran style indices */ 17288e7ba810SStefano Zampini for (i=0;i<size;i++) mumps->id.listvar_schur[i]++; 17298e7ba810SStefano Zampini ierr = ISRestoreIndices(is,&idxs);CHKERRQ(ierr); 173078a7176cSStefano Zampini if (size) { /* turn on Schur switch if we the set of indices is not empty */ 17316444a565SStefano Zampini if (F->factortype == MAT_FACTOR_LU) { 173259ac8732SStefano Zampini mumps->id.ICNTL(19) = 3; /* MUMPS returns full matrix */ 17336444a565SStefano Zampini } else { 173459ac8732SStefano Zampini mumps->id.ICNTL(19) = 2; /* MUMPS returns lower triangular part */ 17356444a565SStefano Zampini } 173659ac8732SStefano Zampini /* set a special value of ICNTL (not handled my MUMPS) to be used in the solve phase by PETSc */ 1737b5fa320bSStefano Zampini mumps->id.ICNTL(26) = -1; 173878a7176cSStefano Zampini } 17396444a565SStefano Zampini PetscFunctionReturn(0); 17406444a565SStefano Zampini } 17416444a565SStefano Zampini 17426444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 17436444a565SStefano Zampini #undef __FUNCT__ 17445a05ddb0SStefano Zampini #define __FUNCT__ "MatFactorCreateSchurComplement_MUMPS" 17455a05ddb0SStefano Zampini PetscErrorCode MatFactorCreateSchurComplement_MUMPS(Mat F,Mat* S) 17466444a565SStefano Zampini { 17476444a565SStefano Zampini Mat St; 17486444a565SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 17496444a565SStefano Zampini PetscScalar *array; 17506444a565SStefano Zampini #if defined(PETSC_USE_COMPLEX) 17518ac429a0SStefano Zampini PetscScalar im = PetscSqrtScalar((PetscScalar)-1.0); 17526444a565SStefano Zampini #endif 17536444a565SStefano Zampini PetscErrorCode ierr; 17546444a565SStefano Zampini 17556444a565SStefano Zampini PetscFunctionBegin; 17565a05ddb0SStefano Zampini if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatFactorSetSchurIS to enable it"); 17575a05ddb0SStefano Zampini else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatFactorSetSchurIS before"); 17586f3cc6f9SBarry Smith 17596444a565SStefano Zampini ierr = MatCreate(PetscObjectComm((PetscObject)F),&St);CHKERRQ(ierr); 17606444a565SStefano Zampini ierr = MatSetSizes(St,PETSC_DECIDE,PETSC_DECIDE,mumps->id.size_schur,mumps->id.size_schur);CHKERRQ(ierr); 17616444a565SStefano Zampini ierr = MatSetType(St,MATDENSE);CHKERRQ(ierr); 17626444a565SStefano Zampini ierr = MatSetUp(St);CHKERRQ(ierr); 17636444a565SStefano Zampini ierr = MatDenseGetArray(St,&array);CHKERRQ(ierr); 176459ac8732SStefano Zampini if (!mumps->sym) { /* MUMPS always return a full matrix */ 17656444a565SStefano Zampini if (mumps->id.ICNTL(19) == 1) { /* stored by rows */ 17666444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 17676444a565SStefano Zampini for (i=0;i<N;i++) { 17686444a565SStefano Zampini for (j=0;j<N;j++) { 17696444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 17706444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 17716444a565SStefano Zampini #else 17726444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 17736444a565SStefano Zampini #endif 17746444a565SStefano Zampini array[j*N+i] = val; 17756444a565SStefano Zampini } 17766444a565SStefano Zampini } 17776444a565SStefano Zampini } else { /* stored by columns */ 17786444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 17796444a565SStefano Zampini } 17806444a565SStefano Zampini } else { /* either full or lower-triangular (not packed) */ 17816444a565SStefano Zampini if (mumps->id.ICNTL(19) == 2) { /* lower triangular stored by columns */ 17826444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 17836444a565SStefano Zampini for (i=0;i<N;i++) { 17846444a565SStefano Zampini for (j=i;j<N;j++) { 17856444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 17866444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 17876444a565SStefano Zampini #else 17886444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 17896444a565SStefano Zampini #endif 17906444a565SStefano Zampini array[i*N+j] = val; 17916444a565SStefano Zampini array[j*N+i] = val; 17926444a565SStefano Zampini } 17936444a565SStefano Zampini } 17946444a565SStefano Zampini } else if (mumps->id.ICNTL(19) == 3) { /* full matrix */ 17956444a565SStefano Zampini ierr = PetscMemcpy(array,mumps->id.schur,mumps->id.size_schur*mumps->id.size_schur*sizeof(PetscScalar));CHKERRQ(ierr); 17966444a565SStefano Zampini } else { /* ICNTL(19) == 1 lower triangular stored by rows */ 17976444a565SStefano Zampini PetscInt i,j,N=mumps->id.size_schur; 17986444a565SStefano Zampini for (i=0;i<N;i++) { 17996444a565SStefano Zampini for (j=0;j<i+1;j++) { 18006444a565SStefano Zampini #if !defined(PETSC_USE_COMPLEX) 18016444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j]; 18026444a565SStefano Zampini #else 18036444a565SStefano Zampini PetscScalar val = mumps->id.schur[i*N+j].r + im*mumps->id.schur[i*N+j].i; 18046444a565SStefano Zampini #endif 18056444a565SStefano Zampini array[i*N+j] = val; 18066444a565SStefano Zampini array[j*N+i] = val; 18076444a565SStefano Zampini } 18086444a565SStefano Zampini } 18096444a565SStefano Zampini } 18106444a565SStefano Zampini } 18116444a565SStefano Zampini ierr = MatDenseRestoreArray(St,&array);CHKERRQ(ierr); 18126444a565SStefano Zampini *S = St; 18136444a565SStefano Zampini PetscFunctionReturn(0); 18146444a565SStefano Zampini } 18156444a565SStefano Zampini 181659ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 181759ac8732SStefano Zampini #undef __FUNCT__ 18185a05ddb0SStefano Zampini #define __FUNCT__ "MatFactorGetSchurComplement_MUMPS" 18195a05ddb0SStefano Zampini PetscErrorCode MatFactorGetSchurComplement_MUMPS(Mat F,Mat* S) 182059ac8732SStefano Zampini { 182159ac8732SStefano Zampini Mat St; 182259ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 182359ac8732SStefano Zampini PetscErrorCode ierr; 182459ac8732SStefano Zampini 182559ac8732SStefano Zampini PetscFunctionBegin; 18265a05ddb0SStefano Zampini if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatFactorSetSchurIS to enable it"); 18275a05ddb0SStefano Zampini else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatFactorSetSchurIS before"); 18286f3cc6f9SBarry Smith 18297bc32933SStefano Zampini /* It should be the responsibility of the user to handle different ICNTL(19) cases and factorization stages if they want to work with the raw data */ 183059ac8732SStefano Zampini ierr = MatCreateSeqDense(PetscObjectComm((PetscObject)F),mumps->id.size_schur,mumps->id.size_schur,(PetscScalar*)mumps->id.schur,&St);CHKERRQ(ierr); 183159ac8732SStefano Zampini *S = St; 183259ac8732SStefano Zampini PetscFunctionReturn(0); 183359ac8732SStefano Zampini } 183459ac8732SStefano Zampini 183559ac8732SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 183659ac8732SStefano Zampini #undef __FUNCT__ 18375a05ddb0SStefano Zampini #define __FUNCT__ "MatFactorInvertSchurComplement_MUMPS" 18385a05ddb0SStefano Zampini PetscErrorCode MatFactorInvertSchurComplement_MUMPS(Mat F) 183959ac8732SStefano Zampini { 184059ac8732SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 184159ac8732SStefano Zampini PetscErrorCode ierr; 184259ac8732SStefano Zampini 184359ac8732SStefano Zampini PetscFunctionBegin; 184459ac8732SStefano Zampini if (!mumps->id.ICNTL(19)) { /* do nothing */ 184559ac8732SStefano Zampini PetscFunctionReturn(0); 184659ac8732SStefano Zampini } 18475a05ddb0SStefano Zampini if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatFactorSetSchurIS before"); 184859ac8732SStefano Zampini ierr = MatMumpsInvertSchur_Private(mumps);CHKERRQ(ierr); 184959ac8732SStefano Zampini PetscFunctionReturn(0); 185059ac8732SStefano Zampini } 185159ac8732SStefano Zampini 18526444a565SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 18536444a565SStefano Zampini #undef __FUNCT__ 18545a05ddb0SStefano Zampini #define __FUNCT__ "MatFactorSolveSchurComplement_MUMPS" 18555a05ddb0SStefano Zampini PetscErrorCode MatFactorSolveSchurComplement_MUMPS(Mat F, Vec rhs, Vec sol) 1856e807eca7SStefano Zampini { 1857e807eca7SStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1858e807eca7SStefano Zampini MumpsScalar *orhs; 1859e807eca7SStefano Zampini PetscScalar *osol,*nrhs,*nsol; 18609a3a5937SStefano Zampini PetscInt orhs_size,osol_size,olrhs_size; 1861e807eca7SStefano Zampini PetscErrorCode ierr; 1862e807eca7SStefano Zampini 1863e807eca7SStefano Zampini PetscFunctionBegin; 18645a05ddb0SStefano Zampini if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatFactorSetSchurIS to enable it"); 18655a05ddb0SStefano Zampini if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatFactorSetSchurIS before"); 18666f3cc6f9SBarry Smith 1867e807eca7SStefano Zampini /* swap pointers */ 1868e807eca7SStefano Zampini orhs = mumps->id.redrhs; 18699a3a5937SStefano Zampini olrhs_size = mumps->id.lredrhs; 1870a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 1871e807eca7SStefano Zampini osol = mumps->schur_sol; 1872a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 1873e807eca7SStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 1874e807eca7SStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 1875e807eca7SStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 1876a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 18779a3a5937SStefano Zampini mumps->id.lredrhs = mumps->sizeredrhs; 1878e807eca7SStefano Zampini mumps->schur_sol = nsol; 1879a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 1880a12f35bfSStefano Zampini 1881e807eca7SStefano Zampini /* solve Schur complement */ 1882e807eca7SStefano Zampini mumps->id.nrhs = 1; 1883e807eca7SStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 1884e807eca7SStefano Zampini /* restore pointers */ 1885e807eca7SStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 1886e807eca7SStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 1887e807eca7SStefano Zampini mumps->id.redrhs = orhs; 18889a3a5937SStefano Zampini mumps->id.lredrhs = olrhs_size; 1889a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 1890e807eca7SStefano Zampini mumps->schur_sol = osol; 1891a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 1892e807eca7SStefano Zampini PetscFunctionReturn(0); 1893e807eca7SStefano Zampini } 1894e807eca7SStefano Zampini 18957404bcfbSStefano Zampini /* -------------------------------------------------------------------------------------------*/ 18967404bcfbSStefano Zampini #undef __FUNCT__ 18975a05ddb0SStefano Zampini #define __FUNCT__ "MatFactorSolveSchurComplementTranspose_MUMPS" 18985a05ddb0SStefano Zampini PetscErrorCode MatFactorSolveSchurComplementTranspose_MUMPS(Mat F, Vec rhs, Vec sol) 18997404bcfbSStefano Zampini { 19007404bcfbSStefano Zampini Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 19017404bcfbSStefano Zampini MumpsScalar *orhs; 19027404bcfbSStefano Zampini PetscScalar *osol,*nrhs,*nsol; 1903a12f35bfSStefano Zampini PetscInt orhs_size,osol_size; 19047404bcfbSStefano Zampini PetscErrorCode ierr; 19057404bcfbSStefano Zampini 19067404bcfbSStefano Zampini PetscFunctionBegin; 19075a05ddb0SStefano Zampini if (!mumps->id.ICNTL(19)) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur complement mode not selected! You should call MatFactorSetSchurIS to enable it"); 19085a05ddb0SStefano Zampini else if (!mumps->id.size_schur) SETERRQ(PetscObjectComm((PetscObject)F),PETSC_ERR_ORDER,"Schur indices not set! You should call MatFactorSetSchurIS before"); 19096f3cc6f9SBarry Smith 19107404bcfbSStefano Zampini /* swap pointers */ 19117404bcfbSStefano Zampini orhs = mumps->id.redrhs; 1912a12f35bfSStefano Zampini orhs_size = mumps->sizeredrhs; 19137404bcfbSStefano Zampini osol = mumps->schur_sol; 1914a12f35bfSStefano Zampini osol_size = mumps->schur_sizesol; 19157404bcfbSStefano Zampini ierr = VecGetArray(rhs,&nrhs);CHKERRQ(ierr); 19167404bcfbSStefano Zampini ierr = VecGetArray(sol,&nsol);CHKERRQ(ierr); 19177404bcfbSStefano Zampini mumps->id.redrhs = (MumpsScalar*)nrhs; 1918a12f35bfSStefano Zampini ierr = VecGetLocalSize(rhs,&mumps->sizeredrhs);CHKERRQ(ierr); 19197404bcfbSStefano Zampini mumps->schur_sol = nsol; 1920a12f35bfSStefano Zampini ierr = VecGetLocalSize(sol,&mumps->schur_sizesol);CHKERRQ(ierr); 1921a12f35bfSStefano Zampini 19227404bcfbSStefano Zampini /* solve Schur complement */ 19237404bcfbSStefano Zampini mumps->id.nrhs = 1; 19247404bcfbSStefano Zampini mumps->id.ICNTL(9) = 0; 19257404bcfbSStefano Zampini ierr = MatMumpsSolveSchur_Private(mumps,PETSC_FALSE);CHKERRQ(ierr); 19267404bcfbSStefano Zampini mumps->id.ICNTL(9) = 1; 19277404bcfbSStefano Zampini /* restore pointers */ 19287404bcfbSStefano Zampini ierr = VecRestoreArray(rhs,&nrhs);CHKERRQ(ierr); 19297404bcfbSStefano Zampini ierr = VecRestoreArray(sol,&nsol);CHKERRQ(ierr); 19307404bcfbSStefano Zampini mumps->id.redrhs = orhs; 1931a12f35bfSStefano Zampini mumps->sizeredrhs = orhs_size; 19327404bcfbSStefano Zampini mumps->schur_sol = osol; 1933a12f35bfSStefano Zampini mumps->schur_sizesol = osol_size; 19347404bcfbSStefano Zampini PetscFunctionReturn(0); 19357404bcfbSStefano Zampini } 19367404bcfbSStefano Zampini 1937e807eca7SStefano Zampini /* -------------------------------------------------------------------------------------------*/ 1938e807eca7SStefano Zampini #undef __FUNCT__ 19395ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl_MUMPS" 19405ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt ival) 19415ccb76cbSHong Zhang { 1942a5e57a09SHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 19435ccb76cbSHong Zhang 19445ccb76cbSHong Zhang PetscFunctionBegin; 1945a5e57a09SHong Zhang mumps->id.ICNTL(icntl) = ival; 19465ccb76cbSHong Zhang PetscFunctionReturn(0); 19475ccb76cbSHong Zhang } 19485ccb76cbSHong Zhang 19495ccb76cbSHong Zhang #undef __FUNCT__ 1950bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl_MUMPS" 1951bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl_MUMPS(Mat F,PetscInt icntl,PetscInt *ival) 1952bc6112feSHong Zhang { 1953bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 1954bc6112feSHong Zhang 1955bc6112feSHong Zhang PetscFunctionBegin; 1956bc6112feSHong Zhang *ival = mumps->id.ICNTL(icntl); 1957bc6112feSHong Zhang PetscFunctionReturn(0); 1958bc6112feSHong Zhang } 1959bc6112feSHong Zhang 1960bc6112feSHong Zhang #undef __FUNCT__ 19615ccb76cbSHong Zhang #define __FUNCT__ "MatMumpsSetIcntl" 19625ccb76cbSHong Zhang /*@ 19635ccb76cbSHong Zhang MatMumpsSetIcntl - Set MUMPS parameter ICNTL() 19645ccb76cbSHong Zhang 19655ccb76cbSHong Zhang Logically Collective on Mat 19665ccb76cbSHong Zhang 19675ccb76cbSHong Zhang Input Parameters: 19685ccb76cbSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 19695ccb76cbSHong Zhang . icntl - index of MUMPS parameter array ICNTL() 19705ccb76cbSHong Zhang - ival - value of MUMPS ICNTL(icntl) 19715ccb76cbSHong Zhang 19725ccb76cbSHong Zhang Options Database: 19735ccb76cbSHong Zhang . -mat_mumps_icntl_<icntl> <ival> 19745ccb76cbSHong Zhang 19755ccb76cbSHong Zhang Level: beginner 19765ccb76cbSHong Zhang 19775ccb76cbSHong Zhang References: MUMPS Users' Guide 19785ccb76cbSHong Zhang 19795ccb76cbSHong Zhang .seealso: MatGetFactor() 19805ccb76cbSHong Zhang @*/ 19815ccb76cbSHong Zhang PetscErrorCode MatMumpsSetIcntl(Mat F,PetscInt icntl,PetscInt ival) 19825ccb76cbSHong Zhang { 19835ccb76cbSHong Zhang PetscErrorCode ierr; 19845ccb76cbSHong Zhang 19855ccb76cbSHong Zhang PetscFunctionBegin; 19865ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 19875ccb76cbSHong Zhang PetscValidLogicalCollectiveInt(F,ival,3); 19885ccb76cbSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetIcntl_C",(Mat,PetscInt,PetscInt),(F,icntl,ival));CHKERRQ(ierr); 19895ccb76cbSHong Zhang PetscFunctionReturn(0); 19905ccb76cbSHong Zhang } 19915ccb76cbSHong Zhang 1992bc6112feSHong Zhang #undef __FUNCT__ 1993bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetIcntl" 1994a21f80fcSHong Zhang /*@ 1995a21f80fcSHong Zhang MatMumpsGetIcntl - Get MUMPS parameter ICNTL() 1996a21f80fcSHong Zhang 1997a21f80fcSHong Zhang Logically Collective on Mat 1998a21f80fcSHong Zhang 1999a21f80fcSHong Zhang Input Parameters: 2000a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2001a21f80fcSHong Zhang - icntl - index of MUMPS parameter array ICNTL() 2002a21f80fcSHong Zhang 2003a21f80fcSHong Zhang Output Parameter: 2004a21f80fcSHong Zhang . ival - value of MUMPS ICNTL(icntl) 2005a21f80fcSHong Zhang 2006a21f80fcSHong Zhang Level: beginner 2007a21f80fcSHong Zhang 2008a21f80fcSHong Zhang References: MUMPS Users' Guide 2009a21f80fcSHong Zhang 2010a21f80fcSHong Zhang .seealso: MatGetFactor() 2011a21f80fcSHong Zhang @*/ 2012bc6112feSHong Zhang PetscErrorCode MatMumpsGetIcntl(Mat F,PetscInt icntl,PetscInt *ival) 2013bc6112feSHong Zhang { 2014bc6112feSHong Zhang PetscErrorCode ierr; 2015bc6112feSHong Zhang 2016bc6112feSHong Zhang PetscFunctionBegin; 2017bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2018bc6112feSHong Zhang PetscValidIntPointer(ival,3); 2019bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetIcntl_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2020bc6112feSHong Zhang PetscFunctionReturn(0); 2021bc6112feSHong Zhang } 2022bc6112feSHong Zhang 20238928b65cSHong Zhang /* -------------------------------------------------------------------------------------------*/ 20248928b65cSHong Zhang #undef __FUNCT__ 20258928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl_MUMPS" 20268928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal val) 20278928b65cSHong Zhang { 20288928b65cSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 20298928b65cSHong Zhang 20308928b65cSHong Zhang PetscFunctionBegin; 20318928b65cSHong Zhang mumps->id.CNTL(icntl) = val; 20328928b65cSHong Zhang PetscFunctionReturn(0); 20338928b65cSHong Zhang } 20348928b65cSHong Zhang 20358928b65cSHong Zhang #undef __FUNCT__ 2036bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl_MUMPS" 2037bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl_MUMPS(Mat F,PetscInt icntl,PetscReal *val) 2038bc6112feSHong Zhang { 2039bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2040bc6112feSHong Zhang 2041bc6112feSHong Zhang PetscFunctionBegin; 2042bc6112feSHong Zhang *val = mumps->id.CNTL(icntl); 2043bc6112feSHong Zhang PetscFunctionReturn(0); 2044bc6112feSHong Zhang } 2045bc6112feSHong Zhang 2046bc6112feSHong Zhang #undef __FUNCT__ 20478928b65cSHong Zhang #define __FUNCT__ "MatMumpsSetCntl" 20488928b65cSHong Zhang /*@ 20498928b65cSHong Zhang MatMumpsSetCntl - Set MUMPS parameter CNTL() 20508928b65cSHong Zhang 20518928b65cSHong Zhang Logically Collective on Mat 20528928b65cSHong Zhang 20538928b65cSHong Zhang Input Parameters: 20548928b65cSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 20558928b65cSHong Zhang . icntl - index of MUMPS parameter array CNTL() 20568928b65cSHong Zhang - val - value of MUMPS CNTL(icntl) 20578928b65cSHong Zhang 20588928b65cSHong Zhang Options Database: 20598928b65cSHong Zhang . -mat_mumps_cntl_<icntl> <val> 20608928b65cSHong Zhang 20618928b65cSHong Zhang Level: beginner 20628928b65cSHong Zhang 20638928b65cSHong Zhang References: MUMPS Users' Guide 20648928b65cSHong Zhang 20658928b65cSHong Zhang .seealso: MatGetFactor() 20668928b65cSHong Zhang @*/ 20678928b65cSHong Zhang PetscErrorCode MatMumpsSetCntl(Mat F,PetscInt icntl,PetscReal val) 20688928b65cSHong Zhang { 20698928b65cSHong Zhang PetscErrorCode ierr; 20708928b65cSHong Zhang 20718928b65cSHong Zhang PetscFunctionBegin; 20728928b65cSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2073bc6112feSHong Zhang PetscValidLogicalCollectiveReal(F,val,3); 20748928b65cSHong Zhang ierr = PetscTryMethod(F,"MatMumpsSetCntl_C",(Mat,PetscInt,PetscReal),(F,icntl,val));CHKERRQ(ierr); 20758928b65cSHong Zhang PetscFunctionReturn(0); 20768928b65cSHong Zhang } 20778928b65cSHong Zhang 2078bc6112feSHong Zhang #undef __FUNCT__ 2079bc6112feSHong Zhang #define __FUNCT__ "MatMumpsGetCntl" 2080a21f80fcSHong Zhang /*@ 2081a21f80fcSHong Zhang MatMumpsGetCntl - Get MUMPS parameter CNTL() 2082a21f80fcSHong Zhang 2083a21f80fcSHong Zhang Logically Collective on Mat 2084a21f80fcSHong Zhang 2085a21f80fcSHong Zhang Input Parameters: 2086a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2087a21f80fcSHong Zhang - icntl - index of MUMPS parameter array CNTL() 2088a21f80fcSHong Zhang 2089a21f80fcSHong Zhang Output Parameter: 2090a21f80fcSHong Zhang . val - value of MUMPS CNTL(icntl) 2091a21f80fcSHong Zhang 2092a21f80fcSHong Zhang Level: beginner 2093a21f80fcSHong Zhang 2094a21f80fcSHong Zhang References: MUMPS Users' Guide 2095a21f80fcSHong Zhang 2096a21f80fcSHong Zhang .seealso: MatGetFactor() 2097a21f80fcSHong Zhang @*/ 2098bc6112feSHong Zhang PetscErrorCode MatMumpsGetCntl(Mat F,PetscInt icntl,PetscReal *val) 2099bc6112feSHong Zhang { 2100bc6112feSHong Zhang PetscErrorCode ierr; 2101bc6112feSHong Zhang 2102bc6112feSHong Zhang PetscFunctionBegin; 2103bc6112feSHong Zhang PetscValidLogicalCollectiveInt(F,icntl,2); 2104bc6112feSHong Zhang PetscValidRealPointer(val,3); 2105bc6112feSHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetCntl_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2106bc6112feSHong Zhang PetscFunctionReturn(0); 2107bc6112feSHong Zhang } 2108bc6112feSHong Zhang 2109bc6112feSHong Zhang #undef __FUNCT__ 2110ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo_MUMPS" 2111ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo_MUMPS(Mat F,PetscInt icntl,PetscInt *info) 2112bc6112feSHong Zhang { 2113bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2114bc6112feSHong Zhang 2115bc6112feSHong Zhang PetscFunctionBegin; 2116bc6112feSHong Zhang *info = mumps->id.INFO(icntl); 2117bc6112feSHong Zhang PetscFunctionReturn(0); 2118bc6112feSHong Zhang } 2119bc6112feSHong Zhang 2120bc6112feSHong Zhang #undef __FUNCT__ 2121ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog_MUMPS" 2122ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog_MUMPS(Mat F,PetscInt icntl,PetscInt *infog) 2123bc6112feSHong Zhang { 2124bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2125bc6112feSHong Zhang 2126bc6112feSHong Zhang PetscFunctionBegin; 2127bc6112feSHong Zhang *infog = mumps->id.INFOG(icntl); 2128bc6112feSHong Zhang PetscFunctionReturn(0); 2129bc6112feSHong Zhang } 2130bc6112feSHong Zhang 2131bc6112feSHong Zhang #undef __FUNCT__ 2132ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo_MUMPS" 2133ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfo) 2134bc6112feSHong Zhang { 2135bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2136bc6112feSHong Zhang 2137bc6112feSHong Zhang PetscFunctionBegin; 2138bc6112feSHong Zhang *rinfo = mumps->id.RINFO(icntl); 2139bc6112feSHong Zhang PetscFunctionReturn(0); 2140bc6112feSHong Zhang } 2141bc6112feSHong Zhang 2142bc6112feSHong Zhang #undef __FUNCT__ 2143ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog_MUMPS" 2144ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog_MUMPS(Mat F,PetscInt icntl,PetscReal *rinfog) 2145bc6112feSHong Zhang { 2146bc6112feSHong Zhang Mat_MUMPS *mumps =(Mat_MUMPS*)F->spptr; 2147bc6112feSHong Zhang 2148bc6112feSHong Zhang PetscFunctionBegin; 2149bc6112feSHong Zhang *rinfog = mumps->id.RINFOG(icntl); 2150bc6112feSHong Zhang PetscFunctionReturn(0); 2151bc6112feSHong Zhang } 2152bc6112feSHong Zhang 2153bc6112feSHong Zhang #undef __FUNCT__ 2154ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfo" 2155a21f80fcSHong Zhang /*@ 2156a21f80fcSHong Zhang MatMumpsGetInfo - Get MUMPS parameter INFO() 2157a21f80fcSHong Zhang 2158a21f80fcSHong Zhang Logically Collective on Mat 2159a21f80fcSHong Zhang 2160a21f80fcSHong Zhang Input Parameters: 2161a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2162a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFO() 2163a21f80fcSHong Zhang 2164a21f80fcSHong Zhang Output Parameter: 2165a21f80fcSHong Zhang . ival - value of MUMPS INFO(icntl) 2166a21f80fcSHong Zhang 2167a21f80fcSHong Zhang Level: beginner 2168a21f80fcSHong Zhang 2169a21f80fcSHong Zhang References: MUMPS Users' Guide 2170a21f80fcSHong Zhang 2171a21f80fcSHong Zhang .seealso: MatGetFactor() 2172a21f80fcSHong Zhang @*/ 2173ca810319SHong Zhang PetscErrorCode MatMumpsGetInfo(Mat F,PetscInt icntl,PetscInt *ival) 2174bc6112feSHong Zhang { 2175bc6112feSHong Zhang PetscErrorCode ierr; 2176bc6112feSHong Zhang 2177bc6112feSHong Zhang PetscFunctionBegin; 2178ca810319SHong Zhang PetscValidIntPointer(ival,3); 2179ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfo_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2180bc6112feSHong Zhang PetscFunctionReturn(0); 2181bc6112feSHong Zhang } 2182bc6112feSHong Zhang 2183bc6112feSHong Zhang #undef __FUNCT__ 2184ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetInfog" 2185a21f80fcSHong Zhang /*@ 2186a21f80fcSHong Zhang MatMumpsGetInfog - Get MUMPS parameter INFOG() 2187a21f80fcSHong Zhang 2188a21f80fcSHong Zhang Logically Collective on Mat 2189a21f80fcSHong Zhang 2190a21f80fcSHong Zhang Input Parameters: 2191a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2192a21f80fcSHong Zhang - icntl - index of MUMPS parameter array INFOG() 2193a21f80fcSHong Zhang 2194a21f80fcSHong Zhang Output Parameter: 2195a21f80fcSHong Zhang . ival - value of MUMPS INFOG(icntl) 2196a21f80fcSHong Zhang 2197a21f80fcSHong Zhang Level: beginner 2198a21f80fcSHong Zhang 2199a21f80fcSHong Zhang References: MUMPS Users' Guide 2200a21f80fcSHong Zhang 2201a21f80fcSHong Zhang .seealso: MatGetFactor() 2202a21f80fcSHong Zhang @*/ 2203ca810319SHong Zhang PetscErrorCode MatMumpsGetInfog(Mat F,PetscInt icntl,PetscInt *ival) 2204bc6112feSHong Zhang { 2205bc6112feSHong Zhang PetscErrorCode ierr; 2206bc6112feSHong Zhang 2207bc6112feSHong Zhang PetscFunctionBegin; 2208ca810319SHong Zhang PetscValidIntPointer(ival,3); 2209ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetInfog_C",(Mat,PetscInt,PetscInt*),(F,icntl,ival));CHKERRQ(ierr); 2210bc6112feSHong Zhang PetscFunctionReturn(0); 2211bc6112feSHong Zhang } 2212bc6112feSHong Zhang 2213bc6112feSHong Zhang #undef __FUNCT__ 2214ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfo" 2215a21f80fcSHong Zhang /*@ 2216a21f80fcSHong Zhang MatMumpsGetRinfo - Get MUMPS parameter RINFO() 2217a21f80fcSHong Zhang 2218a21f80fcSHong Zhang Logically Collective on Mat 2219a21f80fcSHong Zhang 2220a21f80fcSHong Zhang Input Parameters: 2221a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2222a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFO() 2223a21f80fcSHong Zhang 2224a21f80fcSHong Zhang Output Parameter: 2225a21f80fcSHong Zhang . val - value of MUMPS RINFO(icntl) 2226a21f80fcSHong Zhang 2227a21f80fcSHong Zhang Level: beginner 2228a21f80fcSHong Zhang 2229a21f80fcSHong Zhang References: MUMPS Users' Guide 2230a21f80fcSHong Zhang 2231a21f80fcSHong Zhang .seealso: MatGetFactor() 2232a21f80fcSHong Zhang @*/ 2233ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfo(Mat F,PetscInt icntl,PetscReal *val) 2234bc6112feSHong Zhang { 2235bc6112feSHong Zhang PetscErrorCode ierr; 2236bc6112feSHong Zhang 2237bc6112feSHong Zhang PetscFunctionBegin; 2238bc6112feSHong Zhang PetscValidRealPointer(val,3); 2239ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfo_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2240bc6112feSHong Zhang PetscFunctionReturn(0); 2241bc6112feSHong Zhang } 2242bc6112feSHong Zhang 2243bc6112feSHong Zhang #undef __FUNCT__ 2244ca810319SHong Zhang #define __FUNCT__ "MatMumpsGetRinfog" 2245a21f80fcSHong Zhang /*@ 2246a21f80fcSHong Zhang MatMumpsGetRinfog - Get MUMPS parameter RINFOG() 2247a21f80fcSHong Zhang 2248a21f80fcSHong Zhang Logically Collective on Mat 2249a21f80fcSHong Zhang 2250a21f80fcSHong Zhang Input Parameters: 2251a21f80fcSHong Zhang + F - the factored matrix obtained by calling MatGetFactor() from PETSc-MUMPS interface 2252a21f80fcSHong Zhang - icntl - index of MUMPS parameter array RINFOG() 2253a21f80fcSHong Zhang 2254a21f80fcSHong Zhang Output Parameter: 2255a21f80fcSHong Zhang . val - value of MUMPS RINFOG(icntl) 2256a21f80fcSHong Zhang 2257a21f80fcSHong Zhang Level: beginner 2258a21f80fcSHong Zhang 2259a21f80fcSHong Zhang References: MUMPS Users' Guide 2260a21f80fcSHong Zhang 2261a21f80fcSHong Zhang .seealso: MatGetFactor() 2262a21f80fcSHong Zhang @*/ 2263ca810319SHong Zhang PetscErrorCode MatMumpsGetRinfog(Mat F,PetscInt icntl,PetscReal *val) 2264bc6112feSHong Zhang { 2265bc6112feSHong Zhang PetscErrorCode ierr; 2266bc6112feSHong Zhang 2267bc6112feSHong Zhang PetscFunctionBegin; 2268bc6112feSHong Zhang PetscValidRealPointer(val,3); 2269ca810319SHong Zhang ierr = PetscTryMethod(F,"MatMumpsGetRinfog_C",(Mat,PetscInt,PetscReal*),(F,icntl,val));CHKERRQ(ierr); 2270bc6112feSHong Zhang PetscFunctionReturn(0); 2271bc6112feSHong Zhang } 2272bc6112feSHong Zhang 227324b6179bSKris Buschelman /*MC 22742692d6eeSBarry Smith MATSOLVERMUMPS - A matrix type providing direct solvers (LU and Cholesky) for 227524b6179bSKris Buschelman distributed and sequential matrices via the external package MUMPS. 227624b6179bSKris Buschelman 227741c8de11SBarry Smith Works with MATAIJ and MATSBAIJ matrices 227824b6179bSKris Buschelman 2279c2b89b5dSBarry Smith Use ./configure --download-mumps --download-scalapack --download-parmetis --download-metis --download-ptscotch to have PETSc installed with MUMPS 2280c2b89b5dSBarry Smith 2281c2b89b5dSBarry Smith Use -pc_type cholesky or lu -pc_factor_mat_solver_package mumps to us this direct solver 2282c2b89b5dSBarry Smith 228324b6179bSKris Buschelman Options Database Keys: 22844e34a73bSHong Zhang + -mat_mumps_icntl_1 <6>: ICNTL(1): output stream for error messages (None) 22854e34a73bSHong Zhang . -mat_mumps_icntl_2 <0>: ICNTL(2): output stream for diagnostic printing, statistics, and warning (None) 22864e34a73bSHong Zhang . -mat_mumps_icntl_3 <0>: ICNTL(3): output stream for global information, collected on the host (None) 22874e34a73bSHong Zhang . -mat_mumps_icntl_4 <0>: ICNTL(4): level of printing (0 to 4) (None) 22884e34a73bSHong Zhang . -mat_mumps_icntl_6 <7>: ICNTL(6): permutes to a zero-free diagonal and/or scale the matrix (0 to 7) (None) 22894e34a73bSHong Zhang . -mat_mumps_icntl_7 <7>: ICNTL(7): computes a symmetric permutation in sequential analysis (0 to 7). 3=Scotch, 4=PORD, 5=Metis (None) 22904e34a73bSHong Zhang . -mat_mumps_icntl_8 <77>: ICNTL(8): scaling strategy (-2 to 8 or 77) (None) 22914e34a73bSHong Zhang . -mat_mumps_icntl_10 <0>: ICNTL(10): max num of refinements (None) 22924e34a73bSHong Zhang . -mat_mumps_icntl_11 <0>: ICNTL(11): statistics related to an error analysis (via -ksp_view) (None) 22934e34a73bSHong Zhang . -mat_mumps_icntl_12 <1>: ICNTL(12): an ordering strategy for symmetric matrices (0 to 3) (None) 22944e34a73bSHong Zhang . -mat_mumps_icntl_13 <0>: ICNTL(13): parallelism of the root node (enable ScaLAPACK) and its splitting (None) 22954e34a73bSHong Zhang . -mat_mumps_icntl_14 <20>: ICNTL(14): percentage increase in the estimated working space (None) 22964e34a73bSHong Zhang . -mat_mumps_icntl_19 <0>: ICNTL(19): computes the Schur complement (None) 22974e34a73bSHong Zhang . -mat_mumps_icntl_22 <0>: ICNTL(22): in-core/out-of-core factorization and solve (0 or 1) (None) 22984e34a73bSHong Zhang . -mat_mumps_icntl_23 <0>: ICNTL(23): max size of the working memory (MB) that can allocate per processor (None) 22994e34a73bSHong Zhang . -mat_mumps_icntl_24 <0>: ICNTL(24): detection of null pivot rows (0 or 1) (None) 23004e34a73bSHong Zhang . -mat_mumps_icntl_25 <0>: ICNTL(25): compute a solution of a deficient matrix and a null space basis (None) 23014e34a73bSHong Zhang . -mat_mumps_icntl_26 <0>: ICNTL(26): drives the solution phase if a Schur complement matrix (None) 23024e34a73bSHong Zhang . -mat_mumps_icntl_28 <1>: ICNTL(28): use 1 for sequential analysis and ictnl(7) ordering, or 2 for parallel analysis and ictnl(29) ordering (None) 23034e34a73bSHong Zhang . -mat_mumps_icntl_29 <0>: ICNTL(29): parallel ordering 1 = ptscotch, 2 = parmetis (None) 23044e34a73bSHong Zhang . -mat_mumps_icntl_30 <0>: ICNTL(30): compute user-specified set of entries in inv(A) (None) 23054e34a73bSHong Zhang . -mat_mumps_icntl_31 <0>: ICNTL(31): indicates which factors may be discarded during factorization (None) 23064e34a73bSHong Zhang . -mat_mumps_icntl_33 <0>: ICNTL(33): compute determinant (None) 23074e34a73bSHong Zhang . -mat_mumps_cntl_1 <0.01>: CNTL(1): relative pivoting threshold (None) 23084e34a73bSHong Zhang . -mat_mumps_cntl_2 <1.49012e-08>: CNTL(2): stopping criterion of refinement (None) 23094e34a73bSHong Zhang . -mat_mumps_cntl_3 <0>: CNTL(3): absolute pivoting threshold (None) 23104e34a73bSHong Zhang . -mat_mumps_cntl_4 <-1>: CNTL(4): value for static pivoting (None) 23114e34a73bSHong Zhang - -mat_mumps_cntl_5 <0>: CNTL(5): fixation for null pivots (None) 231224b6179bSKris Buschelman 231324b6179bSKris Buschelman Level: beginner 231424b6179bSKris Buschelman 231541c8de11SBarry Smith .seealso: PCFactorSetMatSolverPackage(), MatSolverPackage 231641c8de11SBarry Smith 231724b6179bSKris Buschelman M*/ 231824b6179bSKris Buschelman 231935bd34faSBarry Smith #undef __FUNCT__ 232035bd34faSBarry Smith #define __FUNCT__ "MatFactorGetSolverPackage_mumps" 2321f7a08781SBarry Smith static PetscErrorCode MatFactorGetSolverPackage_mumps(Mat A,const MatSolverPackage *type) 232235bd34faSBarry Smith { 232335bd34faSBarry Smith PetscFunctionBegin; 23242692d6eeSBarry Smith *type = MATSOLVERMUMPS; 232535bd34faSBarry Smith PetscFunctionReturn(0); 232635bd34faSBarry Smith } 232735bd34faSBarry Smith 2328bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI AIJ matrices */ 23292877fffaSHong Zhang #undef __FUNCT__ 2330bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_aij_mumps" 23318cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat A,MatFactorType ftype,Mat *F) 23322877fffaSHong Zhang { 23332877fffaSHong Zhang Mat B; 23342877fffaSHong Zhang PetscErrorCode ierr; 23352877fffaSHong Zhang Mat_MUMPS *mumps; 2336ace3abfcSBarry Smith PetscBool isSeqAIJ; 23372877fffaSHong Zhang 23382877fffaSHong Zhang PetscFunctionBegin; 23392877fffaSHong Zhang /* Create the factorization matrix */ 2340251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQAIJ,&isSeqAIJ);CHKERRQ(ierr); 2341ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 23422877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 23432877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2344bccb9932SShri Abhyankar if (isSeqAIJ) { 23450298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(B,0,NULL);CHKERRQ(ierr); 2346bccb9932SShri Abhyankar } else { 23470298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(B,0,NULL,0,NULL);CHKERRQ(ierr); 2348bccb9932SShri Abhyankar } 23492877fffaSHong Zhang 2350b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 23512205254eSKarl Rupp 23522877fffaSHong Zhang B->ops->view = MatView_MUMPS; 235335bd34faSBarry Smith B->ops->getinfo = MatGetInfo_MUMPS; 235420be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 23552205254eSKarl Rupp 2356bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 23575a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSetSchurIS_C",MatFactorSetSchurIS_MUMPS);CHKERRQ(ierr); 23585a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorInvertSchurComplement_C",MatFactorInvertSchurComplement_MUMPS);CHKERRQ(ierr); 23595a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorCreateSchurComplement_C",MatFactorCreateSchurComplement_MUMPS);CHKERRQ(ierr); 23605a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSchurComplement_C",MatFactorGetSchurComplement_MUMPS);CHKERRQ(ierr); 23615a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplement_C",MatFactorSolveSchurComplement_MUMPS);CHKERRQ(ierr); 23625a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplementTranspose_C",MatFactorSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2363bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2364bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2365bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2366bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2367ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2368ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2369ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2370ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 23716444a565SStefano Zampini 2372450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2373450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_AIJMUMPS; 2374d5f3da31SBarry Smith B->factortype = MAT_FACTOR_LU; 2375bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqaij; 2376bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpiaij; 2377746480a1SHong Zhang mumps->sym = 0; 2378dcd589f8SShri Abhyankar } else { 237967877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2380450b117fSShri Abhyankar B->factortype = MAT_FACTOR_CHOLESKY; 2381bccb9932SShri Abhyankar if (isSeqAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqaij_seqsbaij; 2382bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpiaij_mpisbaij; 238359ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 238459ac8732SStefano Zampini mumps->sym = 2; 238559ac8732SStefano Zampini #else 23866fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 23876fdc2a6dSBarry Smith else mumps->sym = 2; 238859ac8732SStefano Zampini #endif 2389450b117fSShri Abhyankar } 23902877fffaSHong Zhang 23912877fffaSHong Zhang mumps->isAIJ = PETSC_TRUE; 2392bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 23932877fffaSHong Zhang B->ops->destroy = MatDestroy_MUMPS; 23942877fffaSHong Zhang B->spptr = (void*)mumps; 23952205254eSKarl Rupp 2396f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2397746480a1SHong Zhang 23982877fffaSHong Zhang *F = B; 23992877fffaSHong Zhang PetscFunctionReturn(0); 24002877fffaSHong Zhang } 24012877fffaSHong Zhang 2402bccb9932SShri Abhyankar /* MatGetFactor for Seq and MPI SBAIJ matrices */ 24032877fffaSHong Zhang #undef __FUNCT__ 2404bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_sbaij_mumps" 24058cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat A,MatFactorType ftype,Mat *F) 24062877fffaSHong Zhang { 24072877fffaSHong Zhang Mat B; 24082877fffaSHong Zhang PetscErrorCode ierr; 24092877fffaSHong Zhang Mat_MUMPS *mumps; 2410ace3abfcSBarry Smith PetscBool isSeqSBAIJ; 24112877fffaSHong Zhang 24122877fffaSHong Zhang PetscFunctionBegin; 2413ce94432eSBarry Smith if (ftype != MAT_FACTOR_CHOLESKY) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with MUMPS LU, use AIJ matrix"); 2414ce94432eSBarry Smith if (A->rmap->bs > 1) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_SUP,"Cannot use PETSc SBAIJ matrices with block size > 1 with MUMPS Cholesky, use AIJ matrix instead"); 2415251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQSBAIJ,&isSeqSBAIJ);CHKERRQ(ierr); 24162877fffaSHong Zhang /* Create the factorization matrix */ 2417ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 24182877fffaSHong Zhang ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 24192877fffaSHong Zhang ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2420b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2421bccb9932SShri Abhyankar if (isSeqSBAIJ) { 24220298fd71SBarry Smith ierr = MatSeqSBAIJSetPreallocation(B,1,0,NULL);CHKERRQ(ierr); 24232205254eSKarl Rupp 242416ebf90aSShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_seqsbaij_seqsbaij; 2425dcd589f8SShri Abhyankar } else { 24260298fd71SBarry Smith ierr = MatMPISBAIJSetPreallocation(B,1,0,NULL,0,NULL);CHKERRQ(ierr); 24272205254eSKarl Rupp 2428bccb9932SShri Abhyankar mumps->ConvertToTriples = MatConvertToTriples_mpisbaij_mpisbaij; 2429bccb9932SShri Abhyankar } 2430bccb9932SShri Abhyankar 243167877ebaSShri Abhyankar B->ops->choleskyfactorsymbolic = MatCholeskyFactorSymbolic_MUMPS; 2432bccb9932SShri Abhyankar B->ops->view = MatView_MUMPS; 243320be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 24342205254eSKarl Rupp 2435bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 24365a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSetSchurIS_C",MatFactorSetSchurIS_MUMPS);CHKERRQ(ierr); 24375a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorInvertSchurComplement_C",MatFactorInvertSchurComplement_MUMPS);CHKERRQ(ierr); 24385a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorCreateSchurComplement_C",MatFactorCreateSchurComplement_MUMPS);CHKERRQ(ierr); 24395a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSchurComplement_C",MatFactorGetSchurComplement_MUMPS);CHKERRQ(ierr); 24405a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplement_C",MatFactorSolveSchurComplement_MUMPS);CHKERRQ(ierr); 24415a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplementTranspose_C",MatFactorSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2442b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2443b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2444b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2445b13644aeSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2446ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2447ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2448ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2449ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 24502205254eSKarl Rupp 2451f4762488SHong Zhang B->factortype = MAT_FACTOR_CHOLESKY; 245259ac8732SStefano Zampini #if defined(PETSC_USE_COMPLEX) 245359ac8732SStefano Zampini mumps->sym = 2; 245459ac8732SStefano Zampini #else 24556fdc2a6dSBarry Smith if (A->spd_set && A->spd) mumps->sym = 1; 24566fdc2a6dSBarry Smith else mumps->sym = 2; 245759ac8732SStefano Zampini #endif 2458a214ac2aSShri Abhyankar 2459bccb9932SShri Abhyankar mumps->isAIJ = PETSC_FALSE; 2460bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2461f3c0ef26SHong Zhang B->ops->destroy = MatDestroy_MUMPS; 24622877fffaSHong Zhang B->spptr = (void*)mumps; 24632205254eSKarl Rupp 2464f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2465746480a1SHong Zhang 24662877fffaSHong Zhang *F = B; 24672877fffaSHong Zhang PetscFunctionReturn(0); 24682877fffaSHong Zhang } 246997969023SHong Zhang 2470450b117fSShri Abhyankar #undef __FUNCT__ 2471bccb9932SShri Abhyankar #define __FUNCT__ "MatGetFactor_baij_mumps" 24728cc058d9SJed Brown PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat A,MatFactorType ftype,Mat *F) 247367877ebaSShri Abhyankar { 247467877ebaSShri Abhyankar Mat B; 247567877ebaSShri Abhyankar PetscErrorCode ierr; 247667877ebaSShri Abhyankar Mat_MUMPS *mumps; 2477ace3abfcSBarry Smith PetscBool isSeqBAIJ; 247867877ebaSShri Abhyankar 247967877ebaSShri Abhyankar PetscFunctionBegin; 248067877ebaSShri Abhyankar /* Create the factorization matrix */ 2481251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)A,MATSEQBAIJ,&isSeqBAIJ);CHKERRQ(ierr); 2482ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&B);CHKERRQ(ierr); 248367877ebaSShri Abhyankar ierr = MatSetSizes(B,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 248467877ebaSShri Abhyankar ierr = MatSetType(B,((PetscObject)A)->type_name);CHKERRQ(ierr); 2485bccb9932SShri Abhyankar if (isSeqBAIJ) { 24860298fd71SBarry Smith ierr = MatSeqBAIJSetPreallocation(B,A->rmap->bs,0,NULL);CHKERRQ(ierr); 2487bccb9932SShri Abhyankar } else { 24880298fd71SBarry Smith ierr = MatMPIBAIJSetPreallocation(B,A->rmap->bs,0,NULL,0,NULL);CHKERRQ(ierr); 2489bccb9932SShri Abhyankar } 2490450b117fSShri Abhyankar 2491b00a9115SJed Brown ierr = PetscNewLog(B,&mumps);CHKERRQ(ierr); 2492450b117fSShri Abhyankar if (ftype == MAT_FACTOR_LU) { 2493450b117fSShri Abhyankar B->ops->lufactorsymbolic = MatLUFactorSymbolic_BAIJMUMPS; 2494450b117fSShri Abhyankar B->factortype = MAT_FACTOR_LU; 2495bccb9932SShri Abhyankar if (isSeqBAIJ) mumps->ConvertToTriples = MatConvertToTriples_seqbaij_seqaij; 2496bccb9932SShri Abhyankar else mumps->ConvertToTriples = MatConvertToTriples_mpibaij_mpiaij; 2497746480a1SHong Zhang mumps->sym = 0; 2498f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"Cannot use PETSc BAIJ matrices with MUMPS Cholesky, use SBAIJ or AIJ matrix instead\n"); 2499bccb9932SShri Abhyankar 2500450b117fSShri Abhyankar B->ops->view = MatView_MUMPS; 250120be8e61SHong Zhang B->ops->getdiagonal = MatGetDiagonal_MUMPS; 25022205254eSKarl Rupp 2503bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSolverPackage_C",MatFactorGetSolverPackage_mumps);CHKERRQ(ierr); 25045a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSetSchurIS_C",MatFactorSetSchurIS_MUMPS);CHKERRQ(ierr); 25055a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorInvertSchurComplement_C",MatFactorInvertSchurComplement_MUMPS);CHKERRQ(ierr); 25065a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorCreateSchurComplement_C",MatFactorCreateSchurComplement_MUMPS);CHKERRQ(ierr); 25075a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorGetSchurComplement_C",MatFactorGetSchurComplement_MUMPS);CHKERRQ(ierr); 25085a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplement_C",MatFactorSolveSchurComplement_MUMPS);CHKERRQ(ierr); 25095a05ddb0SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)B,"MatFactorSolveSchurComplementTranspose_C",MatFactorSolveSchurComplementTranspose_MUMPS);CHKERRQ(ierr); 2510bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetIcntl_C",MatMumpsSetIcntl_MUMPS);CHKERRQ(ierr); 2511bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetIcntl_C",MatMumpsGetIcntl_MUMPS);CHKERRQ(ierr); 2512bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsSetCntl_C",MatMumpsSetCntl_MUMPS);CHKERRQ(ierr); 2513bc6112feSHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetCntl_C",MatMumpsGetCntl_MUMPS);CHKERRQ(ierr); 2514ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfo_C",MatMumpsGetInfo_MUMPS);CHKERRQ(ierr); 2515ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetInfog_C",MatMumpsGetInfog_MUMPS);CHKERRQ(ierr); 2516ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfo_C",MatMumpsGetRinfo_MUMPS);CHKERRQ(ierr); 2517ca810319SHong Zhang ierr = PetscObjectComposeFunction((PetscObject)B,"MatMumpsGetRinfog_C",MatMumpsGetRinfog_MUMPS);CHKERRQ(ierr); 2518450b117fSShri Abhyankar 2519450b117fSShri Abhyankar mumps->isAIJ = PETSC_TRUE; 2520bf0cc555SLisandro Dalcin mumps->Destroy = B->ops->destroy; 2521450b117fSShri Abhyankar B->ops->destroy = MatDestroy_MUMPS; 2522450b117fSShri Abhyankar B->spptr = (void*)mumps; 25232205254eSKarl Rupp 2524f697e70eSHong Zhang ierr = PetscInitializeMUMPS(A,mumps);CHKERRQ(ierr); 2525746480a1SHong Zhang 2526450b117fSShri Abhyankar *F = B; 2527450b117fSShri Abhyankar PetscFunctionReturn(0); 2528450b117fSShri Abhyankar } 252942c9c57cSBarry Smith 253042c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_aij_mumps(Mat,MatFactorType,Mat*); 253142c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_baij_mumps(Mat,MatFactorType,Mat*); 253242c9c57cSBarry Smith PETSC_EXTERN PetscErrorCode MatGetFactor_sbaij_mumps(Mat,MatFactorType,Mat*); 253342c9c57cSBarry Smith 253442c9c57cSBarry Smith #undef __FUNCT__ 253542c9c57cSBarry Smith #define __FUNCT__ "MatSolverPackageRegister_MUMPS" 253629b38603SBarry Smith PETSC_EXTERN PetscErrorCode MatSolverPackageRegister_MUMPS(void) 253742c9c57cSBarry Smith { 253842c9c57cSBarry Smith PetscErrorCode ierr; 253942c9c57cSBarry Smith 254042c9c57cSBarry Smith PetscFunctionBegin; 254142c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 254242c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 254342c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 254442c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPIBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 254542c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATMPISBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 254642c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_LU,MatGetFactor_aij_mumps);CHKERRQ(ierr); 254742c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_aij_mumps);CHKERRQ(ierr); 254842c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_LU,MatGetFactor_baij_mumps);CHKERRQ(ierr); 254942c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_baij_mumps);CHKERRQ(ierr); 255042c9c57cSBarry Smith ierr = MatSolverPackageRegister(MATSOLVERMUMPS,MATSEQSBAIJ,MAT_FACTOR_CHOLESKY,MatGetFactor_sbaij_mumps);CHKERRQ(ierr); 255142c9c57cSBarry Smith PetscFunctionReturn(0); 255242c9c57cSBarry Smith } 255342c9c57cSBarry Smith 2554